Source code for InnerEye.ML.utils.supervised_criterion

#  ------------------------------------------------------------------------------------------
#  Copyright (c) Microsoft Corporation. All rights reserved.
#  Licensed under the MIT License (MIT). See LICENSE in the repo root for license information.
#  ------------------------------------------------------------------------------------------
import abc
from typing import Any, Dict, List, Optional

import torch
from torch.nn import BCEWithLogitsLoss


[docs]class SupervisedLearningCriterion(torch.nn.Module, abc.ABC):
    """
    Base class for criterion functions used for supervised learning, with the ability to
    smooth labels if required.
    """

    def __init__(self, smoothing_eps: float = 0.0, is_binary_classification: bool = False):
        super().__init__()
        if not (0.0 <= smoothing_eps <= 1.0):
            raise ValueError(f"Expected 0.0 <= smoothing_eps <= 1.0 found {smoothing_eps}")
        self.smoothing_eps = smoothing_eps
        self.is_binary_classification = is_binary_classification

[docs]    def forward(self, *input: torch.Tensor, **kwargs: Any) -> Any:
        def _smooth_target(target: torch.Tensor) -> torch.Tensor:
            if self.is_binary_classification or len(target.shape) <= 2:
                _num_classes = 2
            else:
                # Get the number of classes from the class dimension, otherwise assume binary problem
                _num_classes = target.shape[min(1, len(target.shape))]
            # Smooth the one-hot target: 1.0 becomes 1.0-eps, 0.0 becomes eps / (nClasses - 1)
            # noinspection PyTypeChecker
            return target * (1.0 - self.smoothing_eps) + \
                   (1.0 - target) * self.smoothing_eps / (_num_classes - 1.0)  # type: ignore

        _input: List[torch.Tensor] = list(input)
        if self.smoothing_eps > 0.0:
            _input[1] = _smooth_target(_input[1])

        return self.forward_minibatch(*_input, **kwargs)

[docs]    @abc.abstractmethod
    def forward_minibatch(self, output: Any, target: Any, **kwargs: Any) -> Any:
        raise NotImplementedError("forward must be implemented by sub classes")


[docs]class BinaryCrossEntropyWithLogitsLoss(SupervisedLearningCriterion):
    """A wrapper function for torch.nn.BCEWithLogitsLoss to enable label smoothing"""

    def __init__(self, num_classes: int,
                 class_counts: Optional[Dict[float, int]] = None,
                 num_train_samples: Optional[int] = None,
                 **kwargs: Any):
        """
        :param num_classes: The number of classes the model predicts. For binary classification num_classes is one
                            and for multi-label classification tasks num_classes will be greater than one.

        :param class_counts: The number of positive samples for each class. class_counts is a dictionary with key-value
                             pairs corresponding to each class and the positive sample count for the class.
                             For binary classification tasks, class_counts should have a single key-value pair
                             for the positive class.

        :param num_train_samples: The total number of training samples in the dataset.
        """
        super().__init__(is_binary_classification=True, **kwargs)
        if class_counts and not num_train_samples:
            raise ValueError("Need to specify the num_train_samples with class_counts")
        self._positive_class_weights = None
        self._class_counts = class_counts
        self._num_train_samples = num_train_samples
        self.num_classes = num_classes
        if class_counts:
            self._positive_class_weights = self.get_positive_class_weights()
            if torch.cuda.is_available():
                self._positive_class_weights = self._positive_class_weights.cuda()
        self._loss_fn = BCEWithLogitsLoss(pos_weight=self._positive_class_weights)

[docs]    def get_positive_class_weights(self) -> torch.Tensor:
        """
        Returns the weights of the positive class only from the list of
        dictionaries containing the counts for all classes for each
        target position.
        :return: a list of weights to use for the positive class for each target position.
        """
        assert self._class_counts and self._num_train_samples
        if len(self._class_counts) != self.num_classes:
            raise ValueError(f"Have {self.num_classes} classes but got counts for {len(self._class_counts)} classes "
                             f"Note: If this is a binary classification task, there should be a single class count "
                             f"corresponding to the positive class.")
        # These weights are given to the pos_weight parameter of Pytorch's BCEWithLogitsLoss.
        # Weights are calculated as (number of negative samples for class 'i')/(number of positive samples for class 'i')
        # for every class 'i' in a binary/multi-label classification task.
        # For a binary classification task, this reduces to (number of false samples / number of true samples).
        weights = [(self._num_train_samples - value) / value if value != 0 else 1.0 for (key, value) in
                   sorted(self._class_counts.items())]  # Uses the first number on the tuple to compare
        return torch.tensor(weights, dtype=torch.float32)

[docs]    def forward_minibatch(self, output: torch.Tensor, target: torch.Tensor, **kwargs: Any) -> Any:
        return self._loss_fn(output, target)