# Source code for pytorch_ood.loss.conf

import torch
import torch.nn as nn
import torch.nn.functional as F

from ..utils import is_known



# [docs]
class ConfidenceLoss(nn.Module):
    """
    Loss proposed in *Learning Confidence for Out-of-Distribution Detection in Neural Networks*.
    The model learns to predict a confidence :math:`c` in addition to the class membership.

    The loss minimizes the Negative Log Likelihood for class membership prediction.

    .. math::
        \\mathcal{L}_{NLL} + \\alpha \\mathcal{L}_c = - \\sum_{i=1}^{M} \\log(p'_{i}) y_i - \\alpha \\log(c)

        \\text{where} \\quad p_i' = c \\cdot p_i + (1-c) y_i


    :see Paper: `ArXiv <https://arxiv.org/abs/1802.04865>`_


    .. note::
        * We implemented clipping for numerical stability.
        * The NLL term is summed over the known samples, while the confidence
          term uses mean reduction over the entire batch.
        * The authors additionally used ODIN preprocessing

    """

    def __init__(self, alpha: float = 1.0, eps: float = 1e-24) -> None:
        """

        :param alpha: :math:`\\alpha` used to balance terms
        :param eps: Clipping value :math:`\\epsilon` used for numerical stability
        """
        super().__init__()
        self.alpha = alpha
        self.eps = eps

    def forward(
        self, logits: torch.Tensor, confidence: torch.Tensor, target: torch.Tensor
    ) -> torch.Tensor:
        """
        :param logits: class logits for samples, with classes along dimension 1
        :param confidence: predicted confidence for samples, one value per sample.
            Both a flat vector and a single-column matrix are accepted.
        :param target: labels for samples (not one-hot encoded)
        :return: NLL term plus :math:`\\alpha` times the confidence term. If the
            batch contains no known samples, a zero tensor of shape ``(1,)``
            with the device and dtype of ``logits``.
        """
        known = is_known(target)

        if not known.any():
            # Nothing to supervise. Allocate the zero from ``logits`` so the
            # result lives on the same device (and has the same dtype) as the
            # loss returned for batches that do contain known samples.
            return logits.new_zeros((1,))

        one_hot = F.one_hot(target[known], num_classes=logits.size(1))
        probs = F.softmax(logits[known], dim=1)

        # One confidence per selected sample, shaped as a column so that it
        # broadcasts over the class axis regardless of whether the caller
        # passed a flat vector or a single-column matrix.
        conf_known = confidence[known].reshape(-1, 1)

        # Interpolate between the prediction and the ground truth: p' = c * p + (1 - c) * y
        adjusted = probs * conf_known + (1 - conf_known) * one_hot

        # Clip before taking the log to avoid log(0).
        adjusted = adjusted.clamp(self.eps, 1.0)
        loss_nll = -torch.sum(torch.log(adjusted) * one_hot)

        # NOTE: the confidence penalty is averaged over every sample in the
        # batch, not only over the known ones.
        loss_conf = -torch.log(confidence.clamp(self.eps, 1.0)).mean()

        return loss_nll + self.alpha * loss_conf