Source code for torch_uncertainty.post_processing.calibration.dirichlet_scaler

import logging
from typing import Literal

import torch
from torch import Tensor, device, nn
from torch.nn.functional import linear
from torch.optim import LBFGS
from torch.utils.data import DataLoader

from .matrix_scaler import MatrixScaler



[docs]
class DirichletScaler(MatrixScaler):
    def __init__(
        self,
        num_classes: int,
        model: nn.Module | None = None,
        init_weight_temperature: float = 1,
        init_bias_temperature: float | None = None,
        lr: float = 0.1,
        max_iter: int = 200,
        lambda_reg: float | None = None,
        mu_reg: float | None = None,
        eps: float = 1e-8,
        device: Literal["cpu", "cuda"] | device | None = None,
    ) -> None:
        r"""Dirichlet scaling post-processing for calibrated probabilities (Kull et al., 2019).

        Like :class:`MatrixScaler`, fits a full affine transformation, but applies it
        to the log-probabilities :math:`\log \mathrm{softmax}(\mathbf{z}(\mathbf{x}))`
        instead of the raw logits :math:`\mathbf{z}(\mathbf{x})`

        .. math::
            \tilde{\mathbf{p}}(\mathbf{x}) = \mathrm{softmax}\!\left(\mathbf{W}
            \log \mathrm{softmax}(\mathbf{z}(\mathbf{x})) + \mathbf{b}\right),

        and adds two :math:`\ell_2` regularisers, one on the off-diagonal entries of
        :math:`\mathbf{W}` and one on the bias :math:`\mathbf{b}`, to avoid
        overfitting on small calibration sets. Both penalties are averaged over the
        number of penalised entries, with :math:`C` the number of classes:

        .. math::
            \mathcal{L} = \mathrm{CE}(\tilde{\mathbf{p}}, y)
            + \frac{\lambda}{C (C - 1)} \sum_{i \neq j} W_{ij}^2
            + \frac{\mu}{C} \sum_{i} b_i^2.

        :math:`\lambda` (:attr:`lambda_reg`) and :math:`\mu` (:attr:`mu_reg`) typically
        need to be tuned on a held-out subset of the calibration data.

        Args:
            num_classes: Number of classes :math:`C`.
            model: Model to calibrate. Defaults to ``None``.
            init_weight_temperature: Initial value for the weight matrix. Defaults to ``1``.
            init_bias_temperature: Initial value for the bias. The inverse bias will be
                set to the ``0`` vector if set to ``None``. Defaults to ``None``.
            lr: Learning rate for the optimizer. Defaults to ``0.1``.
            max_iter: Maximum number of iterations for the optimizer. Defaults to ``200``.
            lambda_reg: Non-negative regularization coefficient :math:`\lambda` applied
                to the off-diagonal elements of the weight matrix. Used to mitigate
                overfitting. ``None`` disables the penalty. Defaults to ``None``.
            mu_reg: Non-negative regularization coefficient :math:`\mu` applied to the
                bias vector. ``None`` disables the penalty. Defaults to ``None``.
            eps: Small value for numerical stability. Defaults to ``1e-8``.
            device: Device to use for optimization. Defaults to ``None``.

        Raises:
            ValueError: If :attr:`lambda_reg` or :attr:`mu_reg` is negative.

        References:
            [1] `Kull, M., Perello-Nieto, M., Kängsepp, M., Silva Filho, T., Song, H., & Flach, P.
            (2019). Beyond temperature scaling: Obtaining well-calibrated multiclass
            probabilities with Dirichlet calibration. NeurIPS 2019
            <https://arxiv.org/abs/1910.12656>`_.

        Warning:
            For binary tasks, a sigmoid is applied before the prediction is transposed
            to the 2-class case.
        """
        super().__init__(
            num_classes=num_classes,
            model=model,
            init_weight_temperature=init_weight_temperature,
            init_bias_temperature=init_bias_temperature,
            lr=lr,
            max_iter=max_iter,
            eps=eps,
            device=device,
        )
        # Zero is accepted (it simply disables the penalty); only negative values are rejected.
        if lambda_reg is not None and lambda_reg < 0:
            raise ValueError(f"lambda_reg must be None or positive. Got {lambda_reg}.")
        if mu_reg is not None and mu_reg < 0:
            raise ValueError(f"mu_reg must be None or positive. Got {mu_reg}.")
        self.lambda_reg = lambda_reg
        self.mu_reg = mu_reg

    def fit(
        self,
        dataloader: DataLoader,
        save_logits: bool = False,
        progress: bool = True,
    ) -> None:
        """Fit the weight matrix and bias to the calibration data.

        Minimises the criterion on the scaled calibration outputs, plus the optional
        off-diagonal and bias penalties, with a single L-BFGS ``step`` call bounded by
        ``max_iter`` iterations.

        Args:
            dataloader: Dataloader with the calibration data. If no model is set, an
                identity model is used so that the method is fitted on the dataloader's
                data directly.
            save_logits: Whether to save the logits and labels in memory. Defaults to ``False``.
            progress: Whether to show a progress bar. Defaults to ``True``.
        """
        if self.model is None or isinstance(self.model, nn.Identity):
            logging.warning(
                "model is None. Fitting post_processing method on the dataloader's data directly."
            )
            self.model = nn.Identity()

        # `_extract_data` is inherited (not defined in this class); it yields the
        # tensors passed to `_scale` and to the criterion below.
        all_logits, all_labels = self._extract_data(dataloader, progress)
        optimizer = LBFGS(self.inv_temperature, lr=self.lr, max_iter=self.max_iter)

        # Number of off-diagonal entries of the C x C weight matrix. It is 0 when
        # there is a single class, in which case there is nothing to penalise and
        # dividing by it would turn the loss into NaN.
        num_off_diag = self.num_classes * (self.num_classes - 1)

        def calib_eval() -> Tensor:
            """Closure for L-BFGS: reset gradients, compute the loss and backpropagate."""
            optimizer.zero_grad()
            loss = self.criterion(self._scale(all_logits), all_labels)
            if self.lambda_reg is not None and num_off_diag > 0:
                weight = self.inv_temperature_weight
                # Sum of squares of all entries minus those on the diagonal.
                off_diag_sq = (weight**2).sum() - (weight.diagonal() ** 2).sum()
                loss = loss + self.lambda_reg * off_diag_sq / num_off_diag
            if self.mu_reg is not None:
                loss = loss + self.mu_reg * (self.inv_temperature_bias**2).mean()
            loss.backward()
            logging.debug("scaler loss: %f", loss.item())
            return loss

        optimizer.step(calib_eval)
        self.trained = True
        if save_logits:
            self.logits = all_logits
            self.labels = all_labels

    def _scale(self, logits: Tensor) -> Tensor:
        """Apply the affine map to the log-probabilities of ``logits``.

        The product is computed with the log-softmax of the logits (taken along
        dimension 1) instead of the logits themselves.

        Args:
            logits: Outputs to rescale; the log-softmax is taken along dimension 1.

        Returns:
            The result of ``linear(log_softmax(logits), weight, bias)``.
        """
        log_probs = torch.log_softmax(logits, dim=1)
        return linear(log_probs, self.inv_temperature_weight, self.inv_temperature_bias)

    @property
    def inv_temperature(self) -> list[Tensor]:
        """The tensors optimised by :meth:`fit`: ``[weight, bias]``."""
        return [self.inv_temperature_weight, self.inv_temperature_bias]

    @property
    def temperature(self) -> list[Tensor]:
        """The matrix inverse of the weight and the element-wise reciprocal of the bias.

        Note:
            The reciprocal is infinite for every bias entry equal to zero.
        """
        return [torch.inverse(self.inv_temperature_weight), 1 / self.inv_temperature_bias]