Shortcuts

Source code for torch_uncertainty.routines.segmentation

import torch
from einops import rearrange
from lightning.pytorch import LightningModule
from lightning.pytorch.loggers import Logger
from lightning.pytorch.utilities.types import STEP_OUTPUT
from torch import Tensor, nn
from torch.optim import Optimizer
from torchmetrics import Accuracy, MetricCollection
from torchvision.transforms.v2 import ToDtype
from torchvision.transforms.v2 import functional as F
from torchvision.utils import draw_segmentation_masks

from torch_uncertainty.metrics import (
    AUGRC,
    AURC,
    BrierScore,
    CalibrationError,
    CategoricalNLL,
    MeanIntersectionOverUnion,
)
from torch_uncertainty.models import (
    EPOCH_UPDATE_MODEL,
    STEP_UPDATE_MODEL,
)
from torch_uncertainty.utils.plotting import show


[docs]class SegmentationRoutine(LightningModule): def __init__( self, model: nn.Module, num_classes: int, loss: nn.Module, optim_recipe: dict | Optimizer | None = None, eval_shift: bool = False, format_batch_fn: nn.Module | None = None, metric_subsampling_rate: float = 1e-2, log_plots: bool = False, num_samples_to_plot: int = 3, num_calibration_bins: int = 15, ) -> None: r"""Routine for training & testing on **segmentation** tasks. Args: model (torch.nn.Module): Model to train. num_classes (int): Number of classes in the segmentation task. loss (torch.nn.Module): Loss function to optimize the :attr:`model`. optim_recipe (dict or Optimizer, optional): The optimizer and optionally the scheduler to use. Defaults to ``None``. eval_shift (bool, optional): Indicates whether to evaluate the Distribution shift performance. Defaults to ``False``. format_batch_fn (torch.nn.Module, optional): The function to format the batch. Defaults to ``None``. metric_subsampling_rate (float, optional): The rate of subsampling for the memory consuming metrics. Defaults to ``1e-2``. log_plots (bool, optional): Indicates whether to log plots from metrics. Defaults to ``False``. num_samples_to_plot (int, optional): Number of samples to plot in the segmentation results. Defaults to ``3``. num_calibration_bins (int, optional): Number of bins to compute calibration metrics. Defaults to ``15``. Warning: You must define :attr:`optim_recipe` if you do not use the CLI. Note: :attr:`optim_recipe` can be anything that can be returned by :meth:`LightningModule.configure_optimizers()`. Find more details `here <https://lightning.ai/docs/pytorch/stable/common/lightning_module.html#configure-optimizers>`_. """ super().__init__() _segmentation_routine_checks( num_classes=num_classes, metric_subsampling_rate=metric_subsampling_rate, num_calibration_bins=num_calibration_bins, ) if eval_shift: raise NotImplementedError( "Distribution shift evaluation not implemented yet. Raise an issue " "if needed." ) self.model = model self.num_classes = num_classes self.num_calibration_bins = num_calibration_bins self.loss = loss self.needs_epoch_update = isinstance(model, EPOCH_UPDATE_MODEL) self.needs_step_update = isinstance(model, STEP_UPDATE_MODEL) if format_batch_fn is None: format_batch_fn = nn.Identity() self.optim_recipe = optim_recipe self.format_batch_fn = format_batch_fn self.metric_subsampling_rate = metric_subsampling_rate self.log_plots = log_plots self._init_metrics() if log_plots: self.num_samples_to_plot = num_samples_to_plot self.sample_buffer = [] def _init_metrics(self) -> None: """Initialize the metrics depending on the exact task.""" seg_metrics = MetricCollection( { "seg/mIoU": MeanIntersectionOverUnion(num_classes=self.num_classes), }, compute_groups=False, ) sbsmpl_seg_metrics = MetricCollection( { "seg/mAcc": Accuracy( task="multiclass", average="macro", num_classes=self.num_classes ), "seg/Brier": BrierScore(num_classes=self.num_classes), "seg/NLL": CategoricalNLL(), "seg/pixAcc": Accuracy(task="multiclass", num_classes=self.num_classes), "cal/ECE": CalibrationError( task="multiclass", num_classes=self.num_classes, num_bins=self.num_calibration_bins, ), "cal/aECE": CalibrationError( task="multiclass", adaptive=True, num_classes=self.num_classes, num_bins=self.num_calibration_bins, ), "sc/AURC": AURC(), "sc/AUGRC": AUGRC(), }, compute_groups=[ ["seg/mAcc"], ["seg/Brier"], ["seg/NLL"], ["seg/pixAcc"], ["cal/ECE", "cal/aECE"], ["sc/AURC", "sc/AUGRC"], ], ) self.val_seg_metrics = seg_metrics.clone(prefix="val/") self.val_sbsmpl_seg_metrics = sbsmpl_seg_metrics.clone(prefix="val/") self.test_seg_metrics = seg_metrics.clone(prefix="test/") self.test_sbsmpl_seg_metrics = sbsmpl_seg_metrics.clone(prefix="test/") def configure_optimizers(self) -> Optimizer | dict: return self.optim_recipe
[docs] def forward(self, inputs: Tensor) -> Tensor: """Forward pass of the model. Args: inputs (Tensor): input tensor. Returns: Tensor: the prediction of the model. """ return self.model(inputs)
def on_train_start(self) -> None: if self.logger is not None: # coverage: ignore self.logger.log_hyperparams(self.hparams) def on_validation_start(self) -> None: if self.needs_epoch_update and not self.trainer.sanity_checking: self.model.update_wrapper(self.current_epoch) if hasattr(self.model, "need_bn_update"): self.model.bn_update(self.trainer.train_dataloader, device=self.device) def on_test_start(self) -> None: if hasattr(self.model, "need_bn_update"): self.model.bn_update(self.trainer.train_dataloader, device=self.device)
[docs] def training_step(self, batch: tuple[Tensor, Tensor]) -> STEP_OUTPUT: """Perform a single training step based on the input tensors. Args: batch (tuple[Tensor, Tensor]): the training images and their corresponding targets Returns: Tensor: the loss corresponding to this training step. """ img, target = self.format_batch_fn(batch) logits = self.forward(img) target = F.resize(target, logits.shape[-2:], interpolation=F.InterpolationMode.NEAREST) logits = rearrange(logits, "b c h w -> (b h w) c") target = target.flatten() valid_mask = target != 255 loss = self.loss(logits[valid_mask], target[valid_mask]) if self.needs_step_update: self.model.update_wrapper(self.current_epoch) self.log("train_loss", loss, prog_bar=True, logger=True) return loss
[docs] def validation_step(self, batch: tuple[Tensor, Tensor]) -> None: """Perform a single validation step based on the input tensors. Compute the prediction of the model and the value of the metrics on the validation batch. Args: batch (tuple[Tensor, Tensor]): the validation images and their corresponding targets """ img, targets = batch logits = self.forward(img) targets = F.resize( targets, logits.shape[-2:], interpolation=F.InterpolationMode.NEAREST, ) logits = rearrange(logits, "(m b) c h w -> (b h w) m c", b=targets.size(0)) probs_per_est = logits.softmax(dim=-1) probs = probs_per_est.mean(dim=1) targets = targets.flatten() valid_mask = targets != 255 probs, targets = probs[valid_mask], targets[valid_mask] self.val_seg_metrics.update(probs, targets) self.val_sbsmpl_seg_metrics.update(*self.subsample(probs, targets))
[docs] def test_step(self, batch: tuple[Tensor, Tensor]) -> None: """Perform a single test step based on the input tensors. Compute the prediction of the model and the value of the metrics on the test batch. Args: batch (tuple[Tensor, Tensor]): the test images and their corresponding targets """ img, targets = batch logits = self.forward(img) targets = F.resize( targets, logits.shape[-2:], interpolation=F.InterpolationMode.NEAREST, ) logits = rearrange(logits, "(m b) c h w -> b m c h w", b=targets.size(0)) probs_per_est = logits.softmax(dim=2) probs = probs_per_est.mean(dim=1) if self.log_plots and len(self.sample_buffer) < self.num_samples_to_plot: max_count = self.num_samples_to_plot - len(self.sample_buffer) for i, (_img, _prb, _tgt) in enumerate(zip(img, probs, targets, strict=False)): if i >= max_count: break _pred = _prb.argmax(dim=0, keepdim=True) self.sample_buffer.append((_img, _pred, _tgt)) probs = rearrange(probs, "b c h w -> (b h w) c") targets = targets.flatten() valid_mask = targets != 255 probs, targets = probs[valid_mask], targets[valid_mask] self.test_seg_metrics.update(probs, targets) self.test_sbsmpl_seg_metrics.update(*self.subsample(probs, targets))
[docs] def on_validation_epoch_end(self) -> None: """Compute and log the values of the collected metrics in `validation_step`.""" res_dict = self.val_seg_metrics.compute() self.log_dict(res_dict, logger=True, sync_dist=True) self.log( "mIoU%", res_dict["val/seg/mIoU"] * 100, prog_bar=True, sync_dist=True, ) self.log_dict(self.val_sbsmpl_seg_metrics.compute(), sync_dist=True) self.val_seg_metrics.reset() self.val_sbsmpl_seg_metrics.reset()
[docs] def on_test_epoch_end(self) -> None: """Compute, log, and plot the values of the collected metrics in `test_step`.""" self.log_dict(self.test_seg_metrics.compute(), sync_dist=True) self.log_dict(self.test_sbsmpl_seg_metrics.compute(), sync_dist=True) if isinstance(self.logger, Logger) and self.log_plots: self.logger.experiment.add_figure( "Calibration/Reliabity diagram", self.test_sbsmpl_seg_metrics["cal/ECE"].plot()[0], ) self.logger.experiment.add_figure( "Selective Classification/Risk-Coverage curve", self.test_sbsmpl_seg_metrics["sc/AURC"].plot()[0], ) self.logger.experiment.add_figure( "Selective Classification/Generalized Risk-Coverage curve", self.test_sbsmpl_seg_metrics["sc/AUGRC"].plot()[0], ) self.log_segmentation_plots()
[docs] def log_segmentation_plots(self) -> None: """Build and log examples of segmentation plots from the test set.""" for i, (img, pred, tgt) in enumerate(self.sample_buffer): pred = pred == torch.arange(self.num_classes, device=pred.device)[:, None, None] tgt = tgt == torch.arange(self.num_classes, device=tgt.device)[:, None, None] # Undo normalization on the image and convert to uint8. mean = torch.tensor(self.trainer.datamodule.mean, device=img.device) std = torch.tensor(self.trainer.datamodule.std, device=img.device) img = img * std[:, None, None] + mean[:, None, None] img = ToDtype(torch.uint8, scale=True)(img) dataset = self.trainer.datamodule.test color_palette = dataset.color_palette if hasattr(dataset, "color_palette") else None pred_mask = draw_segmentation_masks(img, pred, alpha=0.7, colors=color_palette) gt_mask = draw_segmentation_masks(img, tgt, alpha=0.7, colors=color_palette) self.logger.experiment.add_figure( f"Segmentation results/{i}", show(pred_mask, gt_mask), )
[docs] def subsample(self, pred: Tensor, target: Tensor) -> tuple[Tensor, Tensor]: """Select a random sample of the data to compute the loss onto. Args: pred (Tensor): the prediction tensor. target (Tensor): the target tensor. Returns: Tuple[Tensor, Tensor]: the subsampled prediction and target tensors. """ total_size = target.size(0) num_samples = max(1, int(total_size * self.metric_subsampling_rate)) indices = torch.randperm(total_size, device=pred.device)[:num_samples] return pred[indices], target[indices]
def _segmentation_routine_checks( num_classes: int, metric_subsampling_rate: float, num_calibration_bins: int, ) -> None: """Check the domains of the routine's parameters. Args: num_classes (int): the number of classes in the dataset. metric_subsampling_rate (float): the rate of subsampling to compute the metrics. num_calibration_bins (int): the number of bins for the evaluation of the calibration. """ if num_classes < 2: raise ValueError(f"num_classes must be at least 2, got {num_classes}.") if not 0 < metric_subsampling_rate <= 1: raise ValueError( f"metric_subsampling_rate must be in the range (0, 1], got {metric_subsampling_rate}." ) if num_calibration_bins < 2: raise ValueError(f"num_calibration_bins must be at least 2, got {num_calibration_bins}.")