# Source code for incerto.calibration.base

"""
Base classes for calibration methods.

All calibration methods should inherit from BaseCalibrator and implement
the fit() and predict() methods.
"""

from abc import ABC, abstractmethod
import torch
from torch.distributions import Categorical


def _validate_logits(logits: torch.Tensor, context: str = "logits") -> None:
    """Ensure *logits* is a 2D ``torch.Tensor``; raise ``DataError`` otherwise.

    Args:
        logits: Candidate tensor of shape (n_samples, n_classes).
        context: Name used in error messages (lets callers report
            their own argument name).

    Raises:
        DataError: If *logits* is not a tensor or is not 2-dimensional.
    """
    # Imported lazily to avoid a circular import at module load time.
    from ..exceptions import DataError

    if not isinstance(logits, torch.Tensor):
        msg = f"{context} must be a torch.Tensor, got {type(logits).__name__}"
        raise DataError(msg)

    if logits.dim() != 2:
        msg = (
            f"{context} must be 2D (n_samples, n_classes), "
            f"got shape {tuple(logits.shape)}"
        )
        raise DataError(msg)


def _validate_fit_inputs(logits: torch.Tensor, labels: torch.Tensor) -> None:
    """Validate the (logits, labels) pair passed to a calibrator's ``fit``.

    Args:
        logits: Tensor expected to be of shape (n_samples, n_classes).
        labels: Tensor expected to be of shape (n_samples,).

    Raises:
        DataError: If either tensor has the wrong type/rank, or if the
            sample counts disagree.
    """
    # Imported lazily to avoid a circular import at module load time.
    from ..exceptions import DataError

    # Reuse the shared logits check so both validators report identically.
    _validate_logits(logits)

    if not isinstance(labels, torch.Tensor):
        raise DataError(f"labels must be a torch.Tensor, got {type(labels).__name__}")

    if labels.dim() != 1:
        msg = f"labels must be 1D (n_samples,), got shape {tuple(labels.shape)}"
        raise DataError(msg)

    n_logits, n_labels = logits.shape[0], labels.shape[0]
    if n_logits != n_labels:
        raise DataError(
            f"logits and labels must have the same number of samples, "
            f"got {n_logits} and {n_labels}"
        )


class BaseCalibrator(ABC):
    """Abstract base class for all calibration methods.

    Calibrators are post-hoc methods that adjust a trained model's
    predicted probabilities to better match empirical frequencies.
    Every calibrator follows a fit-predict pattern:

    1. ``fit()``: learn calibration parameters on a validation set.
    2. ``predict()``: apply the learned calibration to new logits.

    Subclasses must implement ``fit``, ``predict``, ``state_dict``, and
    ``load_state_dict``; ``save``/``load`` persistence is provided here.

    Example:
        >>> class MyCalibrator(BaseCalibrator):
        ...     def fit(self, logits, labels):
        ...         self.temperature = find_optimal_temperature(logits, labels)
        ...         return self
        ...
        ...     def predict(self, logits):
        ...         probs = F.softmax(logits / self.temperature, dim=-1)
        ...         return Categorical(probs=probs)
        ...
        >>> calibrator = MyCalibrator()
        >>> calibrator.fit(val_logits, val_labels)
        >>> calibrated_dist = calibrator.predict(test_logits)

    See Also:
        - TemperatureScaling: Simple and effective temperature-based calibration
        - VectorScaling: Class-wise temperature scaling
        - IsotonicRegression: Non-parametric calibration
    """

    @abstractmethod
    def fit(self, logits: torch.Tensor, labels: torch.Tensor) -> "BaseCalibrator":
        """Fit the calibrator on a validation set.

        Learns whatever parameters are needed to map uncalibrated logits
        to calibrated probabilities.

        Args:
            logits: Uncalibrated model outputs of shape (n_samples, n_classes);
                raw logits, before softmax.
            labels: Integer class labels of shape (n_samples,) with values
                in [0, n_classes - 1].

        Returns:
            self, to allow method chaining.

        Note:
            The validation set used here should be disjoint from both the
            training and test sets, to avoid overfitting the calibration
            parameters.
        """
        ...

    @abstractmethod
    def predict(self, logits: torch.Tensor) -> Categorical:
        """Apply calibration to logits and return a Categorical distribution.

        Args:
            logits: Uncalibrated model outputs of shape (n_samples, n_classes).

        Returns:
            A ``torch.distributions.Categorical`` over the calibrated
            probabilities. Access probabilities via ``.probs`` or draw
            samples via ``.sample()``.

        Example:
            >>> calibrated_dist = calibrator.predict(test_logits)
            >>> calibrated_probs = calibrated_dist.probs  # (n_samples, n_classes)
            >>> predictions = calibrated_dist.sample()    # (n_samples,)
            >>> log_probs = calibrated_dist.log_prob(labels)  # (n_samples,)
        """
        ...

    @abstractmethod
    def state_dict(self) -> dict:
        """Return a dictionary holding the calibrator's learned state.

        Must contain everything required to reproduce the fitted
        calibrator's behavior.

        Returns:
            Mapping from parameter names to their values, e.g.
            ``{'temperature': 1.5, 'n_classes': 10}``.
        """
        ...

    @abstractmethod
    def load_state_dict(self, state: dict) -> None:
        """Restore the calibrator from a previously saved state.

        After loading, the calibrator behaves as if it had been fitted,
        with no need to call ``fit`` again.

        Args:
            state: Dictionary produced by an earlier ``state_dict()`` call.

        Raises:
            SerializationError: If *state* is invalid or incompatible.
        """
        ...

    def save(self, path: str) -> None:
        """Serialize the calibrator's state to *path* via ``torch.save``.

        Args:
            path: Destination file path.

        Raises:
            SerializationError: If saving fails for any reason.
        """
        # Imported lazily to avoid a circular import at module load time.
        from ..exceptions import SerializationError

        try:
            torch.save(self.state_dict(), path)
        except Exception as e:
            raise SerializationError(f"Failed to save to {path}: {e}") from e

    @classmethod
    def load(cls, path: str) -> "BaseCalibrator":
        """Construct a calibrator and restore its state from *path*.

        Note:
            Assumes ``cls`` is constructible with no arguments — TODO confirm
            this holds for every concrete calibrator.

        Args:
            path: File path previously written by ``save``.

        Returns:
            A new ``cls`` instance with the loaded state applied.

        Raises:
            SerializationError: If reading or restoring the state fails.
        """
        # Imported lazily to avoid a circular import at module load time.
        from ..exceptions import SerializationError

        try:
            # weights_only=True restricts unpickling to plain tensors/containers,
            # guarding against arbitrary-code-execution payloads in the file.
            state = torch.load(path, weights_only=True)
            instance = cls()
            instance.load_state_dict(state)
            return instance
        except Exception as e:
            raise SerializationError(f"Failed to load from {path}: {e}") from e