# Source code for stable_pretraining.callbacks.probe

from functools import partial
from typing import Optional, Union

import torch
import torchmetrics
from lightning.pytorch import LightningModule
from loguru import logger as logging
import types
from .utils import (
    TrainableCallback,
    detach_tensors,
    get_data_from_batch_or_outputs,
    log_header,
)



# [docs]
class OnlineProbe(TrainableCallback):
    """Online probe for evaluating learned representations during self-supervised training.

    This callback implements the standard linear evaluation protocol by training a probe
    (typically a linear classifier) on top of frozen features from the main model. The probe
    is trained simultaneously with the main model but maintains its own optimizer, scheduler,
    and training loop. This allows monitoring representation quality throughout training
    without modifying the base model.

    **Key features**

    * Automatic gradient detachment to prevent probe gradients affecting the main model.
    * Independent optimizer and scheduler management.
    * Support for gradient accumulation.
    * Mixed precision training compatibility through automatic dtype conversion.
    * Metric tracking and logging.

    Args:
        module: The ``spt.LightningModule`` to probe. Its ``forward`` is replaced by a
            wrapper at construction time (see :meth:`wrap_forward`).
        name: Unique identifier for this probe instance. Used for logging and storing
            metrics/modules.
        input: Key in batch dict or outputs dict containing input features to probe.
        target: Key in batch dict or outputs dict containing ground truth target labels.
        probe: The probe module to train. Either a ``nn.Module`` instance or a callable
            that receives the ``LightningModule`` and returns the module.
        loss: Loss function for probe training (e.g., ``nn.CrossEntropyLoss()``), called
            as ``loss(preds, target)``. ``input``, ``target`` and ``loss`` must either
            all be set or all be ``None``; when all are ``None`` the probe is called as
            ``probe(batch, outputs, pl_module)`` and its return value is returned
            directly by the wrapped forward.
        optimizer: Optimizer configuration for the probe. Accepted forms — string name
            (``"AdamW"``, ``"SGD"``, ``"LARS"``), a dict like
            ``{"type": "AdamW", "lr": 1e-3, ...}``, a pre-configured ``functools.partial``,
            an optimizer instance, or a callable. ``None`` uses
            ``LARS(lr=0.1, clip_lr=True, eta=0.02, exclude_bias_n_norm=True, weight_decay=0)``
            (the standard for SSL linear probes, default).
        scheduler: Learning rate scheduler configuration. Accepted forms — string name
            (``"CosineAnnealingLR"``, ``"StepLR"``), a dict
            ``{"type": "CosineAnnealingLR", "T_max": 1000, ...}``, a partial, a scheduler
            instance, or a callable. ``None`` uses ``ConstantLR(factor=1.0)``
            (constant LR, default).
        accumulate_grad_batches: Number of batches to accumulate gradients before
            optimizer step. Default is 1 (no accumulation).
        gradient_clip_val: Maximum gradient norm for clipping probe gradients.
            ``None`` disables clipping. Default is ``None``.
        gradient_clip_algorithm: Norm type used for gradient clipping — ``"norm"``
            (L2) or ``"value"`` (element-wise). Default is ``"norm"``.
        metrics: Metrics to track during training/validation. Can be dict, list, tuple,
            or single metric instance.
        verbose: If ``True``, log extra per-step detail. ``None`` inherits the
            global ``spt`` verbosity setting.

    Note:
        * The probe module is stored in ``pl_module.callbacks_modules[name]``.
        * Metrics are stored in ``pl_module.callbacks_metrics[name]``.
        * Predictions are stored in the dict returned by the wrapped ``forward``
          (the outputs dict) under the key ``'{name}_preds'``.
        * During ``"fit"`` the probe loss is added to ``outputs["loss"]``.
        * Loss is logged as ``'train/{name}_loss'``.
        * Metrics are logged with prefix ``'train/{name}_'`` and ``'eval/{name}_'``.
    """

    def __init__(
        self,
        module: LightningModule,
        name: str,
        input: str,
        target: str,
        probe: torch.nn.Module,
        loss: Optional[callable] = None,
        optimizer: Optional[Union[str, dict, partial, torch.optim.Optimizer]] = None,
        scheduler: Optional[
            Union[str, dict, partial, torch.optim.lr_scheduler.LRScheduler]
        ] = None,
        accumulate_grad_batches: int = 1,
        gradient_clip_val: Optional[float] = None,
        gradient_clip_algorithm: str = "norm",
        metrics: Optional[Union[dict, tuple, list, torchmetrics.Metric]] = None,
        verbose: Optional[bool] = None,
    ) -> None:
        from .utils import resolve_verbose

        # Probe-specific settings.
        # NOTE(review): these are assigned before the base initializer runs,
        # presumably because it may call configure_model() — confirm before
        # reordering.
        self.input = input
        self.target = target
        if loss is None:
            logging.warning(f"No loss given to {name}, will use output of `probe`")
        self.loss = loss
        self.verbose = resolve_verbose(verbose)

        # Store probe configuration for later initialization (configure_model).
        self._probe_config = probe

        # Initialize base class (optimizer / scheduler / clipping handling).
        super().__init__(
            module=module,
            name=name,
            optimizer=optimizer,
            scheduler=scheduler,
            accumulate_grad_batches=accumulate_grad_batches,
            gradient_clip_val=gradient_clip_val,
            gradient_clip_algorithm=gradient_clip_algorithm,
        )

        log_header("OnlineProbe")
        logging.info(f"  name: {self.name}")
        logging.info(f"  input: {input}")
        logging.info(f"  target: {target}")
        logging.info(f"  accumulate_grad_batches: {accumulate_grad_batches}")
        # Keep the metrics specification as given by the caller.
        self.metrics = metrics
        logging.info("  wrapping forward")
        self.wrap_forward(pl_module=module)

    def configure_model(self, pl_module: LightningModule) -> torch.nn.Module:
        """Initialize the probe module from configuration.

        Args:
            pl_module: The LightningModule being probed; passed to the probe
                factory when ``probe`` was given as a callable.

        Returns:
            The probe module: the configured ``nn.Module`` itself, or the
            result of calling the configured callable with ``pl_module``.

        Raises:
            ValueError: If the configured probe is neither a module nor a callable.
        """
        # An nn.Module is itself callable, so the instance check must come first.
        if isinstance(self._probe_config, torch.nn.Module):
            probe_module = self._probe_config
        elif callable(self._probe_config):
            probe_module = self._probe_config(pl_module)
        else:
            raise ValueError("the probe should be a module or a callable")
        return probe_module

    def wrap_forward(self, pl_module: LightningModule) -> None:
        """Replace ``pl_module.forward`` with a wrapper that also runs the probe.

        The wrapper calls the original forward as ``fn(batch, stage)`` and then:

        * if ``input``, ``target`` and ``loss`` are all ``None``, returns
          ``callback.module(batch, outputs, pl_module)`` directly;
        * otherwise fetches input/target, runs the probe on the detached input,
          stores predictions under ``'{name}_preds'`` in the outputs, adds the
          probe loss to ``outputs["loss"]`` during ``"fit"``, updates and logs
          the train/validation metrics, and returns the outputs.

        Args:
            pl_module: Module whose ``forward`` attribute is rebound in place.
        """
        fn = pl_module.forward

        # `self` below is the LightningModule the wrapper is bound to; the
        # callback and the original forward are frozen as default arguments.
        def new_forward(self, batch, stage, callback=self, fn=fn):
            outputs = fn(batch, stage)

            if (
                callback.input is None
                or callback.target is None
                or callback.loss is None
            ):
                # Custom mode: the probe handles batch/outputs itself. It is
                # only valid when all three settings are None.
                mixed_msg = (
                    f"Callback {callback.name}: `input`, `target` and `loss` "
                    "must either all be set or all be None"
                )
                assert callback.target is None, mixed_msg
                assert callback.input is None, mixed_msg
                assert callback.loss is None, mixed_msg
                return callback.module(batch, outputs, self)

            x = get_data_from_batch_or_outputs(
                callback.input, batch, outputs, caller_name=callback.name
            )
            y = get_data_from_batch_or_outputs(
                callback.target, batch, outputs, caller_name=callback.name
            )
            if x is None or y is None:
                raise ValueError(
                    f"Callback {callback.name} missing {callback.input} or {callback.target}"
                )

            # Detach so probe gradients never reach the main model.
            preds = callback.module(detach_tensors(x))
            y = detach_tensors(y)

            prediction_key = f"{callback.name}_preds"
            # Predictions are written to `outputs`, so guard that dict as well
            # as `batch` against silently overwriting an existing entry.
            clash_msg = f"Callback {callback.name}: key {prediction_key!r} already exists"
            assert prediction_key not in batch, clash_msg
            assert prediction_key not in outputs, clash_msg
            outputs[prediction_key] = preds

            scalar_logs = {}
            metric_logs = {}
            if stage == "fit":
                loss = callback.loss(preds, y)
                # Accumulate the probe loss into the total loss of the outputs.
                if "loss" not in outputs:
                    outputs["loss"] = 0
                outputs["loss"] = outputs["loss"] + loss
                scalar_logs[f"train/{callback.name}_loss"] = loss.item()

                # Training metrics are only updated here (no per-batch forward).
                my_metrics = self.callbacks_metrics[callback.name]["_train"]
                for metric_name, metric in my_metrics.items():
                    metric.update(preds, y)
                    metric_logs[f"train/{callback.name}_{metric_name}"] = metric
            elif stage == "validate":
                # Look metrics up on the bound module (`self`), not the module
                # captured at wrap time, so a re-bound/copied forward uses the
                # metrics of the module it actually runs on.
                my_metrics = self.callbacks_metrics[callback.name]["_val"]
                for metric_name, metric in my_metrics.items():
                    metric(preds, y)
                    metric_logs[f"eval/{callback.name}_{metric_name}"] = metric

            # Raw scalars (loss): sync across GPUs
            if scalar_logs:
                self.log_dict(scalar_logs, on_step=True, on_epoch=True, sync_dist=True)
            # torchmetrics: handle their own distributed sync, do NOT use sync_dist
            if metric_logs:
                self.log_dict(metric_logs, on_step=True, on_epoch=True, sync_dist=False)
            return outputs

        # Bind the new method to the instance
        pl_module.forward = types.MethodType(new_forward, pl_module)