Source code for cockpit.quantities.distance

"""Class for tracking distance from initialization."""

from cockpit.quantities.quantity import TwoStepQuantity


class Distance(TwoStepQuantity):
    """Distance Quantity class tracking distance of the parameters from their init.

    A copy of the parameters is cached at iteration ``INIT_GLOBAL_STEP``. At every
    end point, the layer-wise L2 distance between the current parameters and that
    cached copy is computed.
    """

    CACHE_KEY = "params"
    """str: String under which the parameters are cached for computation.
       Default: ``'params'``.
    """
    INIT_GLOBAL_STEP = 0
    """int: Iteration number used as reference. Defaults to ``0``."""

    def extensions(self, global_step):
        """Return list of BackPACK extensions required for the computation.

        The distance only needs the parameter values, so no extension is requested.

        Args:
            global_step (int): The current iteration number.

        Returns:
            list: (Potentially empty) list with required BackPACK quantities.
        """
        return []

    def is_start(self, global_step):
        """Return whether current iteration is start point.

        Only the initialization (iteration ``INIT_GLOBAL_STEP``) is a start point.

        Args:
            global_step (int): The current iteration number.

        Returns:
            bool: Whether ``global_step`` is a start point.
        """
        return global_step == self.INIT_GLOBAL_STEP

    def is_end(self, global_step):
        """Return whether current iteration is end point.

        The decision is delegated to ``self._track_schedule``, which is not defined
        in this class (presumably provided by the parent class or at construction).

        Args:
            global_step (int): The current iteration number.

        Returns:
            bool: Whether ``global_step`` is an end point.
        """
        return self._track_schedule(global_step)

    def _compute_start(self, global_step, params, batch_loss):
        """Perform computations at start point (store initial parameter values).

        Stores a copy of the parameters via ``self.save_to_cache`` under
        ``CACHE_KEY`` for iteration ``global_step``.

        Args:
            global_step (int): The current iteration number.
            params ([torch.Tensor]): List of torch.Tensors holding the network's
                parameters.
            batch_loss (torch.Tensor): Mini-batch loss from current step. Unused.
        """
        # ``.data`` is already outside of autograd, so ``clone`` alone yields an
        # independent snapshot that later parameter updates do not modify.
        params_copy = [p.data.clone() for p in params]

        def block_fn(step):
            """Block deletion of the cached parameters from the reference step on.

            Args:
                step (int): Iteration number.

            Returns:
                bool: Whether deletion is blocked in the specified iteration.
            """
            return step >= self.INIT_GLOBAL_STEP

        self.save_to_cache(global_step, self.CACHE_KEY, params_copy, block_fn)

    def _compute_end(self, global_step, params, batch_loss):
        """Compute and return the current distance from initialization.

        Args:
            global_step (int): The current iteration number. Unused; the reference
                values are always loaded from iteration ``INIT_GLOBAL_STEP``.
            params ([torch.Tensor]): List of torch.Tensors holding the network's
                parameters.
            batch_loss (torch.Tensor): Mini-batch loss from current step. Unused.

        Returns:
            [float]: Layer-wise L2-distances to initialization.
        """
        params_init = self.load_from_cache(self.INIT_GLOBAL_STEP, self.CACHE_KEY)

        # One scalar per parameter tensor: 2-norm of the difference to its snapshot.
        return [
            (p.data - p_init).norm(2).item() for p, p_init in zip(params, params_init)
        ]