
L1 (absolute error) loss


L1AbsoluteLoss

Bases: Metric

L1 (absolute error) loss.

The L1 loss penalty is the absolute sum of the learned activations, averaged over the number of activation vectors.

Example

>>> l1_loss = L1AbsoluteLoss()
>>> learned_activations = torch.tensor([
...     [  # Batch 1
...         [1., 0., 1.]  # Component 1: learned features (L1 of 2)
...     ],
...     [  # Batch 2
...         [0., 1., 0.]  # Component 1: learned features (L1 of 1)
...     ]
... ])
>>> l1_loss.forward(learned_activations=learned_activations)
tensor(1.5000)
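
For reference, the reported value matches a direct computation with plain torch ops (a minimal sketch, not part of the library API):

>>> import torch
>>> learned_activations = torch.tensor([
...     [[1., 0., 1.]],  # batch item 1: L1 sum of 2
...     [[0., 1., 0.]],  # batch item 2: L1 sum of 1
... ])
>>> torch.abs(learned_activations).sum(dim=-1).mean(dim=0)  # mean over the batch
tensor([1.5000])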

Source code in sparse_autoencoder/metrics/loss/l1_absolute_loss.py
from typing import Any

import torch
from jaxtyping import Float, Int64
from pydantic import PositiveInt, validate_call
from torch import Tensor
from torchmetrics import Metric

from sparse_autoencoder.tensor_types import Axis  # assumed module path for Axis


class L1AbsoluteLoss(Metric):
    """L1 (absolute error) loss.

    L1 loss penalty is the absolute sum of the learned activations, averaged over the number of
    activation vectors.

    Example:
        >>> l1_loss = L1AbsoluteLoss()
        >>> learned_activations = torch.tensor([
        ...     [ # Batch 1
        ...         [1., 0., 1.] # Component 1: learned features (L1 of 2)
        ...     ],
        ...     [ # Batch 2
        ...         [0., 1., 0.] # Component 1: learned features (L1 of 1)
        ...     ]
        ... ])
        >>> l1_loss.forward(learned_activations=learned_activations)
        tensor(1.5000)
    """

    # Torchmetrics settings
    is_differentiable: bool | None = True
    full_state_update: bool | None = False
    plot_lower_bound: float | None = 0.0

    # Settings
    _num_components: int
    _keep_batch_dim: bool

    @property
    def keep_batch_dim(self) -> bool:
        """Whether to keep the batch dimension in the loss output."""
        return self._keep_batch_dim

    @keep_batch_dim.setter
    def keep_batch_dim(self, keep_batch_dim: bool) -> None:
        """Set whether to keep the batch dimension in the loss output.

        When setting this we need to change the state to either a list if keeping the batch
        dimension (so we can accumulate all the losses and concatenate them at the end along this
        dimension). Alternatively it should be a tensor if not keeping the batch dimension (so we
        can sum the losses over the batch dimension during update and then take the mean).

        By doing this in a setter we allow changing of this setting after the metric is initialised.
        """
        self._keep_batch_dim = keep_batch_dim
        self.reset()  # Reset the metric to update the state
        if keep_batch_dim and not isinstance(self.absolute_loss, list):
            self.add_state(
                "absolute_loss",
                default=[],
                dist_reduce_fx="sum",
            )
        elif not isinstance(self.absolute_loss, Tensor):
            self.add_state(
                "absolute_loss",
                default=torch.zeros(self._num_components),
                dist_reduce_fx="sum",
            )

    # State
    absolute_loss: Float[Tensor, Axis.names(Axis.COMPONENT_OPTIONAL)] | list[
        Float[Tensor, Axis.names(Axis.BATCH, Axis.COMPONENT_OPTIONAL)]
    ] | None = None
    num_activation_vectors: Int64[Tensor, Axis.SINGLE_ITEM]

    @validate_call
    def __init__(
        self,
        num_components: PositiveInt = 1,
        *,
        keep_batch_dim: bool = False,
    ) -> None:
        """Initialize the metric.

        Args:
            num_components: Number of components.
            keep_batch_dim: Whether to keep the batch dimension in the loss output.
        """
        super().__init__()
        self._num_components = num_components
        self.keep_batch_dim = keep_batch_dim
        self.add_state(
            "num_activation_vectors",
            default=torch.tensor(0, dtype=torch.int64),
            dist_reduce_fx="sum",
        )

    @staticmethod
    def calculate_abs_sum(
        learned_activations: Float[
            Tensor, Axis.names(Axis.BATCH, Axis.COMPONENT_OPTIONAL, Axis.LEARNT_FEATURE)
        ],
    ) -> Float[Tensor, Axis.names(Axis.BATCH, Axis.COMPONENT_OPTIONAL)]:
        """Calculate the absolute sum of the learned activations.

        Args:
            learned_activations: Learned activations (intermediate activations in the autoencoder).

        Returns:
            Absolute sum of the learned activations (keeping the batch and component axis).
        """
        return torch.abs(learned_activations).sum(dim=-1)

    def update(
        self,
        learned_activations: Float[
            Tensor, Axis.names(Axis.BATCH, Axis.COMPONENT_OPTIONAL, Axis.LEARNT_FEATURE)
        ],
        **kwargs: Any,  # type: ignore # noqa: ARG002, ANN401 (allows combining with other metrics)
    ) -> None:
        """Update the metric state.

        If we're keeping the batch dimension, we simply take the absolute sum of the activations
        (over the features dimension) and then append this tensor to a list. Then during compute we
        just concatenate and return this list. This is useful for e.g. getting L1 loss by batch item
        when resampling neurons (see the neuron resampler for details).

        By contrast if we're averaging over the batch dimension, we sum the activations over the
        batch dimension during update (on each process), and then divide by the number of activation
        vectors on compute to get the mean.

        Args:
            learned_activations: Learned activations (intermediate activations in the autoencoder).
            **kwargs: Ignored keyword arguments (to allow use with other metrics in a collection).
        """
        absolute_loss = self.calculate_abs_sum(learned_activations)

        if self.keep_batch_dim:
            self.absolute_loss.append(absolute_loss)  # type: ignore
        else:
            self.absolute_loss += absolute_loss.sum(dim=0)
            self.num_activation_vectors += learned_activations.shape[0]

    def compute(self) -> Tensor:
        """Compute the metric."""
        return (
            torch.cat(self.absolute_loss)  # type: ignore
            if self.keep_batch_dim
            else self.absolute_loss / self.num_activation_vectors
        )

keep_batch_dim: bool (instance attribute, writable property)

Whether to keep the batch dimension in the loss output.
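
Because keep_batch_dim is a writable property, the state layout can be switched after the metric is initialised; a minimal sketch (import path taken from the source file location shown above):

>>> import torch
>>> from sparse_autoencoder.metrics.loss.l1_absolute_loss import L1AbsoluteLoss
>>> metric = L1AbsoluteLoss()
>>> metric.keep_batch_dim = True  # setter resets the state to a list of per-item losses
>>> metric.update(learned_activations=torch.ones(4, 1, 3))
>>> metric.compute().shape  # one L1 value per batch item, per component
torch.Size([4, 1])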

__init__(num_components=1, *, keep_batch_dim=False)

Initialize the metric.

Parameters:

    num_components (PositiveInt, default: 1)
        Number of components.

    keep_batch_dim (bool, default: False)
        Whether to keep the batch dimension in the loss output.
Source code in sparse_autoencoder/metrics/loss/l1_absolute_loss.py
@validate_call
def __init__(
    self,
    num_components: PositiveInt = 1,
    *,
    keep_batch_dim: bool = False,
) -> None:
    """Initialize the metric.

    Args:
        num_components: Number of components.
        keep_batch_dim: Whether to keep the batch dimension in the loss output.
    """
    super().__init__()
    self._num_components = num_components
    self.keep_batch_dim = keep_batch_dim
    self.add_state(
        "num_activation_vectors",
        default=torch.tensor(0, dtype=torch.int64),
        dist_reduce_fx="sum",
    )
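
A short usage sketch with more than one component (shapes follow the axis annotations in the source; import path from the file location shown above):

>>> import torch
>>> from sparse_autoencoder.metrics.loss.l1_absolute_loss import L1AbsoluteLoss
>>> metric = L1AbsoluteLoss(num_components=2)
>>> metric.update(learned_activations=torch.rand(8, 2, 16))  # (batch, component, learnt feature)
>>> metric.compute().shape  # one mean L1 per component
torch.Size([2])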

calculate_abs_sum(learned_activations) (staticmethod)

Calculate the absolute sum of the learned activations.

Parameters:

    learned_activations (Float[Tensor, names(BATCH, COMPONENT_OPTIONAL, LEARNT_FEATURE)], required)
        Learned activations (intermediate activations in the autoencoder).

Returns:

    Float[Tensor, names(BATCH, COMPONENT_OPTIONAL)]
        Absolute sum of the learned activations (keeping the batch and component axis).
Source code in sparse_autoencoder/metrics/loss/l1_absolute_loss.py
@staticmethod
def calculate_abs_sum(
    learned_activations: Float[
        Tensor, Axis.names(Axis.BATCH, Axis.COMPONENT_OPTIONAL, Axis.LEARNT_FEATURE)
    ],
) -> Float[Tensor, Axis.names(Axis.BATCH, Axis.COMPONENT_OPTIONAL)]:
    """Calculate the absolute sum of the learned activations.

    Args:
        learned_activations: Learned activations (intermediate activations in the autoencoder).

    Returns:
        Absolute sum of the learned activations (keeping the batch and component axis).
    """
    return torch.abs(learned_activations).sum(dim=-1)
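
As a static method this can also be called without instantiating the metric; a quick arithmetic check:

>>> import torch
>>> from sparse_autoencoder.metrics.loss.l1_absolute_loss import L1AbsoluteLoss
>>> L1AbsoluteLoss.calculate_abs_sum(torch.tensor([[[-1., 2., -3.]]]))
tensor([[6.]])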

compute()

Compute the metric.

Source code in sparse_autoencoder/metrics/loss/l1_absolute_loss.py
def compute(self) -> Tensor:
    """Compute the metric."""
    return (
        torch.cat(self.absolute_loss)  # type: ignore
        if self.keep_batch_dim
        else self.absolute_loss / self.num_activation_vectors
    )
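
When the batch dimension is not kept, compute divides the summed state by the number of activation vectors seen; a minimal sketch where every activation vector has an L1 sum of 8:

>>> import torch
>>> from sparse_autoencoder.metrics.loss.l1_absolute_loss import L1AbsoluteLoss
>>> metric = L1AbsoluteLoss()
>>> for _ in range(3):
...     metric.update(learned_activations=torch.ones(4, 1, 8))
>>> metric.compute()  # 96.0 summed over 12 activation vectors
tensor([8.])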

update(learned_activations, **kwargs)

Update the metric state.

If we're keeping the batch dimension, we simply take the absolute sum of the activations (over the features dimension) and then append this tensor to a list. Then during compute we just concatenate and return this list. This is useful for e.g. getting L1 loss by batch item when resampling neurons (see the neuron resampler for details).

By contrast if we're averaging over the batch dimension, we sum the activations over the batch dimension during update (on each process), and then divide by the number of activation vectors on compute to get the mean.

Parameters:

    learned_activations (Float[Tensor, names(BATCH, COMPONENT_OPTIONAL, LEARNT_FEATURE)], required)
        Learned activations (intermediate activations in the autoencoder).

    **kwargs (Any, default: {})
        Ignored keyword arguments (to allow use with other metrics in a collection).
Source code in sparse_autoencoder/metrics/loss/l1_absolute_loss.py
def update(
    self,
    learned_activations: Float[
        Tensor, Axis.names(Axis.BATCH, Axis.COMPONENT_OPTIONAL, Axis.LEARNT_FEATURE)
    ],
    **kwargs: Any,  # type: ignore # noqa: ARG002, ANN401 (allows combining with other metrics)
) -> None:
    """Update the metric state.

    If we're keeping the batch dimension, we simply take the absolute sum of the activations
    (over the features dimension) and then append this tensor to a list. Then during compute we
    just concatenate and return this list. This is useful for e.g. getting L1 loss by batch item
    when resampling neurons (see the neuron resampler for details).

    By contrast if we're averaging over the batch dimension, we sum the activations over the
    batch dimension during update (on each process), and then divide by the number of activation
    vectors on compute to get the mean.

    Args:
        learned_activations: Learned activations (intermediate activations in the autoencoder).
        **kwargs: Ignored keyword arguments (to allow use with other metrics in a collection).
    """
    absolute_loss = self.calculate_abs_sum(learned_activations)

    if self.keep_batch_dim:
        self.absolute_loss.append(absolute_loss)  # type: ignore
    else:
        self.absolute_loss += absolute_loss.sum(dim=0)
        self.num_activation_vectors += learned_activations.shape[0]
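
With keep_batch_dim=True, successive updates append per-item rows that compute concatenates along the batch axis (the per-item losses used when resampling neurons); a minimal sketch:

>>> import torch
>>> from sparse_autoencoder.metrics.loss.l1_absolute_loss import L1AbsoluteLoss
>>> metric = L1AbsoluteLoss(keep_batch_dim=True)
>>> metric.update(learned_activations=torch.rand(4, 1, 16))
>>> metric.update(learned_activations=torch.rand(4, 1, 16))
>>> metric.compute().shape  # one L1 value per batch item, per component
torch.Size([8, 1])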