# Source code for kooplearn.torch.nn._base

"""Loss functions for representation learning."""

from torch import Tensor
from torch.nn import Module

from kooplearn.torch.nn import _functional as F

# Public names of this module: the loss classes exported by a star-import.
__all__ = [
    "AutoEncoderLoss",
    "EnergyLoss",
    "SpectralContrastiveLoss",
    "VampLoss",
]



[docs]
class VampLoss(Module):
    r"""Variational Approach for learning Markov Processes (VAMP) score by
    :cite:t:`vamploss-Wu2019`.

    .. math::

        \mathcal{L}(x, y) = -\sum_{i} \sigma_{i}(A)^{p} \qquad \text{where}~A = \big(x^{\top}x\big)^{\dagger/2}x^{\top}y\big(y^{\top}y\big)^{\dagger/2}.

    Args:
        schatten_norm (int, optional): Computes the VAMP-p score with ``p = schatten_norm``.
            Defaults to 2.
        center_covariances (bool, optional): Use centered covariances to compute the VAMP score.
            Defaults to True.

    .. hint::
        Check out the `Ordered MNIST <../examples/ordered_mnist_torch.html>`_ example for a
        practical use of this loss function.
    """  # noqa: E501

    def __init__(
        self,
        schatten_norm: int = 2,
        center_covariances: bool = True,
    ) -> None:
        super().__init__()
        # Plain configuration attributes; they are only read back in ``forward``.
        self.schatten_norm = schatten_norm
        self.center_covariances = center_covariances

    def forward(self, x: Tensor, y: Tensor) -> Tensor:
        """Forward pass of VAMP loss.

        Delegates to ``F.vamp_loss`` with the ``schatten_norm`` and
        ``center_covariances`` values stored on this module.

        Args:
            x (Tensor): Features for x.
            y (Tensor): Features for y.

        Returns:
            Tensor: The value returned by ``F.vamp_loss``.

        Raises:
            NotImplementedError: If ``schatten_norm`` is not 1 or 2.

        Shape:
            ``x``: :math:`(N, D)`, where :math:`N` is the batch size and :math:`D` is the number of
            features.

            ``y``: :math:`(N, D)`, where :math:`N` is the batch size and :math:`D` is the number of
            features.
        """
        return F.vamp_loss(
            x,
            y,
            self.schatten_norm,
            self.center_covariances,
        )





[docs]
class SpectralContrastiveLoss(Module):
    r"""Spectral contrastive loss originally introduced by
    :cite:t:`spectralcontrastiveloss-haochen2021provable`, and adopted for evolution operators in
    :cite:t:`spectralcontrastiveloss-turri2025self, spectralcontrastiveloss-jeong2025efficient`.

    .. math::

        \mathcal{L}(x, y) = \frac{1}{N(N-1)}\sum_{i \neq j}\langle x_{i}, y_{j} \rangle^2 - \frac{2}{N}\sum_{i=1}^{N}\langle x_{i}, y_{i} \rangle.

    .. hint::
        Check out the `Ordered MNIST <../examples/ordered_mnist_torch.html>`_ example for a
        practical use of this loss function.
    """  # noqa: E501

    def __init__(
        self,
    ) -> None:
        # The loss has no configuration; only the base ``Module`` state is set up.
        super().__init__()

    def forward(self, x: Tensor, y: Tensor) -> Tensor:
        """Forward pass of the spectral contrastive loss.

        Delegates to ``F.spectral_contrastive_loss``.

        Args:
            x (Tensor): Input features.
            y (Tensor): Output features.

        Returns:
            Tensor: The value returned by ``F.spectral_contrastive_loss``.

        Shape:
            ``x``: :math:`(N, D)`, where :math:`N` is the batch size and :math:`D` is the number of
            features.

            ``y``: :math:`(N, D)`, where :math:`N` is the batch size and :math:`D` is the number of
            features.
        """
        return F.spectral_contrastive_loss(x, y)





[docs]
class AutoEncoderLoss(Module):
    r"""Single-step Dynamic Autoencoder (DAE) loss introduced by
    :cite:t:`autoencoderloss-Lusch2018`.

    This loss combines three objectives to train dynamic autoencoders:

    1. **Reconstruction loss** — measures how well the autoencoder reconstructs inputs.
    2. **Linearity loss** — enforces linear evolution in latent space.
    3. **Prediction loss** — penalizes errors between predicted and actual outputs.

    The total loss is a weighted sum:

    .. math::
        \mathcal{L} =
        \alpha_\mathrm{rec} \, \|x - \phi^{-1}(\phi(x)) \|^2 +
        \alpha_\mathrm{lin} \, \|\phi(y) - K\phi(x) \|^2 +
        \alpha_\mathrm{pred} \, \|y - \phi^{-1}(K\phi(x))\|^2

    where :math:`\phi^{-1}(\phi(x))` is the reconstruction of :math:`x`,
    :math:`\phi(y)` is the encoded output,
    :math:`K\phi(x)` is the evolved input latent representation,
    and :math:`\phi^{-1}(K\phi(x))` is the predicted decoded output.

    .. hint::
        Check out the `Ordered MNIST <../examples/ordered_mnist_torch.html>`_ example for a
        practical use of this loss function.
    """

    def __init__(
        self,
        alpha_rec: float = 1.0,
        alpha_lin: float = 1.0,
        alpha_pred: float = 1.0,
    ) -> None:
        r"""Initialize the Dynamic Autoencoder (DAE) loss.

        Parameters
        ----------
        alpha_rec : float, default=1.0
            Weight for the reconstruction term :math:`\|x - \phi^{-1}(\phi(x)) \|^2`.
        alpha_lin : float, default=1.0
            Weight for the linearity term :math:`\|\phi(y) - K\phi(x) \|^2`.
        alpha_pred : float, default=1.0
            Weight for the prediction term :math:`\|y - \phi^{-1}(K\phi(x))\|^2`.
        """
        super().__init__()
        # The three weights are stored as given and forwarded unchanged in ``forward``.
        self.alpha_rec = alpha_rec
        self.alpha_lin = alpha_lin
        self.alpha_pred = alpha_pred

    def forward(
        self,
        x: Tensor,
        y: Tensor,
        x_rec: Tensor,
        y_enc: Tensor,
        x_evo: Tensor,
        y_pred: Tensor,
    ) -> Tensor:
        """Compute the Dynamic Autoencoder loss.

        Delegates to ``F.dynamic_ae_loss``, passing the six tensors followed by the
        ``alpha_rec``, ``alpha_lin`` and ``alpha_pred`` weights stored on this module.

        Parameters
        ----------
        x : torch.Tensor
            Input features of shape ``(N, D)``, where ``N`` is the batch size
            and ``D`` is the feature dimension.
        y : torch.Tensor
            Output (target) features. Same shape as ``x``.
        x_rec : torch.Tensor
            Reconstructed version of the input ``x`` produced by the decoder. Same shape as ``x``.
        y_enc : torch.Tensor
            Encoded latent representation of the target ``y``.
        x_evo : torch.Tensor
            Evolved latent representation obtained by applying the learned
            linear operator to the latent encoding of ``x``. Presumably the same
            shape as ``y_enc``, since the linearity term compares the two —
            confirm against ``F.dynamic_ae_loss``.
        y_pred : torch.Tensor
            Predicted decoded output corresponding to the evolved latent state. Same shape as ``x``.

        Returns
        -------
        torch.Tensor
            A scalar tensor representing the total dynamic autoencoder loss.
        """
        return F.dynamic_ae_loss(
            x,
            y,
            x_rec,
            y_enc,
            x_evo,
            y_pred,
            self.alpha_rec,
            self.alpha_lin,
            self.alpha_pred,
        )





[docs]
class EnergyLoss(Module):
    r"""Energy-based loss function.

    Computes an energy-based loss that incorporates second-order information
    (Jacobians) into the learning process.

    The loss is computed as:

    .. math::

        \mathcal{L}(x, y) = \text{tr}(W^2) - 2\langle x, x \rangle \cdot L

    where

    .. math::

        W = \frac{1}{N}(xx^\top + \lambda yy^\top)

    and:

    - :math:`x \in \mathbb{R}^{N \times L}` are input features
    - :math:`y \in \mathbb{R}^{N \times DL}` are Jacobian features
      (reshaped from :math:`(N, D, L)`)
    - :math:`\lambda` is the ``grad_weight`` parameter controlling Jacobian
      contribution
    - :math:`N` is the batch size
    - :math:`D` is the state space dimensionality
    - :math:`L` is the latent space dimensionality

    .. hint::
        Check out the `Prinz Potential <../examples/prinz_potential.html>`_ example for a practical
        use of this loss function.

    Parameters
    ----------
    grad_weight : float, optional
        Weight for the Jacobian contribution. Must be non-negative. Controls how much
        the Jacobian term contributes to the total loss. Default is 1e-3.
    """

    def __init__(
        self,
        grad_weight: float = 1e-3,
    ) -> None:
        """Initialize the Energy-based loss.

        Parameters
        ----------
        grad_weight : float, optional
            Weight for the Jacobian contribution. Must be non-negative.
            Controls how much the Jacobian term contributes to the total
            loss. Default is 1e-3.
        """
        super().__init__()
        # Stored as given; no validation of the non-negativity requirement happens here.
        self.grad_weight = grad_weight

    def forward(self, x: Tensor, y: Tensor) -> Tensor:
        r"""Compute the energy-based loss combining input and Jacobian features.

        Delegates to ``F.energy_loss`` with the ``grad_weight`` stored on this module.

        Parameters
        ----------
        x : Tensor
            Input features of shape :math:`(N, L)`, where :math:`N` is the batch size
            and :math:`L` is the dimensionality of the latent space.
        y : Tensor
            Jacobian features of shape :math:`(N, D, L)`, where :math:`N`
            is the batch size, :math:`D` is the state space dimensionality,
            and :math:`L` is the latent space dimensionality.

        Returns
        -------
        Tensor
            Scalar loss value.
        """
        return F.energy_loss(x, y, self.grad_weight)