Source code for tfep.nn.embeddings.mafembed

#!/usr/bin/env python


# =============================================================================
# MODULE DOCSTRING
# =============================================================================

"""
Embedding layers for masked autoregressive flows (MAF).
"""


# =============================================================================
# GLOBAL IMPORTS
# =============================================================================

import abc
from collections.abc import Sequence
from typing import Optional

import torch

from tfep.utils.misc import ensure_tensor_sequence, remove_and_shift_sorted_indices


# =============================================================================
# BASE CLASS
# =============================================================================


[docs]
class MAFEmbedding(abc.ABC, torch.nn.Module):
    """An embedding layer for a masked autoregressive flow.

    This class documents the API of an embedding layer compatible with
    :class:`tfep.nn.flows.maf.MAF`.

    """


[docs]
    @abc.abstractmethod
    def get_degrees_out(self, degrees_in: torch.Tensor) -> torch.Tensor:
        """Return the degrees of the features after the forward pass.

        These are the degrees that will be passed as input to the conditioner.

        The periodic features after the forward are represented as 2 features
        (cosine and sine) that both are assigned the same degree as the input
        feature.

        Parameters
        ----------
        degrees_in : torch.Tensor
            The degrees of the input features.

        Returns
        -------
        degrees_out : torch.Tensor
            The degrees of the features after the forward pass.
        """
        pass




# =============================================================================
# PERIODIC EMBEDDING
# =============================================================================


[docs]
class PeriodicEmbedding(MAFEmbedding):
    """Lift periodic degrees of freedom into a periodic representation (cos, sin)."""


[docs]
    def __init__(
            self,
            n_features_in : int,
            limits : Sequence[float],
            periodic_indices : Optional[Sequence[int]] = None,
    ):
        """Constructor.

        Parameters
        ----------
        n_features_in : int
            Number of input features.
        limits : Sequence[float]
            A pair ``(lower, upper)`` defining the limits of the periodic
            variables. The period is given by ``upper - lower``.
        periodic_indices : Sequence[int] or None, optional
            Shape (n_periodic,). The (ordered) indices of the input features
            that are periodic and must be lifted to the (cos, sin)
            representation. If ``None``, all features are embedded.

        """
        super().__init__()

        # Limits.
        self.register_buffer('limits', ensure_tensor_sequence(limits))

        # Periodic feature indices.
        if periodic_indices is None:
            periodic_indices = torch.arange(n_features_in)
        else:
            periodic_indices = ensure_tensor_sequence(periodic_indices)
            # Check if there are repeated entries.
            if len(periodic_indices.unique()) < len(periodic_indices):
                raise ValueError('Found duplicated indices in periodic_indices.')
        self.register_buffer('_periodic_indices', periodic_indices)

        # Cache the nonperiodic indices to avoid recomputing them at each pass.
        nonperiodic_indices = remove_and_shift_sorted_indices(
            indices=torch.arange(n_features_in),
            removed_indices=periodic_indices,
            shift=False,
        )
        self.register_buffer('_nonperiodic_indices', nonperiodic_indices)



[docs]
    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Lift each periodic degree of freedom x into a periodic representation (cosx, sinx).

        Parameters
        ----------
        x : torch.Tensor
            Shape ``(batch_size, n_features)``. Input tensor.

        Returns
        -------
        out : torch.Tensor
            Shape ``(batch_size, n_features + n_periodic)``. The input with the
            periodic DOFs transformed. The cosx, sinx representation is placed
            contiguously where the original DOF was. E.g., if ``2`` is the first
            element in ``periodic_indices``, then cos and sin will be placed at
            ``y[:, 2]`` and ``y[:, 3]`` respectively.
        """
        batch_size = x.shape[0]

        # Transform periodic interval to [0, 2pi].
        period_scale = 2*torch.pi / (self.limits[1] - self.limits[0])
        x_periodic = (x[:, self._periodic_indices] - self.limits[0]) * period_scale

        # Embed.
        return torch.cat([
            x[:, self._nonperiodic_indices],
            torch.stack([
                torch.cos(x_periodic),
                torch.sin(x_periodic),
            ], dim=2).reshape(batch_size, -1),
        ], dim=1)



[docs]
    def get_degrees_out(self, degrees_in: torch.Tensor) -> torch.Tensor:
        """Return the degrees of the features after the forward pass.

        These are the degrees that will be passed as input to the conditioner.

        The periodic features after the forward are represented as 2 features
        (cosine and sine) that both are assigned the same degree as the input
        feature.

        Parameters
        ----------
        degrees_in : torch.Tensor
            The degrees of the input features.

        Returns
        -------
        degrees_out : torch.Tensor
            The degrees of the features after the forward pass.

        """
        return torch.cat([
            degrees_in[self._nonperiodic_indices],
            degrees_in[self._periodic_indices].repeat_interleave(2)
        ])




# =============================================================================
# FLIP-INVARIANT EMBEDDING
# =============================================================================


[docs]
class FlipInvariantEmbedding(MAFEmbedding):
    """Embeds vector features into a representation invariant to sign flips.

    This implements the embedding proposed in [1] (Equation 46 in the SI).

    References
    ----------
    [1] Köhler J, Invernizzi M, De Haan P, Noé F. Rigid body flows for sampling
        molecular crystal structures. In International Conference on Machine
        Learning 2023 Jul 3 (pp. 17301-17326). PMLR.

    """


[docs]
    def __init__(
            self,
            n_features_in : int,
            embedding_dimension : int,
            embedded_indices : Optional[Sequence[int]] = None,
            vector_dimension : int = 4,
            hidden_layer_width : int = 32,
    ):
        """Constructor.

        Parameters
        ----------
        n_features_in : int
            Number of input features (embedded and not).
        embedding_dimension : int
            The embedding dimension of each vector.
        embedded_indices : Sequence[int] or None, optional
            A sequence of length ``n_vectors*vector_dimension`` with the
            (ordered) indices of the input features corresponding to the
            vectors to embed. Vectors are assumed to be represented by
            consecutive elements. If ``None``, all features are embedded.
        vector_dimension : int, optional
            The dimension of the embedded vectors. Default is 4.
        hidden_layer_width : int, optional
            The width of the hidden layer of the fully-connected neural
            networks used to embed the vectors. Default is 32.

        """
        super().__init__()

        # Create NNP layers for the embedding.
        self.embedding_layer = torch.nn.Sequential(
            torch.nn.Linear(vector_dimension, hidden_layer_width),
            torch.nn.ELU(),
            torch.nn.Linear(hidden_layer_width, embedding_dimension),
        )
        self.weight_layer = torch.nn.Sequential(
            torch.nn.Linear(vector_dimension, hidden_layer_width),
            torch.nn.ELU(),
            torch.nn.Linear(hidden_layer_width, 1),
        )

        # Embedded indices.
        if embedded_indices is None:
            embedded_indices = torch.arange(n_features_in)
        else:
            embedded_indices = ensure_tensor_sequence(embedded_indices)
            # Check if there are repeated entries.
            if len(embedded_indices.unique()) < len(embedded_indices):
                raise ValueError('Found duplicated indices in embedded_indices.')
        self.register_buffer('_embedded_indices', embedded_indices)

        # Cache the nonembedded indices to avoid recomputing them at each pass.
        nonembedded_indices = remove_and_shift_sorted_indices(
            indices=torch.arange(n_features_in),
            removed_indices=embedded_indices,
            shift=False,
        )
        self.register_buffer('_nonembedded_indices', nonembedded_indices)


    @property
    def vector_dimension(self) -> int:
        """int: The input vector dimensionality."""
        return self.embedding_layer[0].in_features

    @property
    def embedding_dimension(self) -> int:
        """int: The embedding dimension for each vector."""
        return self.embedding_layer[-1].out_features


[docs]
    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Forward.

        Parameters
        ----------
        x : torch.Tensor
            Shape ``(batch, n_features)``. Input tensor.

        Returns
        -------
        out : torch.Tensor
            Shape ``(batch, n_features + n_vectors*(embedded_dim - vector_dim))``.
            The transformed features with the ``n_vectors`` vectors embedded
            from the ``vector_dim`` to an ``embedded_dim`` space.

        """
        batch_size = x.shape[0]

        # Extract vectors.
        vectors = x[:, self._embedded_indices]

        # From (batch, n_vectors*vector_dim) to (batch*n_vectors, vector_dim).
        vectors = vectors.reshape(-1, self.vector_dimension)

        # Find the positive and negative embeddings.
        # Out shape is (batch*n_vectors, 2, embedding_dim).
        embedded_vectors = torch.stack([
            self.embedding_layer(vectors),
            self.embedding_layer(-vectors)
        ], dim=1)

        # Find the softmax weights for the positive and negative embeddings.
        # Out shape is (batch*n_vectors, 2, 1).
        weights = torch.softmax(torch.stack([
            self.weight_layer(vectors),
            self.weight_layer(-vectors),
        ], dim=1), dim=1)

        # Weighted sum the positive and negative embeddings.
        # Out shape is (batch*n_vectors, embedding_dim)
        embedded_vectors = (weights * embedded_vectors).sum(dim=1)

        # From (batch*n_vectors, embedding_dim) to (batch, n_vectors*embedding_dim).
        embedded_vectors = embedded_vectors.reshape(batch_size, -1)

        # Return embedded features.
        return torch.cat([
            x[:, self._nonembedded_indices],
            embedded_vectors,
        ], dim=1)



[docs]
    def get_degrees_out(self, degrees_in: torch.Tensor) -> torch.Tensor:
        """Return the degrees of the features after the forward pass.

        This requires that all components of each vector is assigned a single
        degree.

        Parameters
        ----------
        degrees_in : torch.Tensor
            Shape ``(n_features_in,)``. The degrees of the input features.

        Returns
        -------
        degrees_out : torch.Tensor
            Shape ``(n_features_out,)``. The degrees of the features after the
            forward pass.

        Raises
        ------
        ValueError
            If there are some embedded vectors whose components have been
            assigned different degrees.

        """
        # Get the degrees of the input vectors. Shape (n_vectors, vector_dimension).
        vec_degrees_in = degrees_in[self._embedded_indices].reshape(-1, self.vector_dimension)

        # All components of each vector must be assigned to the same degree.
        if not torch.all(vec_degrees_in == vec_degrees_in[:, [0]]):
            raise ValueError('The same degree must be assigned to all '
                             'components of each embedded vectors.')

        # Update vector degrees from vector to embedding dimension.
        vec_degrees_in = vec_degrees_in[:, [0]].expand(-1, self.embedding_dimension)
        
        # Concatenate to non-embedded features.
        return torch.cat([
            degrees_in[self._nonembedded_indices],
            vec_degrees_in.flatten(),
        ])




# =============================================================================
# MIXED EMBEDDING
# =============================================================================


[docs]
class MixedEmbedding(MAFEmbedding):
    """Utility class mixing multiple embeddings.

    The class forwards to the mixed embedding layers only the features assigned
    to them.

    """


[docs]
    def __init__(
            self,
            n_features_in : int,
            embedding_layers : Sequence[MAFEmbedding],
            embedded_indices : Sequence[Sequence[int]],
    ):
        """Constructor.

        Parameters
        ----------
        n_features_in : int
            Number of input features (embedded and not).
        embedding_layers : Sequence[MAFEmbedding]
            The embedding layers to mix.
        embedded_indices : Sequence[Sequence[int]]
            ``embedded_indices[i]`` is the set of indices passed to the
            ``i``-th embedding layer. The indices cannot overlap.

        """
        super().__init__()

        # Check the two lengths are equal.
        if len(embedding_layers) != len(embedded_indices):
            raise ValueError('Different number of layers and indices.')

        # Convert to tensor.
        embedded_indices = [ensure_tensor_sequence(indices) for indices in embedded_indices]

        # Check that indices do not overlap.
        indices0_set = set(embedded_indices[0].tolist())
        for indices in embedded_indices[1:]:
            if len(indices0_set & set(indices.tolist())) > 0:
                raise ValueError('Different embedding layers must be assigned '
                                 'to different feature indices.')

        # Save embedding layers.
        self.embedding_layers = torch.nn.ModuleList(embedding_layers)

        # Cache embedded and nonembedd indices.
        for i, indices in enumerate(embedded_indices):
            self.register_buffer(f'_embedded_indices{i}', indices)

        nonbedded_indices = remove_and_shift_sorted_indices(
            indices=torch.arange(n_features_in),
            removed_indices=torch.cat(embedded_indices).sort().values,
            shift=False,
        )
        self.register_buffer('_nonembedded_indices', nonbedded_indices)



[docs]
    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Forward.

        Parameters
        ----------
        x : torch.Tensor
            Shape ``(batch, n_features_in)``. Input tensor.

        Returns
        -------
        out : torch.Tensor
            Shape ``(batch, n_features_out``. The embedded features.

        """
        x_embedded = [layer(x[:, getattr(self, f'_embedded_indices{i}')])
                      for i, layer in enumerate(self.embedding_layers)]
        return torch.cat([x[:, self._nonembedded_indices], *x_embedded], dim=1)



[docs]
    def get_degrees_out(self, degrees_in: torch.Tensor) -> torch.Tensor:
        """Return the degrees of the features after the embedding.

        Parameters
        ----------
        degrees_in : torch.Tensor
            Shape ``(n_features_in,)``. The degrees of the input features.

        Returns
        -------
        degrees_out : torch.Tensor
            Shape ``(n_features_out,)``. The degrees of the features after the
            embedding.

        """
        deg_out = [layer.get_degrees_out(degrees_in[getattr(self, f'_embedded_indices{i}')])
                   for i, layer in enumerate(self.embedding_layers)]
        return torch.cat([degrees_in[self._nonembedded_indices], *deg_out])