import functools
from typing import Callable, Mapping, Optional, Union
import e3nn
import torch
from e3nn import o3
from e3tools import scatter
from ._gate import Gated
from ._interaction import LinearSelfInteraction
from ._mlp import ScalarMLP
from ._tensor_product import ExperimentalTensorProduct, SeparableTensorProduct
class Conv(torch.nn.Module):
"""
Equivariant convolution layer
ref: https://arxiv.org/abs/1802.08219
"""
def __init__(
self,
irreps_in: Union[str, e3nn.o3.Irreps],
irreps_out: Union[str, e3nn.o3.Irreps],
irreps_sh: Union[str, e3nn.o3.Irreps],
edge_attr_dim: int,
radial_nn: Optional[Callable[..., torch.nn.Module]] = None,
tensor_product: Optional[Callable[..., torch.nn.Module]] = None,
):
"""
Parameters
----------
irreps_in: e3nn.o3.Irreps
Input node feature irreps
irreps_out: e3nn.o3.Irreps
            Output node feature irreps
irreps_sh: e3nn.o3.Irreps
Edge spherical harmonic irreps
edge_attr_dim: int
Dimension of scalar edge attributes to be passed to radial_nn
radial_nn: Optional[Callable[..., torch.nn.Module]]
            Factory function for the radial network used to generate tensor product weights.
            Should be callable as `radial_nn(in_features, out_features)`.
            If `None`, then
```
functools.partial(
e3tools.nn.ScalarMLP,
hidden_features=[edge_attr_dim],
activation_layer=torch.nn.SiLU,
)
```
is used.
tensor_product: Optional[Callable[..., torch.nn.Module]]
Factory function for tensor product used to mix input node
representations with edge spherical harmonics.
            Should be callable as `tensor_product(irreps_in, irreps_sh, irreps_out)`
            and return an object with a `weight_numel` property defined.
            If `None`, then
```
functools.partial(
                e3nn.o3.FullyConnectedTensorProduct,
shared_weights=False,
internal_weights=False,
)
```
is used.
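
        Examples
        --------
        A minimal usage sketch; the irreps, node count, and edge count below
        are illustrative, not required values.

        >>> conv = Conv("8x0e + 4x1o", "8x0e + 4x1o", "1x0e + 1x1o", edge_attr_dim=16)
        >>> node_attr = torch.randn(10, conv.irreps_in.dim)
        >>> edge_index = torch.randint(0, 10, (2, 30))
        >>> edge_attr = torch.randn(30, 16)
        >>> edge_sh = o3.spherical_harmonics(conv.irreps_sh, torch.randn(30, 3), normalize=True)
        >>> conv(node_attr, edge_index, edge_attr, edge_sh).shape
        torch.Size([10, 20])

        A custom `radial_nn` factory only needs to accept
        `(in_features, out_features)` and return a module mapping
        `[E, in_features]` edge scalars to `[E, out_features]` weights
        (the hidden width here is arbitrary):

        >>> def radial_nn(in_features, out_features):
        ...     return torch.nn.Sequential(
        ...         torch.nn.Linear(in_features, 32),
        ...         torch.nn.SiLU(),
        ...         torch.nn.Linear(32, out_features),
        ...     )
        >>> conv = Conv("8x0e", "8x0e", "1x0e + 1x1o", edge_attr_dim=16, radial_nn=radial_nn)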
"""
super().__init__()
self.irreps_in = o3.Irreps(irreps_in)
self.irreps_out = o3.Irreps(irreps_out)
self.irreps_sh = o3.Irreps(irreps_sh)
if tensor_product is None:
tensor_product = functools.partial(
o3.FullyConnectedTensorProduct,
shared_weights=False,
internal_weights=False,
)
self.tp = tensor_product(irreps_in, irreps_sh, irreps_out)
if radial_nn is None:
radial_nn = functools.partial(
ScalarMLP,
hidden_features=[edge_attr_dim],
activation_layer=torch.nn.SiLU,
)
self.radial_nn = radial_nn(edge_attr_dim, self.tp.weight_numel)
def apply_per_edge(self, node_attr_src, edge_attr, edge_sh):
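        """
        Computes the message for each edge: the source node features are mixed
        with the edge spherical harmonics via the tensor product, whose weights
        are predicted from the scalar edge attributes by the radial network.
        """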
return self.tp(node_attr_src, edge_sh, self.radial_nn(edge_attr))
def forward(self, node_attr, edge_index, edge_attr, edge_sh):
"""
Computes the forward pass of the equivariant convolution.
        Let N be the number of nodes, and E be the number of edges.
Parameters
----------
node_attr: [N, irreps_in.dim]
edge_index: [2, E]
edge_attr: [E, edge_attr_dim]
edge_sh: [E, irreps_sh.dim]
Returns
-------
out: [N, irreps_out.dim]
"""
N = node_attr.shape[0]
src, dst = edge_index
out_ij = self.apply_per_edge(node_attr[src], edge_attr, edge_sh)
out = scatter(out_ij, dst, dim=0, dim_size=N, reduce="mean")
return out
class SeparableConv(Conv):
"""
Equivariant convolution layer using separable tensor product
ref: https://arxiv.org/abs/1802.08219
ref: https://arxiv.org/abs/2206.11990
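
    Accepts the same arguments as `Conv`, except that `tensor_product` is
    fixed to `SeparableTensorProduct`.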
"""
def __init__(self, *args, **kwargs):
super().__init__(
*args,
**kwargs,
tensor_product=SeparableTensorProduct,
)
class ExperimentalConv(Conv):
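    """
    Equivariant convolution layer using `ExperimentalTensorProduct`.

    Accepts the same arguments as `Conv`, except that `tensor_product` is
    fixed to `ExperimentalTensorProduct`.
    """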
def __init__(self, *args, **kwargs):
super().__init__(
*args,
**kwargs,
tensor_product=ExperimentalTensorProduct,
)
class ConvBlock(torch.nn.Module):
"""
Equivariant convolution with gated non-linearity and linear self-interaction
"""
def __init__(
self,
irreps_in: Union[str, e3nn.o3.Irreps],
irreps_out: Union[str, e3nn.o3.Irreps],
irreps_sh: Union[str, e3nn.o3.Irreps],
edge_attr_dim: int,
act: Optional[Mapping[int, torch.nn.Module]] = None,
act_gates: Optional[Mapping[int, torch.nn.Module]] = None,
conv: Optional[Callable[..., torch.nn.Module]] = None,
):
"""
Parameters
----------
irreps_in: e3nn.o3.Irreps
Input node feature irreps
irreps_out: e3nn.o3.Irreps
            Output node feature irreps
irreps_sh: e3nn.o3.Irreps
Edge spherical harmonic irreps
edge_attr_dim: int
Dimension of scalar edge attributes to be passed to radial_nn
        act: Mapping[int, torch.nn.Module]
            Mapping from parity to activation module.
            If `None`, defaults to `{1: torch.nn.LeakyReLU(), -1: torch.nn.Tanh()}`
        act_gates: Mapping[int, torch.nn.Module]
            Mapping from parity to activation module for the gate scalars.
            If `None`, defaults to `{1: torch.nn.Sigmoid(), -1: torch.nn.Tanh()}`
        conv: Optional[Callable[..., torch.nn.Module]]
            Factory function for the convolution layer.
            If `None`, defaults to `Conv`.
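
        Examples
        --------
        A minimal usage sketch; the irreps and sizes below are illustrative.

        >>> block = ConvBlock("8x0e + 4x1o", "8x0e + 4x1o", "1x0e + 1x1o", edge_attr_dim=16)
        >>> node_attr = torch.randn(10, block.irreps_in.dim)
        >>> edge_index = torch.randint(0, 10, (2, 30))
        >>> edge_attr = torch.randn(30, 16)
        >>> edge_sh = o3.spherical_harmonics(block.irreps_sh, torch.randn(30, 3), normalize=True)
        >>> block(node_attr, edge_index, edge_attr, edge_sh).shape
        torch.Size([10, 20])

        Activations may be overridden per parity:

        >>> block = ConvBlock(
        ...     "8x0e", "8x0e", "1x0e + 1x1o", edge_attr_dim=16,
        ...     act={1: torch.nn.SiLU(), -1: torch.nn.Tanh()},
        ... )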
"""
super().__init__()
self.irreps_in = o3.Irreps(irreps_in)
self.irreps_out = o3.Irreps(irreps_out)
self.irreps_sh = o3.Irreps(irreps_sh)
if conv is None:
conv = Conv
wrapped_conv = functools.partial(
conv, irreps_sh=irreps_sh, edge_attr_dim=edge_attr_dim
)
self.gated_conv = LinearSelfInteraction(
Gated(
wrapped_conv,
irreps_in=self.irreps_in,
irreps_out=self.irreps_out,
act=act,
act_gates=act_gates,
)
)
def forward(self, node_attr, edge_index, edge_attr, edge_sh):
"""
        Computes the forward pass of the equivariant convolution block.
        Let N be the number of nodes, and E be the number of edges.
Parameters
----------
node_attr: [N, irreps_in.dim]
edge_index: [2, E]
edge_attr: [E, edge_attr_dim]
edge_sh: [E, irreps_sh.dim]
Returns
-------
out: [N, irreps_out.dim]
"""
return self.gated_conv(node_attr, edge_index, edge_attr, edge_sh)