

class EnEquivariantNetworkBlock(MessagePassing):
+    """
+    Implementation of the E(n) Equivariant Graph Neural Network block.
+
+    This block performs message passing between nodes and edges in a graph
+    neural network, following the scheme proposed by Satorras et al. in
+    2021. It serves as an inner block in a larger graph neural network
+    architecture.
+
+    The message between two nodes connected by an edge is computed by
+    passing the sender and recipient node features, the edge features, and
+    the squared Euclidean distance between the sender and recipient node
+    positions through a feed-forward network with a non-linear activation
+    function. Messages are then aggregated using an aggregation scheme
+    (e.g., sum, mean, min, max, or product).
+
+    The update step applies another MLP to the concatenation of the
+    incoming messages and the node features. The node positions are also
+    updated, by adding the incoming messages divided by the degree of the
+    recipient node.
+
+    .. seealso::
+
+        **Original reference** Satorras, V. G., Hoogeboom, E., Welling, M.
+        (2021). *E(n) Equivariant Graph Neural Networks.*
+        In International Conference on Machine Learning.
+        DOI: `<https://doi.org/10.48550/arXiv.2102.09844>`_.
+    """
+
    def __init__(
        self,
        node_feature_dim,
@@ -21,15 +44,49 @@ def __init__(
        node_dim=-2,
        flow="source_to_target",
    ):
+        """
+        Initialization of the :class:`EnEquivariantNetworkBlock` class.
+
+        :param int node_feature_dim: The dimension of the node features.
+        :param int edge_feature_dim: The dimension of the edge features.
+        :param int pos_dim: The dimension of the position features.
+        :param int hidden_dim: The dimension of the hidden features.
+            Default is 64.
+        :param int n_message_layers: The number of layers in the message
+            network. Default is 2.
+        :param int n_update_layers: The number of layers in the update
+            network. Default is 2.
+        :param torch.nn.Module activation: The activation function.
+            Default is :class:`torch.nn.SiLU`.
+        :param str aggr: The aggregation scheme to use for message passing.
+            Available options are "add", "mean", "min", "max", "mul".
+            See :class:`torch_geometric.nn.MessagePassing` for more details.
+            Default is "add".
+        :param int node_dim: The axis along which to propagate. Default is -2.
+        :param str flow: The direction of message passing. Available options
+            are "source_to_target" and "target_to_source". The
+            "source_to_target" flow means that messages are sent from the
+            source node to the target node, and vice versa for
+            "target_to_source". See :class:`torch_geometric.nn.MessagePassing`
+            for more details. Default is "source_to_target".
+        :raises AssertionError: If `node_feature_dim` is not a positive
+            integer.
+        :raises AssertionError: If `edge_feature_dim` is a negative integer.
+        :raises AssertionError: If `pos_dim` is not a positive integer.
+        :raises AssertionError: If `hidden_dim` is not a positive integer.
+        :raises AssertionError: If `n_message_layers` is not a positive
+            integer.
+        :raises AssertionError: If `n_update_layers` is not a positive
+            integer.
+        """
        super().__init__(aggr=aggr, node_dim=node_dim, flow=flow)

+        # Check values
        check_positive_integer(node_feature_dim, strict=True)
        check_positive_integer(edge_feature_dim, strict=False)
        check_positive_integer(pos_dim, strict=True)
        check_positive_integer(hidden_dim, strict=True)
        check_positive_integer(n_message_layers, strict=True)
        check_positive_integer(n_update_layers, strict=True)

+        # Layer for computing the message
        self.message_net = FeedForward(
            input_dimensions=2 * node_feature_dim + edge_feature_dim + 1,
            output_dimensions=pos_dim,
@@ -38,6 +95,7 @@ def __init__(
            func=activation,
        )

+        # Layer for updating the node features
        self.update_feat_net = FeedForward(
            input_dimensions=node_feature_dim + pos_dim,
            output_dimensions=node_feature_dim,
@@ -46,6 +104,8 @@ def __init__(
            func=activation,
        )

+        # Layer for updating the node positions
+        # The output dimension is set to 1 for equivariant updates
        self.update_pos_net = FeedForward(
            input_dimensions=pos_dim,
            output_dimensions=1,
@@ -87,18 +147,21 @@ def message(self, x_i, x_j, pos_i, pos_j, edge_attr):
        :param edge_attr: The edge attributes.
        :type edge_attr: torch.Tensor | LabelTensor
        :return: The message to be passed.
-        :rtype: torch.Tensor
+        :rtype: tuple(torch.Tensor, torch.Tensor)
        """
+        # Squared Euclidean distance between sender and recipient positions
        diff = pos_i - pos_j
        dist = torch.norm(diff, dim=-1, keepdim=True) ** 2

+        # Compute the message input
        if edge_attr is None:
            input_ = torch.cat((x_i, x_j, dist), dim=-1)
        else:
            input_ = torch.cat((x_i, x_j, dist, edge_attr), dim=-1)

-        m_ij = self.message_net(input_)  # message features
-        message = diff * self.update_pos_net(m_ij)  # equivariant message
+        # Compute the messages and their equivariant counterpart
+        m_ij = self.message_net(input_)
+        message = diff * self.update_pos_net(m_ij)

        return message, m_ij

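For reference, a sketch of the EGNN equations that `message_net` (phi_e), `update_pos_net` (phi_x), and `update_feat_net` (phi_h) implement here, adapted from Satorras et al. (2021); the normalization constant C is taken to be the inverse degree of the recipient node, per the class docstring:

\begin{align}
    m_{ij}    &= \phi_e\left(h_i^l,\, h_j^l,\, \|x_i^l - x_j^l\|^2,\, a_{ij}\right) \\
    x_i^{l+1} &= x_i^l + C \sum_{j \neq i} \left(x_i^l - x_j^l\right) \phi_x(m_{ij}) \\
    h_i^{l+1} &= \phi_h\Big(h_i^l,\, \sum_{j \in \mathcal{N}(i)} m_{ij}\Big)
\end{align}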
@@ -112,20 +175,20 @@ def aggregate(self, inputs, index, ptr=None, dim_size=None):

        :param tuple(torch.Tensor) inputs: Tuple containing two messages to
            aggregate.
-        :param torch.Tensor | LabelTensor index: The indices of target nodes
-            for each message. This tensor specifies which node each message
-            is aggregated into.
-        :param torch.Tensor | LabelTensor ptr: Optional tensor to specify
-            the slices of messages for each node (used in some aggregation
-            strategies).
+        :param index: The indices of target nodes for each message. This
+            tensor specifies which node each message is aggregated into.
+        :type index: torch.Tensor | LabelTensor
+        :param ptr: Optional tensor to specify the slices of messages for
+            each node (used in some aggregation strategies). Default is None.
+        :type ptr: torch.Tensor | LabelTensor
        :param int dim_size: Optional size of the output dimension, i.e.,
-            number of nodes.
-        :return: Tuple of aggregated tensors corresponding to
-            (aggregated messages for position updates, aggregated messages for
-            feature updates).
+            number of nodes. Default is None.
+        :return: Tuple of aggregated tensors corresponding to (aggregated
+            messages for position updates, aggregated messages for feature
+            updates).
        :rtype: tuple(torch.Tensor, torch.Tensor)
        """
-        # inputs is tuple (message, m_ij), we want to aggregate separately
+        # Unpack the messages from the inputs
        message, m_ij = inputs

        # Aggregate messages as usual using self.aggr method
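To make the block's intended use concrete, a minimal usage sketch follows. The commit shows only `__init__`, `message`, and `aggregate`, so the import path and the forward call below are assumptions for illustration, not part of this diff:

import torch

# Hypothetical import path -- the module location is not shown in the commit.
from pina.model.block import EnEquivariantNetworkBlock

# Block for 3D positions and 16 node features; edge_feature_dim=0 is valid
# since its check is non-strict, and message() accepts edge_attr=None.
block = EnEquivariantNetworkBlock(
    node_feature_dim=16,
    edge_feature_dim=0,
    pos_dim=3,
)

# Toy graph: 4 nodes on a directed cycle.
x = torch.rand(4, 16)                     # node features
pos = torch.rand(4, 3)                    # node positions
edge_index = torch.tensor([[0, 1, 2, 3],  # sender indices
                           [1, 2, 3, 0]])  # recipient indices

# Assumed forward signature; forward() does not appear in this diff.
updated_x, updated_pos = block(x=x, pos=pos, edge_index=edge_index)

Under a rotation or translation of `pos`, only the returned positions transform accordingly; the updated node features are E(n)-invariant.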