Add Averaging Neural Operator with tests and a tutorial (#230)

* add Averaging Neural Operator with tests * add backward test * minor changes * doc addition --------- Co-authored-by: Dario Coscia <dariocoscia@Dario-Coscia.local>
2024-03-05 12:30:53 +01:00
parent b10e02103b
commit 43f69242ab
8 changed files with 254 additions and 1 deletions
--- a/docs/source/_rst/_code.rst
+++ b/docs/source/_rst/_code.rst
@@ -56,6 +56,7 @@ Models
    MIONet <models/mionet.rst>
    FourierIntegralKernel <models/fourier_kernel.rst>
    FNO <models/fno.rst>
    AveragingNeuralOperator <models/avno.rst>
 Layers
 -------------
@@ -67,10 +68,10 @@ Layers
    EnhancedLinear layer <layers/enhanced_linear.rst>
    Spectral convolution <layers/spectral.rst>
    Fourier layers <layers/fourier.rst>
    Averaging layer <layers/avno_layer.rst>
    Continuous convolution <layers/convolution.rst>
    Proper Orthogonal Decomposition <layers/pod.rst>
    Periodic Boundary Condition embeddings <layers/embedding.rst>
 Equations and Operators
 -------------------------
--- a/docs/source/_rst/layers/avno_layer.rst
+++ b/docs/source/_rst/layers/avno_layer.rst
@@ -0,0 +1,8 @@
 Averaging layers
 ====================
 .. currentmodule:: pina.model.layers.avno_layer
 .. autoclass:: AVNOBlock
    :members:
    :show-inheritance:
    :noindex:
--- a/docs/source/_rst/models/avno.rst
+++ b/docs/source/_rst/models/avno.rst
@@ -0,0 +1,7 @@
 Averaging Neural Operator
 ==============================
 .. currentmodule:: pina.model.avno
 .. autoclass:: AveragingNeuralOperator
   :members:
   :show-inheritance:
--- a/pina/model/__init__.py
+++ b/pina/model/__init__.py
@@ -7,6 +7,7 @@ __all__ = [
    "FNO",
    "FourierIntegralKernel",
    "KernelNeuralOperator",
    "AveragingNeuralOperator",
 ]
 from .feed_forward import FeedForward, ResidualFeedForward
@@ -14,3 +15,4 @@ from .multi_feed_forward import MultiFeedForward
 from .deeponet import DeepONet, MIONet
 from .fno import FNO, FourierIntegralKernel
 from .base_no import KernelNeuralOperator
 from .avno import AveragingNeuralOperator
--- a/pina/model/avno.py
+++ b/pina/model/avno.py
@@ -0,0 +1,104 @@
 """Module Averaging Neural Operator."""
 from torch import nn, concatenate
 from . import FeedForward
 from .layers import AVNOBlock
 from .base_no import KernelNeuralOperator
 from pina.utils import check_consistency
 class AveragingNeuralOperator(KernelNeuralOperator):
    """
    Implementation of Averaging Neural Operator.

    Averaging Neural Operator is a general architecture for
    learning Operators. Unlike traditional machine learning methods
    AveragingNeuralOperator is designed to map entire functions
    to other functions. It can be trained with Supervised learning strategies.
    AveragingNeuralOperator does convolution by performing a field average.

    The model is assembled from three sub-networks handed to
    :class:`KernelNeuralOperator`: a lifting ``FeedForward``, a sequence of
    ``n_layers`` :class:`AVNOBlock` layers, and a projection ``FeedForward``.

    .. seealso::

        **Original reference**: Lanthaler, S., Li, Z., Kovachki,
        Stuart, A. (2023). *The Nonlocal Neural Operator:
        Universal Approximation*.
        DOI: `arXiv preprint arXiv:2304.13221.
        <https://arxiv.org/abs/2304.13221>`_
    """

    def __init__(
        self,
        input_numb_fields,
        output_numb_fields,
        field_indices,
        coordinates_indices,
        dimension=3,
        inner_size=100,
        n_layers=4,
        func=nn.GELU,
    ):
        """
        :param int input_numb_fields: The number of input components
            of the model.
        :param int output_numb_fields: The number of output components
            of the model.
        :param list[str] field_indices: the label of the fields
            in the input tensor.
        :param list[str] coordinates_indices: the label of the
            coordinates in the input tensor.
        :param int dimension: the dimension of the domain of the functions.
            The lifting network is built with input size
            ``dimension + input_numb_fields``, so the columns selected by
            ``coordinates_indices`` and ``field_indices`` must add up to it.
            Defaults to 3.
        :param int inner_size: number of neurons in the hidden layer(s).
            Defaults to 100.
        :param int n_layers: number of hidden layers. Default is 4.
        :param func: the activation function to use. Default to nn.GELU.
        """
        # Validate every argument before building any sub-network.
        check_consistency(input_numb_fields, int)
        check_consistency(output_numb_fields, int)
        check_consistency(field_indices, str)
        check_consistency(coordinates_indices, str)
        check_consistency(dimension, int)
        check_consistency(inner_size, int)
        check_consistency(n_layers, int)
        check_consistency(func, nn.Module, subclass=True)

        # Lifting: (fields + coordinates) -> hidden representation.
        lifting_net = FeedForward(dimension + input_numb_fields, inner_size,
                                  inner_size, n_layers, func)
        # Kernel integration: a stack of averaging blocks on the hidden size.
        integral_net = nn.Sequential(
            *[AVNOBlock(inner_size, func) for _ in range(n_layers)])
        # Projection: the coordinates are concatenated again in ``forward``,
        # hence the ``inner_size + dimension`` input width.
        projection_net = FeedForward(inner_size + dimension, output_numb_fields,
                                     inner_size, n_layers, func)
        super().__init__(lifting_net, integral_net, projection_net)

        # Store the configuration only once the base module is initialised:
        # setting attributes on a module before its ``__init__`` has run is
        # fragile and only works for plain Python values.
        self.input_numb_fields = input_numb_fields
        self.output_numb_fields = output_numb_fields
        self.dimension = dimension
        self.coordinates_indices = coordinates_indices
        self.field_indices = field_indices

    def forward(self, x):
        r"""
        Forward computation for Averaging Neural Operator. It performs a
        lifting of the input by the ``lifting_net``. Then different layers
        of Averaging Neural Operator Blocks are applied.
        Finally the output is projected to the final dimensionality
        by the ``projection_net``.

        :param x: The input tensor for the Averaging Neural Operator. It must
            provide an ``extract`` method accepting labels (the tests use a
            ``LabelTensor``). It expects
            a tensor :math:`B \times N \times D`,
            where :math:`B` is the batch_size, :math:`N` the number of points
            in the mesh, :math:`D` the dimension of the problem, i.e. the sum
            of ``len(coordinates_indices)+len(field_indices)``.
        :return: The output tensor obtained from Average Neural Operator.
        :rtype: torch.Tensor
        """
        points_tmp = x.extract(self.coordinates_indices)
        features_tmp = x.extract(self.field_indices)
        # Fields first, then coordinates, joined along the last axis
        # (axis 2 for the documented B x N x D layout).
        new_batch = concatenate((features_tmp, points_tmp), dim=-1)
        new_batch = self._lifting_operator(new_batch)
        new_batch = self._integral_kernels(new_batch)
        # Re-attach the coordinates so the projection can depend on position.
        new_batch = concatenate((new_batch, points_tmp), dim=-1)
        new_batch = self._projection_operator(new_batch)
        return new_batch
--- a/pina/model/layers/__init__.py
+++ b/pina/model/layers/__init__.py
@@ -10,6 +10,7 @@ __all__ = [
    "FourierBlock3D",
    "PODBlock",
    "PeriodicBoundaryEmbedding",
    "AVNOBlock",
 ]
 from .convolution_2d import ContinuousConvBlock
@@ -22,3 +23,4 @@ from .spectral import (
 from .fourier import FourierBlock1D, FourierBlock2D, FourierBlock3D
 from .pod import PODBlock
 from .embedding import PeriodicBoundaryEmbedding
 from .avno_layer import AVNOBlock
--- a/pina/model/layers/avno_layer.py
+++ b/pina/model/layers/avno_layer.py
@@ -0,0 +1,67 @@
 """ Module for Averaging Neural Operator Layer class. """
 from torch import nn, mean
 from pina.utils import check_consistency
 class AVNOBlock(nn.Module):
    r"""
    The PINA implementation of the inner layer of the Averaging Neural Operator.

    The operator layer performs an affine transformation where the convolution
    is approximated with the average of the field over the mesh points.
    Given the input function
    :math:`v(x)\in\mathbb{R}^{\rm{emb}}` the layer computes
    the operator update :math:`K(v)` as:

    .. math::
        K(v) = \sigma\left(Wv(x) + b + \frac{1}{|\mathcal{A}|}\int v(y)dy\right)

    where:

    *   :math:`\mathbb{R}^{\rm{emb}}` is the embedding (hidden) size
        corresponding to the ``hidden_size`` object
    *   :math:`\sigma` is a non-linear activation, corresponding to the
        ``func`` object
    *   :math:`W\in\mathbb{R}^{\rm{emb}\times\rm{emb}}` is a tunable matrix.
    *   :math:`b\in\mathbb{R}^{\rm{emb}}` is a tunable bias.

    .. seealso::

        **Original reference**: Lanthaler, S., Li, Z., Kovachki,
        Stuart, A. (2023). *The Nonlocal Neural Operator: Universal
        Approximation*.
        DOI: `arXiv preprint arXiv:2304.13221.
        <https://arxiv.org/abs/2304.13221>`_
    """

    def __init__(self, hidden_size=100, func=nn.GELU):
        """
        :param int hidden_size: Size of the hidden layer, defaults to 100.
        :param func: The activation function class (instantiated here with
            no arguments), default to nn.GELU.
        """
        super().__init__()

        # Check type consistency
        check_consistency(hidden_size, int)
        check_consistency(func, nn.Module, subclass=True)

        # Affine part ``W v + b`` and the activation ``sigma``.
        self._nn = nn.Linear(hidden_size, hidden_size)
        self._func = func()

    def forward(self, x):
        r"""
        Forward pass of the layer, it performs a sum of the average of the
        field over the mesh points and an affine transformation of the field.

        :param torch.Tensor x: The input tensor for performing the
            computation. It expects a tensor :math:`B \times N \times D`,
            where :math:`B` is the batch_size, :math:`N` the number of points
            in the mesh, :math:`D` the dimension of the problem. In particular
            :math:`D` is the codomain of the function :math:`v`. For example
            a scalar function has :math:`D=1`, a 4-dimensional vector function
            :math:`D=4`. An unbatched :math:`N \times D` tensor is handled
            as well, since the average is taken over the second-to-last axis.
        :return: The output tensor obtained from Average Neural Operator Block.
        :rtype: torch.Tensor
        """
        # Average over the points axis (second to last); ``keepdim`` lets the
        # result broadcast against the per-point affine term.
        field_average = mean(x, dim=-2, keepdim=True)
        return self._func(self._nn(x) + field_average)
--- a/tests/test_model/test_avno.py
+++ b/tests/test_model/test_avno.py
@@ -0,0 +1,62 @@
 import torch
 from pina.model import AveragingNeuralOperator
 from pina import LabelTensor
 # Module-level default; every test visible here assigns its own local
 # ``output_numb_fields``, so this value is shadowed inside them.
 output_numb_fields = 5
 # Size of the first (batch) axis of the random inputs built by the
 # forward and backward tests.
 batch_size = 15
 def test_constructor():
    """Build the operator with the minimal and with an extended argument set."""
    n_in, n_out = 1, 1
    # Label arguments shared by both constructions.
    labels = dict(coordinates_indices=['p'], field_indices=['v'])

    # Required arguments only; everything else falls back to its default.
    AveragingNeuralOperator(n_in, n_out, **labels)

    # Same call with the optional hyper-parameters overridden.
    AveragingNeuralOperator(
        n_in,
        n_out,
        inner_size=5,
        n_layers=5,
        func=torch.nn.ReLU,
        **labels,
    )
 def test_forward():
    """Check that the forward pass returns one output field per mesh point."""
    n_fields = n_out = dim = 1
    n_points = 1000

    # Random input holding one coordinate column and one field column.
    raw = torch.rand(batch_size, n_points, n_fields + dim)
    input_ = LabelTensor(raw, ['p', 'v'])

    model = AveragingNeuralOperator(
        n_fields,
        n_out,
        dimension=dim,
        coordinates_indices=['p'],
        field_indices=['v'],
    )
    prediction = model(input_)

    expected = torch.Size([batch_size, input_.shape[1], n_out])
    assert prediction.shape == expected
 def test_backward():
    """Check that gradients reach the input with the input's own shape."""
    n_fields = dim = n_out = 1
    width = dim + n_fields

    # Input that tracks gradients: one coordinate and one field column.
    input_ = LabelTensor(torch.rand(batch_size, 1000, width), ['p', 'v'])
    input_ = input_.requires_grad_()

    model = AveragingNeuralOperator(
        n_fields,
        n_out,
        dimension=dim,
        coordinates_indices=['p'],
        field_indices=['v'],
    )

    # Reduce the output to a scalar so ``backward`` can be called directly.
    scalar = torch.linalg.norm(model(input_))
    scalar.backward()

    expected = torch.Size([batch_size, input_.shape[1], width])
    assert input_.grad.shape == expected