Update paper.md (#134)
* update paper.md and paper.bib
* correct modulus reference

---------

Co-authored-by: Anna Ivagnes <s274001@studenti.polito.it>
Co-authored-by: Dario Coscia <93731561+dario-coscia@users.noreply.github.com>
@@ -10,6 +10,13 @@
publisher={Now Publishers, Inc.}
}

@misc{modulussym,
title = {{NVIDIA Modulus}},
howpublished = {\url{https://github.com/NVIDIA/modulus}},
year = {2023},
note = {[Online; accessed 27-April-2023]}
}

@article{Wang_2005,
doi = {10.1088/0964-1726/14/1/011},
url = {https://dx.doi.org/10.1088/0964-1726/14/1/011},
@@ -40,19 +47,19 @@ abstract = {We introduce physics-informed neural networks – neural networks th

@misc{pinns,
doi = {10.48550/ARXIV.2201.05624},
url = {https://arxiv.org/abs/2201.05624},
author = {Cuomo, Salvatore and di Cola, Vincenzo Schiano and Giampaolo, Fabio and Rozza, Gianluigi and Raissi, Maziar and Piccialli, Francesco},
keywords = {Machine Learning (cs.LG), Artificial Intelligence (cs.AI), Numerical Analysis (math.NA), Data Analysis, Statistics and Probability (physics.data-an), FOS: Computer and information sciences, FOS: Mathematics, FOS: Physical sciences},
title = {Scientific Machine Learning through Physics-Informed Neural Networks: Where we are and What's next},
publisher = {arXiv},
year = {2022},
copyright = {arXiv.org perpetual, non-exclusive license}
}

@@ -138,41 +145,41 @@ abstract = {In this work we investigate the possibility of using physics-informe

@misc{Markidis,
doi = {10.48550/ARXIV.2103.09655},
url = {https://arxiv.org/abs/2103.09655},
author = {Markidis, Stefano},
keywords = {Numerical Analysis (math.NA), Distributed, Parallel, and Cluster Computing (cs.DC), Computational Physics (physics.comp-ph), FOS: Mathematics, FOS: Computer and information sciences, FOS: Physical sciences},
title = {The Old and the New: Can Physics-Informed Deep-Learning Replace Traditional Linear Solvers?},
publisher = {arXiv},
year = {2021},
copyright = {arXiv.org perpetual, non-exclusive license}
}

@article{Kharazmi_2021,
doi = {10.1016/j.cma.2020.113547},
url = {https://doi.org/10.1016/j.cma.2020.113547},
year = {2021},
month = {feb},
publisher = {Elsevier {BV}},
volume = {374},
pages = {113547},
author = {Ehsan Kharazmi and Zhongqiang Zhang and George E.M. Karniadakis},
title = {hp-{VPINNs}: Variational physics-informed neural networks with domain decomposition},
journal = {Computer Methods in Applied Mechanics and Engineering}
}

@@ -192,54 +199,54 @@ abstract = {Fatigue life of a wind turbine main bearing is drastically affected

@misc{strazdemo,
doi = {10.48550/ARXIV.2110.13530},
url = {https://arxiv.org/abs/2110.13530},
author = {Demo, Nicola and Strazzullo, Maria and Rozza, Gianluigi},
keywords = {Machine Learning (cs.LG), Numerical Analysis (math.NA), FOS: Computer and information sciences, FOS: Mathematics},
title = {An extended physics informed neural network for preliminary analysis of parametric optimal control problems},
publisher = {arXiv},
year = {2021},
copyright = {arXiv.org perpetual, non-exclusive license}
}

@misc{adam,
doi = {10.48550/ARXIV.1412.6980},
url = {https://arxiv.org/abs/1412.6980},
author = {Kingma, Diederik P. and Ba, Jimmy},
keywords = {Machine Learning (cs.LG), FOS: Computer and information sciences},
title = {Adam: A Method for Stochastic Optimization},
publisher = {arXiv},
year = {2014},
copyright = {arXiv.org perpetual, non-exclusive license}
}

@misc{ccnn,
doi = {10.48550/ARXIV.2210.13416},
url = {https://arxiv.org/abs/2210.13416},
author = {Coscia, Dario and Meneghetti, Laura and Demo, Nicola and Stabile, Giovanni and Rozza, Gianluigi},
keywords = {Machine Learning (cs.LG), Numerical Analysis (math.NA), FOS: Computer and information sciences, FOS: Mathematics},
title = {A Continuous Convolutional Trainable Filter for Modelling Unstructured Data},
publisher = {arXiv},
year = {2022},
copyright = {Creative Commons Attribution 4.0 International}
}

@@ -6,7 +6,7 @@ tags:
- physics-informed neural networks
- scientific machine learning
- differential equations
authors:
- name: Dario Coscia
  orcid: 0000-0001-8833-6833
  equal-contrib: true
@@ -35,19 +35,19 @@ Artificial Intelligence (AI) strategies are massively emerging in several fields
However, the amount of data required to analyze complex systems is often insufficient to make AI predictions reliable and robust. Physics-informed neural networks (PINNs) have been formulated [@RAISSI2019686] to overcome the issue of missing data by incorporating physical knowledge into the neural network training. Thus, PINNs aim to approximate any differential equation by solving a minimization problem in an unsupervised learning setting, learning the unknown field so as to preserve the imposed constraints (boundary conditions and physical residuals). Formally, we consider the general form of a differential equation, which typically presents the most challenging issues from a numerical point of view:
\begin{equation}
\begin{split}
\mathcal{F}(\pmb{u}(\pmb{z});\alpha)&=\pmb{f}(\pmb{z}) \quad \pmb{z} \in \Omega,\\
\mathcal{B}(\pmb{u}(\pmb{z}))&=\pmb{g}(\pmb{z}) \quad \pmb{z} \in \partial\Omega,
\end{split}
\end{equation}
where $\Omega\subset\mathbb{R}^d$ is the domain and $\partial\Omega$ its boundary. In particular, $\pmb{z}$ indicates the spatio-temporal coordinate vector, $\pmb{u}$ the unknown field, $\alpha$ the physical parameters, $\pmb{f}$ the forcing term, and $\mathcal{F}$ the differential operator. In addition, $\mathcal{B}$ identifies the operator imposing arbitrary initial or boundary conditions, and $\pmb{g}$ the boundary function. The PINN's objective is to find a solution to the problem, which is done by approximating the true solution $\pmb{u}$ with a neural network $\hat{\pmb{u}}_{\theta} : \Omega \rightarrow \mathbb{R}$, where $\theta$ are the network's parameters. Such a model is trained to find the optimal parameters $\theta^*$ that minimize the physical loss function, composed of the physical conditions $\mathcal{L}_{\mathcal{F}}$, the boundary conditions $\mathcal{L}_{\mathcal{B}}$ and, if available, real data $\mathcal{L}_{\textrm{data}}$:

\begin{equation}
\theta^* = \underset{\theta}{\mathrm{argmin}} \, \mathcal{L} =
\underset{\theta}{\mathrm{argmin}} \, (\mathcal{L}_{\mathcal{F}} + \mathcal{L}_{\mathcal{B}} + \mathcal{L}_{\text{data}}).
\end{equation}

The PINNs framework is completely general and applicable to different types of ordinary differential equations (ODEs) or partial differential equations (PDEs). Nevertheless, the loss function strictly depends on the problem being solved, since different operators or boundary conditions lead to different losses, increasing the difficulty of writing general and portable code for different problems.
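To make the minimization problem above concrete, the following is a minimal sketch of a PINN loss written in plain PyTorch for the 1D Poisson problem $-u''(x) = \pi^2 \sin(\pi x)$ on $\Omega = (0, 1)$ with homogeneous Dirichlet conditions. The problem choice, network architecture, and sampling strategy are illustrative assumptions and do not reflect PINA's own API:

```python
import torch

# Small fully connected network approximating u(x).
net = torch.nn.Sequential(
    torch.nn.Linear(1, 20), torch.nn.Tanh(),
    torch.nn.Linear(20, 20), torch.nn.Tanh(),
    torch.nn.Linear(20, 1),
)

def pinn_loss(net, n_pts=128):
    # Interior collocation points, tracked for automatic differentiation.
    x = torch.rand(n_pts, 1, requires_grad=True)
    u = net(x)
    # First and second derivatives of u via autograd.
    du = torch.autograd.grad(u, x, torch.ones_like(u), create_graph=True)[0]
    d2u = torch.autograd.grad(du, x, torch.ones_like(du), create_graph=True)[0]
    f = torch.pi**2 * torch.sin(torch.pi * x)    # forcing term, exact u = sin(pi x)
    residual = -d2u - f                          # L_F: physical residual
    u_bound = net(torch.tensor([[0.0], [1.0]]))  # L_B: u(0) = u(1) = 0
    return residual.pow(2).mean() + u_bound.pow(2).mean()

optimizer = torch.optim.Adam(net.parameters(), lr=1e-3)
for epoch in range(5000):
    optimizer.zero_grad()
    loss = pinn_loss(net)
    loss.backward()
    optimizer.step()
```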
@@ -56,19 +56,21 @@ The PINNs framework is completely general and applicable to different types of o
# Statement of need
PINA is an open-source Python library that provides an intuitive interface for the approximate resolution of ordinary differential equations and partial differential equations using a deep learning paradigm, in particular via PINNs.
The growing popularity of PINNs in recent years, together with the evolution of open-source frameworks such as TensorFlow, Keras, and PyTorch, has led to the development of several libraries whose focus is the exploitation of PINNs to approximately solve ODEs and PDEs.
We mention here some PyTorch-based libraries, \verb+NeuroDiffEq+ [@chen2020neurodiffeq], \verb+IDRLNet+ [@peng2021idrlnet], NVIDIA \verb+Modulus+ [@modulussym], and some TensorFlow-based libraries, such as \verb+DeepXDE+ [@lu2021deepxde], \verb+TensorDiffEq+ [@mcclenny2021tensordiffeq], \verb+SciANN+ [@haghighat2021sciann] (which is both TensorFlow and Keras-based), \verb+PyDEns+ [@koryagin2019pydens], \verb+Elvet+ [@araz2021elvet], and \verb+NVIDIA SimNet+ [@hennigh2021nvidia].
Among all these frameworks, PINA aims to stand out for its ease of use, allowing users to quickly formulate the problem at hand and solve it, resulting in an intuitive framework designed by researchers for researchers.

Built over PyTorch --- in order to inherit the \verb+autograd+ module and all the other features already implemented in this framework --- PINA provides a documented API explaining the usage and capabilities of the different classes. We have built several abstract interfaces, not only to better structure the source code, but especially to give the final user an easy entry point for implementing their own extensions, like new loss functions, new training procedures, and so on. This aspect, together with the capability to use any PyTorch model, makes it possible to incorporate almost any existing architecture into the PINA framework. The final outcome is a library with incremental complexity, usable by new users to perform a first investigation with PINNs, but also as a core framework to actively develop new features that improve the discussed methodology.

The high-level structure of the package is illustrated in Figure \ref{API_visual}; the approximated solution of a differential equation can be implemented using PINA in a few lines of code thanks to the intuitive and user-friendly interface.
Besides the user-friendly interface, PINA also offers several examples and tutorials, aiming to guide new users toward an easy exploration of the software features. The online documentation is released at \url{https://mathlab.github.io/PINA/}, while the robustness of the package is continuously monitored by unit tests.

The API visualization in Figure \ref{API_visual} shows that a complete workflow in PINA is characterized by 3 main steps: the problem formulation, the model definition, i.e. the structure of the neural network used, and the training, eventually followed by the data visualization.

![The high-level structure of the PINA package.\label{API_visual}]{ width=70% }

## Problem definition in PINA
The first step is the formalization of the problem.
The problem definition in the PINA framework is inherited from one or more problem classes (at the moment the available classes are \verb+SpatialProblem+, \verb+TimeDependentProblem+, \verb+ParametricProblem+), depending on the nature of the problem treated.
The user has to include in the problem formulation the following components:
\begin{itemize}
@@ -76,11 +78,16 @@ The user has to include in the problem formulation the following components:
\item the output variables, i.e. the unknowns of the problem;
\item the conditions that the neural network has to satisfy, i.e. the differential equations, the boundary and initial conditions.
\end{itemize}
We highlight that in PINA we abandoned the classical division between physical loss, boundary loss, and data loss: all these terms are encapsulated within the \verb+Condition+ class, in order to keep the framework as general as possible. The users can indeed define all the constraints the unknown field needs to satisfy, avoiding any forced structure in the formulation and allowing them to mix heterogeneous constraints --- e.g. data values, differential boundary conditions. Moreover, PINA already implements functions to easily compute the differential operators (gradient, divergence, Laplacian) over the output(s) of interest, aiming to make the problem definition an easy task for the users. A schematic example of such a problem definition is sketched below.

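As a rough sketch of what such a formulation can look like, the snippet below defines a toy Poisson problem. The \verb+SpatialProblem+, \verb+Condition+, and \verb+laplacian+ names are those discussed above, while the module paths, the \verb+Span+ domain helper, and the exact signatures are assumptions that may differ between PINA releases:

```python
# Sketch of a problem definition. Class and operator names follow the text;
# module paths, the Span helper, and signatures are assumptions that may
# differ between PINA releases.
from pina import Condition, Span
from pina.problem import SpatialProblem
from pina.operators import laplacian


class Poisson(SpatialProblem):
    output_variables = ['u']                           # the unknown field
    spatial_domain = Span({'x': [0, 1], 'y': [0, 1]})

    def laplace_equation(input_, output_):
        # Physical residual of the equation nabla^2 u = 1.
        return laplacian(output_, input_, components=['u']) - 1.0

    def nil_dirichlet(input_, output_):
        # Boundary residual enforcing u = 0.
        return output_.extract(['u'])

    # Heterogeneous constraints are all expressed as Condition objects;
    # a complete example would add one condition per boundary edge.
    conditions = {
        'gamma_top': Condition(Span({'x': [0, 1], 'y': 1}), nil_dirichlet),
        'domain': Condition(Span({'x': [0, 1], 'y': [0, 1]}), laplace_equation),
    }
```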
## Model definition in PINA
The second fundamental step is the definition of the model of the neural network employed to find the approximated solution to the differential problem in question.
In PINA, the user can either use a custom \verb+torch+ network model or exploit one of the built-in models such as \verb+FeedForward+, \verb+MultiFeedForward+ and \verb+DeepONet+, defining their characteristics during instantiation --- i.e. number of layers, number of neurons, activation functions. The list of built-in models will be extended in the next release of the library.

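A built-in model can then be instantiated along the following lines; the module path and keyword names are assumptions based on the characteristics listed above (layers, neurons, activation functions), not a verbatim signature:

```python
import torch
from pina.model import FeedForward  # module path assumed

# Feed-forward network mapping the spatial coordinates (x, y) to the
# unknown field u; keyword names are illustrative, not a verbatim signature.
model = FeedForward(
    input_variables=['x', 'y'],
    output_variables=['u'],
    layers=[20, 20, 20],   # three hidden layers of 20 neurons each
    func=torch.nn.Tanh,    # activation function
)
```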
## Training in PINA
In the last step, the actual training of the model to solve the problem at hand is performed. In this phase, the residuals of the conditions (expressed in the problem) are minimized in order to provide the target approximation. The sampling points where the physical residuals are evaluated can be passed by the user, or automatically sampled from the original domain using one of the available sampling techniques.
The training then runs for a certain number of epochs, or until the user-defined loss threshold is reached.
Once trained, the model can be saved to a binary file for future reuse, inheriting this functionality from PyTorch. The user can also evaluate the trained model on any new input, or use it together with the \verb+Plotter+ class to render the predicted output variables, as sketched below.

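Putting the three steps together, a complete workflow reads roughly as follows. The \verb+PINN+ solver and \verb+Plotter+ correspond to the classes mentioned above, while the sampling and training method names and their arguments are illustrative assumptions:

```python
from pina import PINN, Plotter  # module paths assumed

# Solver wrapping the problem and model sketched above.
pinn = PINN(Poisson(), model, lr=0.001)

# Sample collocation points over the conditions, then train; method
# names and arguments are illustrative assumptions.
pinn.span_pts(1000, 'random', locations=['domain', 'gamma_top'])
pinn.train(5000)

# Render the predicted output variables.
plotter = Plotter()
plotter.plot(pinn)
```
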
# Acknowledgements