<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2024.1309775</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Marine Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>DF-ParPINN: parallel PINN based on velocity potential field division and single time slice focus</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Chen</surname>
<given-names>Jingjian</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2168135"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Yuan</surname>
<given-names>Chunxin</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2025026"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Xu</surname>
<given-names>Jiali</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bie</surname>
<given-names>Pengfei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wei</surname>
<given-names>Zhiqiang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>College of Information Science and Engineering, Ocean University of China</institution>, <addr-line>Qingdao</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>College of Mathematical Sciences, Ocean University of China</institution>, <addr-line>Qingdao</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Ocean Observation and Exploration Research, Laoshan Laboratory</institution>, <addr-line>Qingdao</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: An-An Liu, Tianjin University, China</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Shiqiang Yan, City University of London, United Kingdom</p>
<p>Xinwei Fu, Tianjin University, China</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Jiali Xu, <email xlink:href="mailto:jlxu@qnlm.ac">jlxu@qnlm.ac</email>
</p>
</fn>
<fn fn-type="equal" id="fn003">
<p>&#x2020;These authors have contributed equally to this work and share first authorship</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>14</day>
<month>03</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>11</volume>
<elocation-id>1309775</elocation-id>
<history>
<date date-type="received">
<day>08</day>
<month>10</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>24</day>
<month>01</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Chen, Yuan, Xu, Bie and Wei</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Chen, Yuan, Xu, Bie and Wei</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Modified Benney-Luke equation (mBL equation) is a three-dimensional temporal-spatial equation with complex structures, that is a high-dimensional partial differential equation (PDE), it is also a new equation of the physical ocean field, and its solution is important for studying the internal wave-wave interaction of inclined seafloor. For conventional PDE solvers such as the pseudo-spectral method, it is difficult to solve mBL equation with both accuracy and speed. Physics-informed neural network (PINN) incorporates physical prior knowledge in deep neural networks, which can solve PDE with relative accuracy and speed. However, PINN is only suitable for solving low-dimensional PDE with simple structures, and not suitable for solving high-dimensional PDE with complex structures. This is mainly because high-dimensional PDEs usually have complex structures and high-order derivatives and are likely to be high-dimensional non-convex functions, and the high-dimensional non-convex optimization problem is an NP-hard problem, resulting in the PINN easily falling into inaccurate local optimal solutions when solving high-dimensional PDEs. Therefore, we improve the PINN for the characteristics of mBL equation and propose &#x201c;DF-ParPINN: parallel PINN based on velocity potential field division and single time slice focus&#x201d; to solve mBL equation with large amounts of data. DF-ParPINN consists of three modules: temporal-spatial division module of overall velocity potential field, data rational selection module of multiple time slices, and parallel computation module of high-velocity fields and low-velocity fields. The experimental results show that the solution time of DF-ParPINN is no more than 0.5s, and its accuracy is much higher than that of PINN, PIRNN, cPINN, and DeepONet. Moreover, the relative error of DF-ParPINN after deep training 1000000 epochs can be reduced to less than 0.1. The validity of DF-ParPINN proves that the improved PINN also can solve high dimensional PDE with complex structures and large amounts of data quickly and accurately, which is of great significance to the deep learning of the physical ocean field.</p>
</abstract>
<kwd-group>
<kwd>mBL equation</kwd>
<kwd>PINN</kwd>
<kwd>DF-ParPINN</kwd>
<kwd>temporal-spatial division</kwd>
<kwd>data rational selection</kwd>
<kwd>parallel computation</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="14"/>
<equation-count count="19"/>
<ref-count count="29"/>
<page-count count="17"/>
<word-count count="11018"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Ocean Observation</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>With the rapid development of computer technology, scientific computation has become the third scientific method that can be juxtaposed with theory and experiments (<xref ref-type="bibr" rid="B23">Shi, 2001</xref>; <xref ref-type="bibr" rid="B10">Lu and Guan, 2004</xref>). Solving various partial differential equations (PDE) numerically is an important part of scientific computation (<xref ref-type="bibr" rid="B15">Ockendon et&#xa0;al., 2003</xref>), which is of great significance in promoting the development of related fields. Many physical processes, such as nuclear explosion and fluid flow, can be described by PDE. However, solving PDE through theoretical analysis is very complicated and time-consuming, and it is faced with unsolvable dilemmas (<xref ref-type="bibr" rid="B21">Science, 2016</xref>). It is usually faster to obtain the numerical approximate solution of PDE by scientific computation, and the solution model based on computer science and technology can be continuously optimized, which liberates human participation in the theoretical solution.</p>
<p>Traditional numerical methods mainly include the finite difference method, finite element method, and finite volume method (<xref ref-type="bibr" rid="B3">Chen et&#xa0;al., 2020</xref>). These methods first discretize the computational domain into independent grid elements, and then iteratively solve the partial differential equation on the subdomain of the element to obtain the numerical approximate solution of the equation. However, to ensure the accuracy of the solution, traditional numerical methods are usually time-consuming and rely heavily on manual experience: On the one hand, iterative solving of complex PDE requires expensive computational overhead. On the other hand, to avoid calculation failure, frequent human-computer interaction is usually required to identify and optimize grid quality during grid division, to meet the requirements of prediction accuracy (<xref ref-type="bibr" rid="B7">Katz and Sankaran, 2011</xref>; <xref ref-type="bibr" rid="B1">Abel et&#xa0;al., 2013</xref>). With the increasing complexity of the PDE solving process, the high computational cost and frequent human-computer interaction limit the efficiency of traditional numerical methods in parameter optimization, space exploration, real-time simulation, and other aspects.</p>
<p>Using the traditional numerical methods for PDE, grid division and iterative solution are required, which is computationally expensive and technically difficult. The method of solving PDEs based on deep learning can not only quickly move forward and inverse  (<xref ref-type="bibr" rid="B24">Wang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B27">Xu, 2021</xref>), but also effectively solve nonlinear problems (<xref ref-type="bibr" rid="B17">Raissi et al., 2017a</xref>, <xref ref-type="bibr" rid="B18">Raissi et&#xa0;al., 2017b</xref>, <xref ref-type="bibr" rid="B19">Raissi et al., 2017c</xref>, <xref ref-type="bibr" rid="B16">Raissi and Karniadakis, 2018</xref>) and more complex and higher-dimensional PDE (<xref ref-type="bibr" rid="B25">Weinan et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B4">Han et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B14">Nabian and Meidani, 2019</xref>). Solving methods of PDE based on deep learning is overturning traditional numerical methods of PDE, leading the scientific and technological wave of &#x201c;AI for science&#x201d; (<xref ref-type="bibr" rid="B8">Le, 2022</xref>).</p>
<p>Different from the traditional neural networks, the physics-informed neural network (PINN) is a new method based on &#x201c;meshless&#x201d; calculation (<xref ref-type="bibr" rid="B20">Raissi et&#xa0;al., 2019</xref>), which fundamentally solves the differentiation problem of grid division (<xref ref-type="bibr" rid="B22">Shao et&#xa0;al., 2022</xref>). PINN uses not only the neural network&#x2019;s own loss function but also the physical information loss function with the physical equation as the restriction condition (<xref ref-type="bibr" rid="B29">Zheng et&#xa0;al., 2022</xref>). Therefore, the model trained by PINN can learn both the distribution law contained in the training data set like the traditional neural network model, and the physical law described by the partial differential equation (<xref ref-type="bibr" rid="B12">Lu et&#xa0;al., 2021</xref>). Compared with pure data-driven neural networks, PINN can learn a model with more generalization ability by fewer training data samples due to the additional physical information constraints in the training process (<xref ref-type="bibr" rid="B9">Li and Cheng, 2022</xref>). PINN uses a deep neural network (DNN) as its basic network structure, if DNN is replaced by a recurrent neural network (RNN), a new variant of PINN is formed: Physics-Informed Recurrent Neural Network (PIRNN) (<xref ref-type="bibr" rid="B26">Wu et&#xa0;al., 2023</xref>).</p>
<p>One of the main limitations of PINN is the high cost of training, which can adversely affect performance, especially when solving real-world applications that require running PINN models in real time. Therefore, it is crucial to find ways to accelerate the convergence of these models without sacrificing performance. This problem is first addressed in the conservative physics-informed neural network (cPINN) algorithm (<xref ref-type="bibr" rid="B5">Jagtap et&#xa0;al., 2020</xref>), which uses the domain division method in the PINN framework by dividing the computational domain into subdomains. cPINN deploys a separate neural network in each subdomain, and efficiently tunes hyperparameters for all networks, thus providing the network with strong parallelization and representation capabilities, and the final global solution obtained consists of a series of independent subproblems solutions associated with the entire domain.</p>
<p>In addition to introducing physical information in neural networks, neural operators are also a class of methods for deep learning to solve PDEs. While neural networks are used to learn mappings between finite-dimensional spaces, neural operators can learn mappings between infinite-dimensional spaces by introducing kernel functions into the linear transformations of the neural network. The deep operator networks (DeepONet) can solve a family of PDEs with a series of initial and boundary conditions in one go (<xref ref-type="bibr" rid="B11">Lu et&#xa0;al., 2019</xref>). DeepONet first constructs two sub-networks to encode input functions and location variables separately, and then merge them together to compute the output functions, consequently learning neural operators accurately and efficiently from a relatively small dataset.</p>
<p>In the context of three-dimensional ocean internal waves, considering the topographic effect, Yuan Chunxin et&#xa0;al. proposed the modified Benney-Luke equation (mBL equation) (<xref ref-type="bibr" rid="B28">Yuan and Wang, 2022</xref>) to describe the internal wave interaction on the oblique bottom. Compared with the Benney-Luke equation (BL equation) (<xref ref-type="bibr" rid="B2">Benney and Luke, 1964</xref>), mBL equation has a more concise structure and the characteristics of isotropic and bidirectional propagation. The numerical solution of mBL equation fits well with those of BL equation, which proves that mBL equation is valid.</p>
<p>As a relatively complex new partial differential equation in the field of the physical ocean field, the mBL equation has multiple higher partial derivatives, a complex temporal-spatial boundary, and involves a large space range and time range. At present, for mBL equation, only the traditional numerical methods are used to solve it, while deep learning methods such as PINN have not been used to solve it. However, solving mBL equation directly with PINN cannot obtain high-precision solutions, mainly because PINN has the following problems:</p>
<list list-type="bullet">
<list-item>
<p>It is difficult to solve complex PDE with high-dimensional non-convex properties. High-dimensional PDE are usually space-time equations in three dimensions and above, have complex structures and highorder derivatives, and are likely to be high-dimensional non-convex functions, and high-dimensional non-convex optimization problems are NP-hard problems, which are difficult to solve. Therefore, due to the inaccuracies involved in solving high-dimensional nonconvex optimization problems, PINN can easily fall into local optimal solutions when solving high-dimensional PDE, which leads to difficulties in obtaining exact solutions of high-dimensional PDE.</p>
</list-item>
<list-item>
<p>It is difficult to transfer the physical information of boundary points and initial points. PINN are trained from initial points and boundary points, however, as the number of training times increases, it is difficult to transfer the physical information of initial points and boundary points to longer time scales and deeper spatial interiors, and sometimes it is difficult to determine the initial or boundary conditions of PDE.</p>
</list-item>
<list-item>
<p>It is difficult to train the automatic derivative network quickly at a low cost. The backbone network of PINN is a deep neural network, which introduces the physical information of PDE in the iterative training using automatic derivation, and the derivation includes finding the spatial partial derivatives and the temporal partial derivatives, but the complicated process of derivation will increase the cost and time of the training greatly.</p>
</list-item>
</list>
<p>Aiming at the above problems, this paper proposes &#x201c;DF-ParPINN: parallel PINN based on velocity potential field division and single time slice focus for solving mBL equation&#x201d;, with the following contributions:</p>
<list list-type="bullet">
<list-item>
<p>Proposed a temporal-spatial division module of overall velocity potential field. The module firstly divides the overall velocity potential field into velocity potential fields of different time slices based on the time axis, and then divides the velocity potential field of different time slices into the highvelocity field and the low-velocity field based on the shape of rules. The module provides a temporal dimensionality reduction and spatial domain division of overall velocity potential field, delineating multiple sets of velocity potential fields under different temporal-spatial conditions, and reduces the complex high-dimensional nonconvexity of overall velocity potential field.</p>
</list-item>
<list-item>
<p>Proposed a data rational selection module of multiple time slices. The module selects different time slices of data to start training through the reasonable allocation of physical information: on the basis of correlatively selecting all previous time slices of data, the module focuses on selecting the data of the time slice to be solved, and combines the two parts of the selected data to start training. In the case where the initial and boundary points exist only in the initial field with the velocity potential values all zero, the module reasonably selects data from different time slices to start training, which reduces the influence of the physical information of the initial and boundary points that is difficult to be transferred.</p>
</list-item>
<list-item>
<p>Proposed a parallel computation module of high-velocity fields and low-velocity fields. The module uses multiple servers to accelerate solving the high-velocity fields and the low-velocity fields, and then merges the high-velocity fields and the low-velocity fields into one velocity potential field based on the spatial coordinates. This module accelerates the solution of the high-velocity fields and the low-velocity fields on the basis of overall velocity potential field spatio-temporal division and multi-time slice data reasonable selection, which reduces the training cost and time of the network.</p>
</list-item>
</list>
<p>DF-ParPINN improves PINN and can solve mBL equation with high accuracy. DF-ParPINN is a breakthrough in solving complex PDE of the physical ocean field by using deep learning technology.</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Related work</title>
<sec id="s2_1">
<label>2.1</label>
<title>mBL equation</title>
<p>The Benney-Luke equation (BL equation) is a nonlinear partial differential equation used to observe the interaction and reflection characteristics of finite amplitude permanent waves, but the structure of the equation is somewhat complicated. The Kadomtsev-Petviashvili equation (the KP equation) (<xref ref-type="bibr" rid="B6">Kadomtsev and Petviashvili, 1970</xref>; <xref ref-type="bibr" rid="B13">Molinet et&#xa0;al., 2011</xref>) is a nonlinear partial differential equation used to simulate nonlinear waves, but it lacks the characteristics of isotropic and bidirectional propagation. In the context of three-dimensional ocean internal waves, taking into account the topographic effect, Yuan Chunxin et&#xa0;al. proposed the modified Benney-Luke equation (mBL equation) to describe the internal wave-wave interaction of the inclined seafloor, as shown below:</p>
<disp-formula id="eq1">
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mi>c</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mtext>&#x394;</mml:mtext>
<mml:mi>&#x3be;</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mtext>&#x394;</mml:mtext>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>&#x3b2;</mml:mi>
<mml:mo>&#x2207;</mml:mo>
<mml:mo>&#xb7;</mml:mo>
<mml:mi>b</mml:mi>
<mml:mo>&#x2207;</mml:mo>
<mml:mi>&#x3be;</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>&#x3b3;</mml:mi>
<mml:mo stretchy="false">[</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mo>&#x2223;</mml:mo>
<mml:mo>&#x2207;</mml:mo>
<mml:mi>&#x3be;</mml:mi>
<mml:msup>
<mml:mo>&#x2223;</mml:mo>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mtext>&#x394;</mml:mtext>
<mml:mi>&#x3be;</mml:mi>
<mml:mo stretchy="false">]</mml:mo>
<mml:mo>=</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq1">Equation 1</xref>,</p>
<disp-formula id="eq2-3">
<label>(2, 3)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:msup>
<mml:mi>c</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mi>g</mml:mi>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>&#x2212;</mml:mo>
</mml:msup>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>+</mml:mo>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>+</mml:mo>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mi>R</mml:mi>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>&#x2212;</mml:mo>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>&#x2212;</mml:mo>
</mml:msup>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>+</mml:mo>
</mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>&#x2212;</mml:mo>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mi>R</mml:mi>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>+</mml:mo>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mn>3</mml:mn>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>+</mml:mo>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mi>R</mml:mi>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>&#x2212;</mml:mo>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq4-5">
<label>(4, 5)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mi>&#x3b2;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mi>g</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>+</mml:mo>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>+</mml:mo>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mi>R</mml:mi>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>&#x2212;</mml:mo>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>&#x3b3;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>+</mml:mo>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>R</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>&#x2212;</mml:mo>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>+</mml:mo>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mi>R</mml:mi>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mo>&#x2212;</mml:mo>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq2-3">Equations 2</xref>&#x2013;<xref ref-type="disp-formula" rid="eq4-5">5</xref>, <italic>&#x3be;</italic> is the velocity potential, <italic>&#x3be;<sub>t</sub>
</italic> is the first partial derivative of <italic>&#x3be;</italic> to <italic>t</italic>, <italic>&#x3be;<sub>tt</sub>
</italic> is the second partial derivative of <italic>&#x3be;</italic> to <italic>t</italic>, <italic>h</italic>
<sup>+</sup> and <italic>h</italic>
<sup>&#x2212;</sup> are the upper fluid layer water depth and lower fluid layer water depth respectively, R is the ratio of the upper fluid layer density and lower fluid layer density, and g is the gravity acceleration.</p>
<p>
<xref ref-type="disp-formula" rid="eq1">Equation 1</xref> modifies the classical Benney-Luke equation and considers the propagation of nonlinear internal waves over the variable bottom terrain. It is worth noting that mBL equation has the characteristics of isotropic and bidirectional propagation, which the widely used KP equation does not have. The structure of mBL equation is much simpler compared with BL equation, and the numerical results of mBL equation are in good agreement with those of BL equation, which verifies the validity of mBL equation.</p>
<p>
<xref ref-type="disp-formula" rid="eq1">Equation 1</xref> admits an analytic solution for internal line solitary waves in the absence of topography, which can be explicitly expressed as:</p>
<disp-formula id="eq6-7">
<label>(6, 7)</label>
<mml:math display="block" id="M4">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mi>A</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>k</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>c</mml:mi>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#xb7;</mml:mo>
<mml:mi>r</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>v</mml:mi>
<mml:mi>k</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>&#x3be;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mi>A</mml:mi>
<mml:mrow>
<mml:mi>v</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mi>t</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>h</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#xb7;</mml:mo>
<mml:mi>r</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>v</mml:mi>
<mml:mi>k</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq6-7">Equations 6, 7</xref>, <italic>r</italic> = (<italic>x</italic>,<italic>y</italic>) is a vector in any direction on the horizontal plane, <italic>k</italic> = (<italic>k<sub>x</sub>
</italic>, <italic>k<sub>y</sub>
</italic>) is the corresponding wave number vector with the magnitude of <inline-formula>
<mml:math display="inline" id="im1">
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>=</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:msubsup>
<mml:mi>k</mml:mi>
<mml:mi>x</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>+</mml:mo>
<mml:msubsup>
<mml:mi>k</mml:mi>
<mml:mi>y</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
</inline-formula>, and the amplitude <italic>A</italic>(<italic>k</italic>) and non-linear wave speed <italic>v</italic>(<italic>k</italic>) as shown in of <xref ref-type="disp-formula" rid="eq8-9">Equations 8</xref>, <xref ref-type="disp-formula" rid="eq8-9">9</xref>:</p>
<disp-formula id="eq8-9">
<label>(8, 9)</label>
<mml:math display="block" id="M5">
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>k</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>4</mml:mn>
<mml:mi>&#x3b1;</mml:mi>
<mml:msup>
<mml:mi>v</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:msup>
<mml:mi>k</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mi>&#x3b3;</mml:mi>
</mml:mfrac>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msup>
<mml:mi>v</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mi>c</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
<mml:mi>&#x3b1;</mml:mi>
<mml:msup>
<mml:mi>k</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>PINN</title>
<p>In 2019, the &#x201c;Physical Information Neural Network&#x201d; (PINN) was proposed by a research group led by Professor George Em Karniadakis of Brown University. PINN is a new scientific research paradigm that uses deep learning technology to solve PDE. Since its birth, PINN has become the commonest keyword in the field of &#x201c;AI for science&#x201d;. PINN is a kind of neural network used to solve supervised learning tasks, it adds physical equations as limiting conditions to the neural network so that the trained model can meet the laws of physics. In order to realize this physical limitation, in addition to using the neural network&#x2019;s own loss function, PINN also uses the physical information loss function that contains the physical equation. What PINN optimizes through the physical information loss function is the difference between the solved physical equation value and the real physical equation value, and the closer the difference is to zero, the better the optimization effect is. After many rounds of iteration, the model trained by the PINN not only optimizes the neural network&#x2019;s own loss function but also optimizes the physical information loss function including the physical equation, so that the final solved result can fit the real value and satisfy the physical law described by the partial differential equation. PINN uses a deep neural network to train the model, and the two-dimensional temporal-spatial structure of PINN is shown in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>:</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Network structure of PINN.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-11-1309775-g001.tif"/>
</fig>
<p>In <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>, <italic>x</italic> is the spatial argument in the input data, and <italic>t</italic> is the time argument in the input data. <italic>u</italic> is the output dependent variable, and its right connected <inline-formula>
<mml:math display="inline" id="im2">
<mml:mrow>
<mml:mfrac>
<mml:mo>&#x2202;</mml:mo>
<mml:mrow>
<mml:mo>&#x2202;</mml:mo>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
<mml:mfrac>
<mml:mo>&#x2202;</mml:mo>
<mml:mrow>
<mml:mo>&#x2202;</mml:mo>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mo>&#x2202;</mml:mo>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2202;</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula>, &#x2026; are the first or multiple partial derivatives of <italic>u</italic> to <italic>t</italic> and <italic>x</italic>. <italic>MSE</italic> stands for mean square error and is formed by adding <italic>MSE</italic>
<sub>{</sub>
<italic>
<sub>u,BC,IC</sub>
</italic>} and <italic>MSE<sub>f</sub>
</italic>. After each iteration, PINN will judge the size of <italic>MSE</italic> and threshold <italic>&#x3f5;</italic>, if <italic>MSE</italic> is greater than threshold, the model training will continue, if <italic>MSE</italic> is less than threshold, the model training will 180 end. Specific definitions of <italic>MSE</italic>, <italic>MSE</italic>
<sub>{</sub>
<italic>
<sub>u,BC,IC</sub>
</italic>} and <italic>MSE<sub>f</sub>
</italic> are as follows:</p>
<disp-formula id="eq10">
<label>(10)</label>
<mml:math display="block" id="M6">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mi>u</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mi>C</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>I</mml:mi>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq10">Equation 10</xref>, <italic>MSE</italic> is the loss function of the whole, which is composed of the addition of the loss function <italic>MSE</italic>
<sub>{</sub>
<italic>
<sub>u</sub>
</italic>,<italic>
<sub>BC</sub>
</italic>,<italic>
<sub>IC</sub>
</italic>
<sub>}</sub> of the initial and boundary point and the physical information loss function <italic>MSE<sub>f</sub>
</italic> of the space point.</p>
<disp-formula id="eq11">
<label>(11)</label>
<mml:math display="block" id="M7">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mi>u</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mi>C</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>I</mml:mi>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>u</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>u</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mi>t</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mi>u</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>&#x2223;</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq11">Equations 11</xref>, <italic>MSE</italic>
<sub>{</sub>
<italic>
<sub>u,BC,IC</sub>
</italic>} is the fitting of the data set, and can learn the distribution law of the training data set just like the traditional neural networks, where <italic>u</italic> is the solution of the partial differential equation, <italic>BC</italic> is the boundary data set, and <italic>IC</italic> is the initial data set. <italic>u</italic>(<italic>x<sub>u</sub>,t<sub>u</sub>
</italic>) is the velocity value (or other values) of the initial and boundary point solved by PINN, <italic>u</italic> is the velocity value (or other values) of the initial and boundary point solved by the numerical method, <italic>N<sub>u</sub>
</italic> is the number of input initial and boundary points.</p>
<disp-formula id="eq12">
<label>(12)</label>
<mml:math display="block" id="M8">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mi>t</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2223;</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq12">Equation 12</xref>, <italic>MSE<sub>f</sub>
</italic> is the fitting of physical equations and can learn the physical laws described by the equation. <italic>f</italic>(<italic>x<sub>f</sub>, t<sub>f</sub>
</italic>) is the size of the physical equation solved by PINN, and <italic>N<sub>f</sub>
</italic> is the number of input space points (including initial and boundary points).</p>
<p>If the PINN can obtain the solution of the equation well, then the velocity value (or other values) of <italic>MSE<sub>u</sub>
</italic> with respect to every initial or boundary point approaches zero, and the size of the physical equation of <italic>MSE<sub>f</sub>
</italic> with respect to every point approaches zero. In other words, when <italic>MSE</italic> approaches zero, it can be considered that the solved value of each point on the training data set approaches the true value. In this way, solving the equation is transformed into an optimization loss function using the backpropagation mechanism of the neural network and two optimizers L-BFGS and Adam.</p>
</sec>
</sec>
<sec id="s3" sec-type="materials|methods">
<label>3</label>
<title>Materials and methods</title>
<sec id="s3_1">
<label>3.1</label>
<title>Overall architecture of DF-ParPINN</title>
<p>The mBL equation is a time-dependent two-dimensional equation with a complex structure and non-convex properties, contains many second-order partial derivatives, has a complicated derivation process, and has boundary conditions that are difficult to determine. Because of the problems existing in PINN, it is difficult to obtain the high-accuracy solution of mBL equation directly by PINN. Therefore, according to the characteristics of mBL equation, we proposed &#x201c;DF-ParPINN: parallel PINN based on velocity potential field division and single time slice focus&#x201d;.</p>
<p>The overall architecture of DF-ParPINN consists of three modules: temporal-spatial division module of overall velocity potential field, rational selection module of multiple time slices data, parallel computation module of high-velocity fields and low-velocity fields, each of them respectively improves the optimization of the high-dimensional non-convex equation, the deep transmission of effective physical information, the low cost and fast training of the network. The three modules are shown in <xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2</bold>
</xref>&#x2013;<xref ref-type="fig" rid="f4">
<bold>4</bold>
</xref>:</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Temporal-spatial division module of overall velocity potential field.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-11-1309775-g002.tif"/>
</fig>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Data rational selection module of multiple time slices.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-11-1309775-g003.tif"/>
</fig>
<p>In <xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2</bold>
</xref>&#x2013;<xref ref-type="fig" rid="f4">
<bold>4</bold>
</xref>, VPF is shorthand for velocity potential field, HVFs is shorthand for the high-velocity fields and HVF is the singular form of HVFs, LVFs is shorthand for the low-velocity fields and LVF is the singular form of LVFs.</p>
<p>In <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>, firstly, the whole velocity potential field with three-dimensional temporal-spatial data is temporal dimension reduced, and the velocity potential fields of different time slices are obtained. Then, the velocity potential field of different time slices is spatially divided, and the high-velocity field of different time slices (the raised part in middle marked by high) and the low-velocity field of different time slices (the smooth part in around marked by low) are obtained.</p>
<p>In <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>, firstly, the high-velocity field (low-velocity field) data of different time slices are divided into the data of the time slice to be solved and the data of the previous time slices. Then, the data of these two parts are selected reasonably, the data of the time slice to be solved are focused selected, and the data of the previous time slices are less selected, to obtain the reasonably selected data of the high-velocity field (low-velocity field).</p>
<p>In <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>, firstly, the reasonably selected data of the high-velocity field and the reasonably selected data of the low-velocity field are respectively input into parallel physics-informed neural networks (shown in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>) of different servers for subdomain parallel calculation and the solved high-velocity field and the solved low-velocity field are obtained. Then, the subdomains solved by these two parts are combined in space to get the solved velocity potential field.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Parallel computation module of high-velocity fields and low-velocity fields.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-11-1309775-g004.tif"/>
</fig>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Network structure of DF-ParPINN.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-11-1309775-g005.tif"/>
</fig>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Temporal-spatial division module of overall velocity potential field</title>
<sec id="s3_2_1">
<label>3.2.1</label>
<title>mBL equation normalization</title>
<p>mBL equation has different velocity potential fields under different equation coefficients, initial conditions, and boundary conditions. The more coefficients of the equation, the more complex the initial and boundary conditions, and the more irregular the velocity potential field shape of mBL equation. The velocity potential field of mBL equation can be spatially domain divided according to regular shapes, and reduce complex high-dimensional nonconvexity. Therefore, in order to obtain the regular velocity potential field shape, we set the equation coefficients, initial conditions, and boundary conditions of mBL equation, and mBL equation after setting is shown in follows:</p>
<disp-formula id="eq13">
<label>(13)</label>
<mml:math display="block" id="M9">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mi>c</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mtext>&#x394;</mml:mtext>
<mml:mi>&#x3be;</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>a</mml:mi>
<mml:mtext>&#x394;</mml:mtext>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>&#x3b3;</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mrow>
<mml:mo>&#x2207;</mml:mo>
<mml:mi>&#x3be;</mml:mi>
</mml:mrow>
</mml:mrow>
<mml:msup>
<mml:mo>&#x2223;</mml:mo>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mtext>&#x394;</mml:mtext>
<mml:mi>&#x3be;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</disp-formula>
<p>By setting the coefficient b in <xref ref-type="disp-formula" rid="eq1">Equation 1</xref> to 0, we get <xref ref-type="disp-formula" rid="eq13">Equation  13</xref>. After the above settings, the velocity potential field of mBL equation can take on a regular shape.</p>
</sec>
<sec id="s3_2_2">
<label>3.2.2</label>
<title>Time dimension reduction</title>
<p>For mBL equation, the velocity potential fields of different time slices may have different shapes. Therefore, before spatial domain division of the velocity potential field, time dimension reduction is needed, that is, the overall velocity potential field is divided into velocity potential fields of different time slices based on the time axis. After the time dimension reduction, the original three-dimensional space-time mBL equation becomes many groups of the two-dimensional space mBL equation, and the complex high-dimensional non-convex characteristics of the mBL equation are degraded. In this way, DF-ParPINN does not have to process the three-dimensional data selected under all time slices at once, but only to process the three-dimensional data selected under the required time slices.</p>
<p>mBL equation of <italic>x</italic> &#x2208; [&#x2212;1,1], <italic>y</italic> &#x2208; [&#x2212;2,2] and <italic>t</italic> &#x2208; [0,7500] is taken as an example for time dimension reduction. Among them, x contains 512 points, y contains 1024 points, and t contains 51 time slices. After time dimensionality reduction, the overall velocity potential field, which originally contained 512*1024*51 = 26738688 solutions, was divided into 51 velocity potential fields corresponding to 51 time slices, each containing 512*1024 = 524288 solutions. The velocity potential fields at partial time slice solved by the pseudo-spectral method are shown in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>:</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Velocity potential field at partial time slice solved by pseudo-spectral method.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-11-1309775-g006.tif"/>
</fig>
</sec>
<sec id="s3_2_3">
<label>3.2.3</label>
<title>Spatial domain division</title>
<p>As can be seen from <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>, for mBL equation, except that the initial field when <italic>t</italic> = 0 is &#x201c;a flat land&#x201d;, the velocity potential field of other time slices has a regular shape: high in the middle and low around the sides. Therefore, the velocity potential fields of different time slices can be spatially domain divided according to the shape of this rule. 51 sets of the high-velocity fields and the low-velocity fields can be obtained from 51 time slices. After the Spatial Domain Division, the original multiple velocity potential fields become multiple high-velocity and low-velocity fields, and the non-convex characteristics of mBL equation in space are further degraded. In this way, DF-ParPINN can process high-velocity fields and low-velocity fields separately, to better learn the characteristics of high-velocity fields and low-velocity fields.</p>
<p>For the velocity potential field per time slice (except for the initial field), the velocity potential values of some space points have a large variation range, and these space points are all distributed in the middle of the velocity potential field; the velocity potential values of other space points are almost unchanged, and these points are all distributed around the velocity potential field. The velocity potential field at this time can be divided into high-velocity potential field (referred to as &#x201c;high-velocity field&#x201d;) and low-velocity potential field (referred to as &#x201c;low-velocity field&#x201d;) based on the velocity threshold. The velocity threshold has the following characteristics: it is smaller than the value of all points in the high-velocity field and larger than the value of all points in the low-velocity field. Therefore, the high-velocity field is a part of the velocity potential field where the velocity potential of all points is greater than the velocity threshold, while the low-velocity field is another part of the velocity potential field where the velocity potential of all points is less than the velocity threshold. Because the velocity potential value of no space point is equal to the velocity threshold value, there are no boundary points and boundary domain when the velocity potential field is divided based on the velocity threshold value, and there is no sub neural network aiming at the boundary domain.</p>
<p>The velocity potential field at <italic>t</italic> = 7500<italic>s</italic> (51st time slice) of mBL equation is taken as an example to divide the spatial domain. For the velocity potential field at this time, the velocity threshold is -0.7616 when taking the minimum value of the velocity potential value of all space points by MATLAB (MATLAB takes four decimal places by default). Using -0.7616 as the velocity threshold, the velocity potential field at this time is spatially domain divided. The obtained high-velocity field, as shown in the middle trapezoid (yellow, green, and light blue) in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>, contains 400762 space points. The obtained low-velocity field, as shown in the surrounding plane (dark blue) of <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>, contains 123526 space points.</p>
</sec>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Data rational selection module of multiple time slices</title>
<p>For the overall velocity potential field of mBL equation, it is difficult to obtain a high-accuracy solution by directly selecting a part of data from all time slices into PINN and outputting the solved velocity potential value of all time slices. This is because without dividing the overall velocity potential field, it is impossible to reduce its high-dimensional non-convex property, and the interaction of physical information in different time slices increases the complexity and difficulty of training. Therefore, in addition to the division of overall velocity potential field, the physical information of different time slices should be reasonably allocated. By selecting the data of different time slices reasonably, the physical information of different time slices can be allocated reasonably.</p>
<p>Objectively, the velocity potential value of mBL equation in a certain time slice depends only on the physical information of the current time slice and all previous time slices, and mainly depends on the physical information of the current time slice. Therefore, for the velocity potential field of a certain time slice, the physical information of all previous time slices should be related and the physical information of the current time slice should be focused during training. In other words, for the velocity potential field of a certain time slice, the data entered into the network for training should contain the data of the current time slice and all previous time slices, mainly including the data of the current time slice.</p>
<p>mBL equation of <italic>x</italic> &#x2208; [&#x2212;1,1], <italic>y</italic> &#x2208; [&#x2212;2, 2], and <italic>t</italic> &#x2208; [0,7500] is taken as an example to carry out reasonabledata selection. After the velocity potential field division module, the initial and boundary points of mBL equation are located in the initial field, and the velocity potential value of all space points in the initial field is zero. Moreover, the overall velocity potential field of mBL equation is divided into 51 groups (corresponding to 51 time slices) of high-velocity field and low-velocity field. When the high-velocity field and the low-velocity field of a certain time slice are required to be solved, the data entered into the network for training consists of two parts, as shown below:</p>
<disp-formula id="eq14">
<label>(14)</label>
<mml:math display="block" id="M10">
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>a</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>d</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>+</mml:mo>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>d</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x2212;</mml:mo>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq14">Equation 14</xref>, <italic>data</italic> indicates all the selected data, <italic>data<sub>i</sub>
</italic>
<sub>+</sub> indicates the data selected from the time slice to be solved, and <italic>data<sub>i</sub>
</italic>
<sub>&#x2212;</sub> indicates the data selected from all previous time slices. The <italic>data</italic> contains space points and corresponding true velocity potential values, the amount of data in <italic>data<sub>i</sub>
</italic>
<sub>+</sub> is greater that in <italic>data<sub>i</sub>
</italic>
<sub>&#x2212;</sub>, and <italic>data<sub>i</sub>
</italic>
<sub>&#x2212;</sub> contains the data of the initial field.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Parallel computation module of high-velocity fields and low-velocity fields</title>
<p>The mBL equation of <italic>x</italic> &#x2208; [&#x2212;1, 1], <italic>y</italic> &#x2208; [&#x2212;2, 2] and <italic>t</italic> &#x2208; [0, 7500] is taken as an example of parallel computation in a subdomain. After the temporal-spatial division module of overall velocity potential field and the data rational selection module of multiple time slices, the overall velocity potential field of mBL equation is divided into 51 groups (corresponding to 51 time slices) of high-velocity field and low-velocity field. Moreover, when the high-velocity or the low-velocity field of a time slice is required to be solved, the data entered into the network contains not only the data of the time slice to be solved but also the data of all previous time slices. Compared with using a single server to serial compute the overall velocity potential field, using multiple servers to compute the high-velocity and the low-velocity fields of different time slices in parallel can accelerate the calculation speed. Therefore, when the velocity potential field of a certain time slice is required to be solved, different servers can be used to compute the high-velocity or the low-velocity field in parallel, and then combine the high-velocity field and the low-velocity field into one velocity potential field according to the spatial coordinates, as shown below:</p>
<disp-formula id="eq15">
<label>(15)</label>
<mml:math display="block" id="M11">
<mml:mrow>
<mml:mi>&#x3be;</mml:mi>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x222a;</mml:mo>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>w</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq16">
<label>(16)</label>
<mml:math display="block" id="M12">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo stretchy="false">[</mml:mo>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2223;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>H</mml:mi>
<mml:mi>V</mml:mi>
<mml:mi>F</mml:mi>
<mml:mi>s</mml:mi>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq17">
<label>(17)</label>
<mml:math display="block" id="M13">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>w</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo stretchy="false">[</mml:mo>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>w</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2223;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>L</mml:mi>
<mml:mi>V</mml:mi>
<mml:mi>F</mml:mi>
<mml:mi>s</mml:mi>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq15">Equations 15</xref>&#x2013;<xref ref-type="disp-formula" rid="eq17">17</xref>, <italic>&#x3be;</italic> is the solved velocity potential value of the current velocity potential field, <italic>&#x3be;<sub>high</sub>
</italic> is the solved velocity potential value of the current high-velocity field, and <italic>&#x3be;<sub>low</sub>
</italic> is the solved velocity potential value of the current low-velocity field. <italic>&#x3b8;<sub>high</sub>
</italic> is the neural network used by the current high-velocity field, and <italic>HV Fs</italic> is the current high-velocity field and all previous high-velocity fields. <italic>&#x3b8;<sub>low</sub>
</italic> is the neural network used by the current low-velocity field, <italic>LV Fs</italic> is the current low-velocity field and all previous low-velocity fields, including the initial field, and the initial and boundary points are located in the initial field. <italic>&#x3be;</italic> is obtained by the union of <italic>&#x3be;<sub>high</sub>
</italic> and <italic>&#x3be;<sub>low</sub>
</italic>. <italic>&#x3b8;<sub>high</sub>
</italic> and <italic>&#x3b8;<sub>low</sub>
</italic> have the same network structure is shown in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>:</p>
<p>In the network structure of DF-ParPINN, the input is the space coordinates <italic>x</italic>, <italic>y</italic> and time coordinates <italic>t</italic>, and the output is the velocity potential value <italic>&#x3be;</italic> and the function value <italic>f</italic>. The network first determines whether <italic>x</italic> and <italic>y</italic> belong to the high-velocity field, if yes, they are trained by deep neural network 1 in server 1, if not, they are trained by deep neural network 2 in server 2. The structure of the two deep neural networks is exactly the same, except that the inputs and outputs are different. <italic>x</italic>, <italic>y</italic>, <italic>t</italic> become <italic>&#x3be;</italic> after deep neural network, <italic>&#x3be;</italic> becomes multiple first and second partial derivatives after automatic derivation, and multiple partial derivatives become <italic>f</italic> when substituted into <xref ref-type="disp-formula" rid="eq13">Equation 13</xref>. DF-ParPINN uses multiple deep neural networks in parallel to train the model and defines the loss function as:</p>
<disp-formula id="eq18">
<label>(18)</label>
<mml:math display="block" id="M14">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi>&#x3be;</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Where, MSE is the overall loss function, which is formed by adding <italic>MSE<sub>&#x3be;</sub>
</italic>, <italic>MSE<sub>&#x3be;t</sub>
</italic>, and <italic>MSE<sub>f</sub>
</italic>.</p>
<disp-formula id="eq19">
<label>(19)</label>
<mml:math display="block" id="M15">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi>&#x3be;</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:mfrac>
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>&#x3be;</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mi>&#x3be;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>&#x2223;</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Where <italic>MSE<sub>&#x3be;</sub>
</italic> is the velocity potential loss function, <italic>&#x3be;</italic>(<italic>x</italic>,<italic>y</italic>,<italic>t</italic>) is the velocity potential value solved by DF-ParPINN, <italic>&#x3be;</italic> is the velocity potential value solved by the pseudospectral method, and <italic>N</italic> is the number of input space points in different time slices (including initial and boundary points). <italic>&#x3be;</italic> in <italic>&#x3b8;<sub>high</sub>
</italic> is <italic>&#x3be;<sub>high</sub>
</italic>, and <italic>&#x3be;</italic> in <italic>&#x3b8;<sub>low</sub>
</italic> is <italic>&#x3be;<sub>low</sub>
</italic>.</p>
<disp-formula id="eq20">
<label>(20)</label>
<mml:math display="block" id="M16">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:mfrac>
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mo>&#x2223;</mml:mo>
<mml:msub>
<mml:mi>&#x3be;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi>&#x3be;</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo>&#x2223;</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Where, <italic>MSE<sub>&#x3be;t</sub>
</italic> is the first-order partial time derivative loss function, <italic>&#x3be;<sub>t</sub>
</italic>(<italic>x</italic>,<italic>y</italic>,<italic>t</italic>) is the first partial derivative of <italic>&#x3be;</italic> to <italic>t</italic> solved by DF-ParPINN, <italic>&#x3be;<sub>t</sub>
</italic> is the first partial derivative of <italic>&#x3be;</italic> to <italic>t</italic> solved by the pseudospectral method, and <italic>N</italic> is the number of input space points in different time slices (including initial and boundary points). <italic>&#x3be;<sub>t</sub>
</italic> in <italic>&#x3b8;<sub>high</sub>
</italic> is <italic>&#x3be;<sub>thigh</sub>
</italic>, and <italic>&#x3be;<sub>t</sub>
</italic> in <italic>&#x3b8;<sub>low</sub>
</italic> is <italic>&#x3be;<sub>tlow</sub>
</italic>.</p>
<disp-formula id="eq21">
<label>(21)</label>
<mml:math display="block" id="M17">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:mfrac>
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>&#x2223;</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Where, <italic>MSE<sub>f</sub>
</italic>  is the physical information loss function, <italic>f</italic>(<italic>x,y,t</italic>) is the size of mBL equation solved by DF-ParPINN, <italic>f</italic> is the size of mBL equation solved by the pseudo-spectral method, and <italic>N</italic> is the number of input space points in different time slices (include initial and boundary points). <italic>f</italic> in <italic>&#x3b8;<sub>high</sub>
</italic> is <italic>f<sub>high</sub>
</italic>, and <italic>f</italic> in <italic>&#x3b8;<sub>low</sub>
</italic> is <italic>f<sub>low</sub>
</italic>.</p>
<p>Moreover, <italic>&#x3b8;<sub>low</sub>
</italic> is also responsible for processing the data of the initial field, and the initial and boundary points are located in the initial field, and the loss function of the initial and boundary points also follows <xref ref-type="disp-formula" rid="eq18">Equations 18</xref>-<xref ref-type="disp-formula" rid="eq21">21</xref>.</p>
<p>If DF-ParPINN can solve mBL equation well, then the velocity potential value of <italic>MSE<sub>&#x3be;</sub>
</italic> with respect to every point tends to zero, the first partial derivative of <italic>MSE<sub>&#x3be;t</sub>
</italic> with respect to every point tends to zero, and the physical equation value of <italic>MSE<sub>f</sub>
</italic> with respect to every point tends to zero. In other words, when <italic>MSE</italic> approaches zero, it can be considered that the solved value of each point on the training data set approaches the true value. In this way, solving mBL equation is transformed into an optimization loss function using the backpropagation mechanism of the neural network and two optimizers, L-BFGS and Adam.</p>
</sec>
</sec>
<sec id="s4" sec-type="results">
<label>4</label>
<title>Results</title>
<sec id="s4_1">
<label>4.1</label>
<title>Data set</title>
<p>We use mBL equation with the regular shape shown in <xref ref-type="disp-formula" rid="eq13">Equation 13</xref> to conduct numerical experiments, and the data set was obtained and provided by Chunxin Yuan et&#xa0;al. through the pseudo-spectral method. The detailed information of mBL equation dataset is shown in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>:</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Detailed information of mBL equation data set.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Variables or parameter</th>
<th valign="middle" align="center">Physical meaning</th>
<th valign="middle" align="center">Range or size</th>
<th valign="middle" align="center">Number</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">
<italic>x</italic> (independent variable)</td>
<td valign="middle" align="center">Space point on the x-axis</td>
<td valign="middle" align="center">[-1,1]</td>
<td valign="middle" align="center">1024</td>
</tr>
<tr>
<td valign="middle" align="center">
<italic>y</italic> (independent variable)</td>
<td valign="middle" align="center">Space point on the y-axis</td>
<td valign="middle" align="center">[-2,2]</td>
<td valign="middle" align="center">512</td>
</tr>
<tr>
<td valign="middle" align="center">
<italic>t</italic> (independent variable)</td>
<td valign="middle" align="center">Space point on the t-axis</td>
<td valign="middle" align="center">[0,7500]</td>
<td valign="middle" align="center">51</td>
</tr>
<tr>
<td valign="middle" align="center">
<italic>&#x3be;</italic> (dependent variable)</td>
<td valign="middle" align="center">Velocity potential</td>
<td valign="middle" align="center">(-0.8,2.4)</td>
<td valign="middle" align="center">1024 &#xd7; 512 &#xd7; 51</td>
</tr>
<tr>
<td valign="middle" align="center">
<italic>&#x3be;<sub>t</sub>
</italic> (dependent variable)</td>
<td valign="middle" align="center">First partial derivative of <italic>&#x3be;</italic> to <italic>t</italic>
</td>
<td valign="middle" align="center">(-0.5,0.06)</td>
<td valign="middle" align="center">1024 &#xd7; 512 &#xd7; 51</td>
</tr>
<tr>
<td valign="middle" align="center">
<italic>h</italic>
<sup>+</sup> (Invariant parameter)</td>
<td valign="middle" align="center">Upper fluid layer water depth</td>
<td valign="middle" align="center">100</td>
<td valign="middle" align="center">1</td>
</tr>
<tr>
<td valign="middle" align="center">
<italic>h</italic>
<sup>&#x2212;</sup> (Invariant parameter)</td>
<td valign="middle" align="center">Lower fluid layer water depth</td>
<td valign="middle" align="center">200</td>
<td valign="middle" align="center">1</td>
</tr>
<tr>
<td valign="middle" align="center">
<italic>R</italic> (Invariant parameter)</td>
<td valign="middle" align="center">Ratio of <italic>h</italic>
<sup>+</sup> and <italic>h</italic>
<sup>&#x2212;</sup>
</td>
<td valign="middle" align="center">0.9985</td>
<td valign="middle" align="center">1</td>
</tr>
<tr>
<td valign="middle" align="center">
<italic>g</italic> (Invariant parameter)</td>
<td valign="middle" align="center">Gravity acceleration</td>
<td valign="middle" align="center">9.8</td>
<td valign="middle" align="center">1</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Initial conditions and boundary conditions</title>
<p>For mBL equation shown in <xref ref-type="disp-formula" rid="eq13">Equation 13</xref>, there are many sets of initial conditions and boundary conditions, but not every set of conditions results in a mBL equation with the regular shape. The initial conditions and boundary conditions of mBL equation with the regular shape are shown in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>:</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Initial conditions and boundary conditions of mBL equation with the regular shape.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Type</th>
<th valign="top" align="center">Nature</th>
<th valign="top" align="center">Characteristics</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Initial conditions</td>
<td valign="top" align="center">Three-dimensional temporal-spatial points with differentiable velocity potentials</td>
<td valign="top" align="center">
<italic>t</italic> = 0</td>
</tr>
<tr>
<td valign="top" align="left">boundary conditions</td>
<td valign="top" align="center">Three-dimensional temporal-spatial points with differentiable velocity potentials</td>
<td valign="top" align="center">
<italic>&#x3be;</italic> = 0 and <italic>&#x3be;<sub>t</sub>
</italic> = 0</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>Comparative study</title>
<sec id="s4_3_1">
<label>4.3.1</label>
<title>Experimental setup</title>
<p>In order to verify that DF-ParPINN can solve mBL equation with high accuracy, we use three physical information neural network methods PINN, PIRNN, and cPINN, and a neural computing subclass method DeepONet, as the contrast baseline. The differences between the five algorithms are shown in <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>:</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Differences between the five algorithms (contrast experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Algorithm</th>
<th valign="top" align="center">Physical information</th>
<th valign="top" align="center">Neural operator</th>
<th valign="top" align="center">Basic network structure</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">PINN</td>
<td valign="middle" align="center">&#x2713;</td>
<td valign="middle" align="center">&#xd7;</td>
<td valign="middle" align="center">DNN</td>
</tr>
<tr>
<td valign="middle" align="center">PIRNN</td>
<td valign="middle" align="center">&#x2713;</td>
<td valign="middle" align="center">&#xd7;</td>
<td valign="middle" align="center">RNN</td>
</tr>
<tr>
<td valign="middle" align="center">cPINN</td>
<td valign="middle" align="center">&#x2713;</td>
<td valign="middle" align="center">&#xd7;</td>
<td valign="middle" align="center">DNN</td>
</tr>
<tr>
<td valign="middle" align="center">DeepONet</td>
<td valign="middle" align="center">&#xd7;</td>
<td valign="middle" align="center">&#x2713;</td>
<td valign="middle" align="center">DNN</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN</td>
<td valign="middle" align="center">&#x2713;</td>
<td valign="middle" align="center">&#xd7;</td>
<td valign="middle" align="center">DNN</td>
</tr>
</tbody>
<tbody>
<tr>
<th valign="middle" align="center">Algorithm</th>
<th valign="middle" align="center">Data <break/>rational selection</th>
<th valign="middle" align="center">Temporal-spatial domain division</th>
<th valign="middle" align="center">Parallel computation</th>
</tr>
</tbody>
<tbody>
<tr>
<td valign="middle" align="center">PINN</td>
<td valign="top" align="center">&#xd7;</td>
<td valign="top" align="center">&#xd7;</td>
<td valign="middle" align="center">&#xd7;</td>
</tr>
<tr>
<td valign="middle" align="center">PIRNN</td>
<td valign="top" align="center">&#xd7;</td>
<td valign="top" align="center">&#xd7;</td>
<td valign="top" align="center">&#xd7;</td>
</tr>
<tr>
<td valign="middle" align="center">cPINN</td>
<td valign="top" align="center">&#xd7;</td>
<td valign="middle" align="center">&#x2713;</td>
<td valign="top" align="center">&#xd7;</td>
</tr>
<tr>
<td valign="middle" align="center">DeepONet</td>
<td valign="top" align="center">&#xd7;</td>
<td valign="middle" align="center">&#xd7;</td>
<td valign="top" align="center">&#xd7;</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN</td>
<td valign="middle" align="center">&#x2713;</td>
<td valign="middle" align="center">&#x2713;</td>
<td valign="middle" align="center">&#x2713;</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The input and output of the five algorithms are shown in <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>:</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>Input and output of the five algorithms (contrast experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Algorithm</th>
<th valign="middle" align="center">Input</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">PINN</td>
<td valign="middle" align="center">Partial data set of velocity potential field of all time slices</td>
</tr>
<tr>
<td valign="middle" align="center">PIRNN</td>
<td valign="middle" align="center">Partial data set of velocity potential field of all time slices</td>
</tr>
<tr>
<td valign="middle" align="center">cPINN</td>
<td valign="middle" align="center">Partial data set of high-velocity field (or low-velocity field) of all time slices</td>
</tr>
<tr>
<td valign="middle" align="center">DeepONet</td>
<td valign="middle" align="center">Partial data set of velocity potential field of all time slices</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN</td>
<td valign="middle" align="left">Partial data set of high-velocity field (or low-velocity field) of time slice to be solved and all previous time slices</td>
</tr>
<tr>
<td valign="middle" align="center">Algorithm</td>
<td valign="middle" align="center">Output</td>
</tr>
<tr>
<td valign="middle" align="center">PINN</td>
<td valign="middle" align="center">Velocity potential field of time slice to be solved</td>
</tr>
<tr>
<td valign="middle" align="center">PIRNN</td>
<td valign="middle" align="center">Velocity potential field of time slice to be solved</td>
</tr>
<tr>
<td valign="middle" align="center">cPINN</td>
<td valign="middle" align="center">High-velocity field (or low-velocity field) of time slice to be solved</td>
</tr>
<tr>
<td valign="middle" align="center">DeepONet</td>
<td valign="middle" align="center">Velocity potential field of time slice to be solved</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN</td>
<td valign="middle" align="center">High-velocity field (or low-velocity field) of time slice to be solved</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The detailed settings of the five algorithms are shown in <xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref>:</p>
<table-wrap id="T5" position="float">
<label>Table&#xa0;5</label>
<caption>
<p>Detailed settings of the five algorithms (contrast experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Algorithm</th>
<th valign="top" align="center">Training instances</th>
<th valign="top" align="center">Testing instances</th>
<th valign="top" align="center">Epochs</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">PINN</td>
<td valign="middle" align="center">100000</td>
<td valign="middle" align="center">10000</td>
<td valign="middle" align="center">5000</td>
</tr>
<tr>
<td valign="middle" align="center">PIRNN</td>
<td valign="middle" align="center">100000</td>
<td valign="middle" align="center">10000</td>
<td valign="middle" align="center">5000</td>
</tr>
<tr>
<td valign="middle" align="center">cPINN</td>
<td valign="middle" align="center">100000</td>
<td valign="middle" align="center">10000</td>
<td valign="middle" align="center">5000</td>
</tr>
<tr>
<td valign="middle" align="center">DeepONet</td>
<td valign="middle" align="center">100000</td>
<td valign="middle" align="center">10000</td>
<td valign="middle" align="center">5000</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN</td>
<td valign="middle" align="center">100000</td>
<td valign="middle" align="center">10000</td>
<td valign="middle" align="center">5000</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Both the training set and the test set of the five algorithms belong to the same data set, both follow the principle of random selection, and the data contained in both are not repeated.</p>
<p>PINN or PIRNN does not perform temporal-spatial domain division of mBL equation. PINN or PIRNN selected directly 100000 datasets from 1024 &#xd7; 512 &#xd7; 51 datasets (containing the overall velocity potential field of all time slices) as the training set, and 10000 datasets from 1024 &#xd7; 512 datasets (containing only the velocity potential field of the time slice to be solved) as the test set.</p>
<p>cPINN only performs temporal-spatial domain division (division only in the spatial domain), and divides the velocity potential field of all time slices into the overall high-velocity field and the overall low-velocity field. For the overall high-velocity field, cPINN selected 100000 datasets from 400762*51 datasets (containing the high-velocity field and the partial low-velocity field of all time slices) as the training set, and selected 10000 datasets from 400762 datasets (containing the high-velocity field and the partial low-velocity field of the time slices to be solved) as the test set. For the overall low-velocity field, cPINN selected 10000 datasets from 123526*51 datasets (containing another part of the low-velocity field of all time slices) as the training set, and selected 10000 datasets from 123526 datasets (containing another part of the low-velocity field of the time slice to be solved) as the test set.</p>
<p>DeepONet does not perform temporal-spatial domain division of mBL equation. The training set and test set selection of DeepONet are the same as that of PINN.</p>
<p>DF-ParPINN performs temporal-spatial domain division (division in both spatial and temporal domains) for mBL equation, and divides the velocity potential field of each time slice into two parts: the high-velocity field and the low-velocity field. For the high-velocity field (the low-velocity field) of the time slice to be solved, DF-ParPINN first selected 95000 datasets from the high-velocity field (the low-velocity field) of the time slice to be solved, then selected 5000 datasets from high-velocity fields (the low-velocity field) of all previous time slices, a total of 100000 datasets were selected as training sets, and selected 10000 datasets from the high-velocity field (the low-velocity field) of the time slice to be solved. Unlike cPINN, which only uses a single server to train and test the overall high-velocity field and the overall low-velocity field, DF-ParPINN uses multiple servers to train and test the high-velocity field and the low-velocity field separately in parallel, to improve the training and testing speed under the spatial-temporal division strategy.</p>
<p>For mBL equation, cPINN divides the velocity potential field of all time slices based on the velocity threshold of the last time slice, and DF-ParPINN divides the velocity potential field of each time slice based on the velocity threshold of each time slice. Because the velocity potential value of no space point is equal to the velocity threshold, there is no boundary point and boundary domain when the velocity potential field is divided based on the velocity threshold, and there is no sub-neural network for the boundary domain.</p>
<p>In solving equations, PINN uses relative error to measure the accuracy of the solution. Therefore, in solving mBL equation, the five algorithms continue to use relative error to measure the accuracy of the velocity potential field solved. In this paper, the relative error is the matrix of two norms between the algorithm prediction solution and the pseudo-spectral method numerical solution. The smaller the relative error is, the higher the accuracy of the prediction solution is, and the better the performance of the algorithm is. For the algorithms that use temporal-spatial domain division, the relative error of the velocity potential field of the time slice to be solved is shown as follows:</p>
<disp-formula id="eq22">
<label>(22)</label>
<mml:math display="block" id="M18">
<mml:mrow>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>h</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq23-24">
<label>(23, 24)</label>
<mml:math display="block" id="M19">
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>n</mml:mi>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mi>h</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>n</mml:mi>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq15">Equations 23</xref>, <xref ref-type="disp-formula" rid="eq23-24">24</xref>, <italic>error</italic> is the relative error of the velocity potential field of the time slice to be solved, <italic>error<sub>h</sub>
</italic> is the relative error of the high-velocity field of the time slice to be solved, <italic>error<sub>l</sub>
</italic> is the relative error of the low-velocity field of the time slice to be solved, <italic>count<sub>h</sub>
</italic> is the number of space points of the overall high-velocity field (cPINN) or the number of space points of the high-velocity field of the time slice to be solved (DF-ParPINN). <italic>count<sub>l</sub>
</italic> is the number of space points in the overall low-velocity field (cPINN) or the number of space points in the low-velocity field of the time slice to be solved (DF-ParPINN), and <italic>count</italic> is the number of space points in the overall velocity potential field (cPINN) or the number of space points in the velocity potential field of the time slice to be solved (DF-ParPINN).</p>
</sec>
<sec id="s4_3_2">
<label>4.3.2</label>
<title>Experimental results</title>
<p>After the above settings, five algorithms are trained separately on the same mBL equation data set, and partial time slice data is selected for testing. The relative errors of the five algorithms are shown in <xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref>:</p>
<table-wrap id="T6" position="float">
<label>Table&#xa0;6</label>
<caption>
<p>Relative errors of the five algorithms (contrast experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Algorithm</th>
<th valign="top" align="center">t=750s</th>
<th valign="top" align="center">t=1500s</th>
<th valign="top" align="center">t=2250s</th>
<th valign="top" align="center">t=3000s</th>
<th valign="top" align="center">t=3750s</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">PINN (<xref ref-type="bibr" rid="B20">Raissi et&#xa0;al., 2019</xref>)</td>
<td valign="middle" align="center">0.9902</td>
<td valign="middle" align="center">0.9910</td>
<td valign="middle" align="center">0.9908</td>
<td valign="middle" align="center">0.9904</td>
<td valign="middle" align="center">0.9900</td>
</tr>
<tr>
<td valign="middle" align="center">PIRNN (<xref ref-type="bibr" rid="B26">Wu et&#xa0;al., 2023</xref>)</td>
<td valign="middle" align="center">0.9037</td>
<td valign="middle" align="center">0.9208</td>
<td valign="middle" align="center">0.8774</td>
<td valign="middle" align="center">0.8621</td>
<td valign="middle" align="center">0.8572</td>
</tr>
<tr>
<td valign="middle" align="center">cPINN (<xref ref-type="bibr" rid="B5">Jagtap et&#xa0;al., 2020</xref>)</td>
<td valign="middle" align="center">1.8960</td>
<td valign="middle" align="center">0.9453</td>
<td valign="middle" align="center">0.6099</td>
<td valign="middle" align="center">0.4315</td>
<td valign="middle" align="center">0.3419</td>
</tr>
<tr>
<td valign="middle" align="center">DeepONet (<xref ref-type="bibr" rid="B11">Lu et&#xa0;al., 2019</xref>)</td>
<td valign="middle" align="center">1.0798</td>
<td valign="middle" align="center">1.0400</td>
<td valign="middle" align="center">1.0214</td>
<td valign="middle" align="center">1.0175</td>
<td valign="middle" align="center">1.0100</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>DF-ParPINN</bold>
</td>
<td valign="middle" align="center">
<bold>0.1056</bold>
</td>
<td valign="middle" align="center">
<bold>0.1272</bold>
</td>
<td valign="middle" align="center">
<bold>0.1048</bold>
</td>
<td valign="middle" align="center">
<bold>0.1127</bold>
</td>
<td valign="middle" align="center">
<bold>0.1194</bold>
</td>
</tr>
</tbody>
<tbody>
<tr>
<th valign="middle" align="center">Algorithms</th>
<th valign="middle" align="center">t=4500s</th>
<th valign="middle" align="center">t=5250s</th>
<th valign="middle" align="center">t=6000s</th>
<th valign="middle" align="center">t=6750s</th>
<th valign="middle" align="center">t=7500s</th>
</tr>
</tbody>
<tbody>
<tr>
<td valign="middle" align="center">PINN (<xref ref-type="bibr" rid="B20">Raissi et&#xa0;al., 2019</xref>)</td>
<td valign="middle" align="center">0.9896</td>
<td valign="middle" align="center">0.9893</td>
<td valign="middle" align="center">0.9891</td>
<td valign="middle" align="center">0.9886</td>
<td valign="middle" align="center">0.9891</td>
</tr>
<tr>
<td valign="middle" align="center">PIRNN (<xref ref-type="bibr" rid="B26">Wu et&#xa0;al., 2023</xref>)</td>
<td valign="middle" align="center">0.8607</td>
<td valign="middle" align="center">0.8762</td>
<td valign="middle" align="center">0.8999</td>
<td valign="middle" align="center">0.9200</td>
<td valign="middle" align="center">0.9062</td>
</tr>
<tr>
<td valign="middle" align="center">cPINN (<xref ref-type="bibr" rid="B5">Jagtap et&#xa0;al., 2020</xref>)</td>
<td valign="middle" align="center">0.3736</td>
<td valign="middle" align="center">0.4264</td>
<td valign="middle" align="center">0.4887</td>
<td valign="middle" align="center">0.5539</td>
<td valign="middle" align="center">0.6307</td>
</tr>
<tr>
<td valign="middle" align="center">DeepONet (<xref ref-type="bibr" rid="B11">Lu et&#xa0;al., 2019</xref>)</td>
<td valign="middle" align="center">1.0115</td>
<td valign="middle" align="center">1.0110</td>
<td valign="middle" align="center">1.0090</td>
<td valign="middle" align="center">1.0114</td>
<td valign="middle" align="center">1.0156</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>DF-ParPINN</bold>
</td>
<td valign="middle" align="center">
<bold>0.1604</bold>
</td>
<td valign="middle" align="center">
<bold>0.1866</bold>
</td>
<td valign="middle" align="center">
<bold>0.2255</bold>
</td>
<td valign="middle" align="center">
<bold>0.2564</bold>
</td>
<td valign="middle" align="center">
<bold>0.2895</bold>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="fnT1_1">
<p>Bold representsthe lowest relative errors.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The solution time of the five algorithms is shown in <xref ref-type="table" rid="T7">
<bold>Table&#xa0;7</bold>
</xref>:</p>
<table-wrap id="T7" position="float">
<label>Table&#xa0;7</label>
<caption>
<p>Solution time of the five algorithms (contrast experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Algorithm</th>
<th valign="top" align="center">t=750s</th>
<th valign="top" align="center">t=1500s</th>
<th valign="top" align="center">t=2250s</th>
<th valign="top" align="center">t=3000s</th>
<th valign="top" align="center">t=3750s</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">PINN (<xref ref-type="bibr" rid="B20">Raissi et&#xa0;al., 2019</xref>)</td>
<td valign="middle" align="center">0.0246s</td>
<td valign="middle" align="center">0.0226s</td>
<td valign="middle" align="center">0.0243s</td>
<td valign="middle" align="center">0.0156s</td>
<td valign="middle" align="center">0.0138s</td>
</tr>
<tr>
<td valign="middle" align="center">PIRNN (<xref ref-type="bibr" rid="B26">Wu et&#xa0;al., 2023</xref>)</td>
<td valign="middle" align="center">0.0302s</td>
<td valign="middle" align="center">0.0103s</td>
<td valign="middle" align="center">0.0102s</td>
<td valign="middle" align="center">0.0104s</td>
<td valign="middle" align="center">0.0097s</td>
</tr>
<tr>
<td valign="middle" align="center">cPINN (<xref ref-type="bibr" rid="B5">Jagtap et&#xa0;al., 2020</xref>)</td>
<td valign="middle" align="center">0.0342s</td>
<td valign="middle" align="center">0.0316s</td>
<td valign="middle" align="center">0.0308s</td>
<td valign="middle" align="center">0.0667s</td>
<td valign="middle" align="center">0.0369s</td>
</tr>
<tr>
<td valign="middle" align="center">DeepONet (<xref ref-type="bibr" rid="B11">Lu et&#xa0;al., 2019</xref>)</td>
<td valign="middle" align="center">0.0186s</td>
<td valign="middle" align="center">0.0016s</td>
<td valign="middle" align="center">0.0013s</td>
<td valign="middle" align="center">0.0014s</td>
<td valign="middle" align="center">0.0012s</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>DF-ParPINN</bold>
</td>
<td valign="middle" align="center">
<bold>0.0258s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0232s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0167s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0259s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0155s</bold>
</td>
</tr>
</tbody>
<tbody>
<tr>
<th valign="middle" align="center">Algorithms</th>
<th valign="middle" align="center">t=4500s</th>
<th valign="middle" align="center">t=5250s</th>
<th valign="middle" align="center">t=6000s</th>
<th valign="middle" align="center">t=6750s</th>
<th valign="middle" align="center">t=7500s</th>
</tr>
</tbody>
<tbody>
<tr>
<td valign="middle" align="center">PINN (<xref ref-type="bibr" rid="B20">Raissi et&#xa0;al., 2019</xref>)</td>
<td valign="middle" align="center">0.0136s</td>
<td valign="middle" align="center">0.0129s</td>
<td valign="middle" align="center">0.0132s</td>
<td valign="middle" align="center">0.0131s</td>
<td valign="middle" align="center">0.0131s</td>
</tr>
<tr>
<td valign="middle" align="center">PIRNN (<xref ref-type="bibr" rid="B26">Wu et&#xa0;al., 2023</xref>)</td>
<td valign="middle" align="center">0.0116s</td>
<td valign="middle" align="center">0.0093s</td>
<td valign="middle" align="center">0.0108s</td>
<td valign="middle" align="center">0.0129s</td>
<td valign="middle" align="center">0.0127s</td>
</tr>
<tr>
<td valign="middle" align="center">cPINN (<xref ref-type="bibr" rid="B5">Jagtap et&#xa0;al., 2020</xref>)</td>
<td valign="middle" align="center">0.0369s</td>
<td valign="middle" align="center">0.0375s</td>
<td valign="middle" align="center">0.0308s</td>
<td valign="middle" align="center">0.0285s</td>
<td valign="middle" align="center">0.0307s</td>
</tr>
<tr>
<td valign="middle" align="center">DeepONet (<xref ref-type="bibr" rid="B11">Lu et&#xa0;al., 2019</xref>)</td>
<td valign="middle" align="center">0.0013s</td>
<td valign="middle" align="center">0.0013s</td>
<td valign="middle" align="center">0.0012s</td>
<td valign="middle" align="center">0.0012s</td>
<td valign="middle" align="center">0.0013s</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>DF-ParPINN</bold>
</td>
<td valign="middle" align="center">
<bold>0.0199s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0142s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0155s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0235s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0175s</bold>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="fnT7_1">
<p>Bold representsthe lowest relative errors.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Where, t=750s is the 6th time slice, t=1500s is the 11st time slice, t=2250s is the 16th time slice, t=3000s is the 21st time slice, t=3750s is the 26th time slice, t=4500s is the 31st time slice, t=5250s is the 36th time slice, t=6000s is the 41st time slice, t=6750s is the 46th time slice, t=7500s is the 51st time slice.</p>
<p>It can be clearly seen from <xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref> that compared with PINN, PIRNN, cPINN, and DeepONet, DFParPINN has absolute accuracy advantages in solving mBL equation, which proves that DF-ParPINN is the most effective. It also can be clearly seen from <xref ref-type="table" rid="T7">
<bold>Table&#xa0;7</bold>
</xref> that the average solution time of the five algorithms is no more than 0.5s, much faster than 9.4 minutes of the pseudo-spectral method, which proves that DF-ParPINN is very efficient.</p>
</sec>
</sec>
<sec id="s4_4">
<label>4.4</label>
<title>Ablation study</title>
<sec id="s4_4_1">
<label>4.4.1</label>
<title>Experimental setup</title>
<p>In addition to comparison experiments, we also conducted ablation experiments to further verify the effectiveness of DF-ParPINN. The ablation experiments adopt module ablation and include three modules. Temporal-spatial division module of overall velocity potential field is the first module, data rational selection module of multiple time slices is the second module, parallel computation module of high-velocity fields and low-velocity fields is the third module. The first module is the premise for the second and the third module, without the first module there can be no the second and the third module. The second module can be divided into the first submodule data rational selection and the second submodule data focus. The second module can be divided into the first submodule data focus and the second submodule data rational selection. The first submodule is the premise of the second submodule data, without the first submodule there is no second submodule. Therefore, five ablation algorithms can be set up. The differences between the five algorithms are shown in <xref ref-type="table" rid="T8">
<bold>Table&#xa0;8</bold>
</xref>:</p>
<table-wrap id="T8" position="float">
<label>Table&#xa0;8</label>
<caption>
<p>Differences between the five algorithms (ablation experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Algorithm</th>
<th valign="top" align="center">First module</th>
<th valign="top" align="left">First submodule of second module</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">DF-ParPINN-1a</td>
<td valign="top" align="center">&#x2713;</td>
<td valign="middle" align="center">&#x2713;</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1b</td>
<td valign="top" align="center">&#x2713;</td>
<td valign="middle" align="center">&#xd7;</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-12</td>
<td valign="top" align="center">&#x2713;</td>
<td valign="middle" align="center">&#x2713;</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1a3</td>
<td valign="top" align="center">&#x2713;</td>
<td valign="middle" align="center">&#x2713;</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1b3</td>
<td valign="top" align="center">&#x2713;</td>
<td valign="middle" align="center">&#xd7;</td>
</tr>
</tbody>
<tbody>
<tr>
<th valign="middle" align="center">Algorithm</th>
<th valign="top" align="center">Second submodule of second module</th>
<th valign="middle" align="center">Third module</th>
</tr>
</tbody>
<tbody>
<tr>
<td valign="top" align="center">DF-ParPINN-1a</td>
<td valign="top" align="center">&#xd7;</td>
<td valign="middle" align="center">&#xd7;</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1b</td>
<td valign="top" align="center">&#xd7;</td>
<td valign="top" align="center">&#xd7;</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-12</td>
<td valign="middle" align="center">&#x2713;</td>
<td valign="top" align="center">&#xd7;</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1a3</td>
<td valign="top" align="center">&#xd7;</td>
<td valign="top" align="center">&#x2713;</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1b3</td>
<td valign="top" align="center">&#xd7;</td>
<td valign="top" align="center">&#x2713;</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The input and output of the five algorithms are shown in <xref ref-type="table" rid="T9">
<bold>Table&#xa0;9</bold>
</xref>:</p>
<table-wrap id="T9" position="float">
<label>Table&#xa0;9</label>
<caption>
<p>Input and output of the five algorithms (ablation experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Algorithm</th>
<th valign="top" align="center">Input</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">DF-ParPINN-1a</td>
<td valign="top" align="center">Partial data set of high-velocity field (or low-velocity field) of time slice to be solved and all previous time slices</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1b</td>
<td valign="top" align="center">Partial data set of high-velocity field (or low-velocity field) of all previous time slices</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-12</td>
<td valign="top" align="center">Partial data set of high-velocity field (or low-velocity field) of time slice to be solved and all previous time slices</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1a3</td>
<td valign="top" align="center">Partial data set of high-velocity field (or low-velocity field) of time slice to be solved and all previous time slices</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1b3</td>
<td valign="top" align="center">Partial data set of high-velocity field (or low-velocity field) of all previous time slices</td>
</tr>
</tbody>
<tbody>
<tr>
<th valign="top" align="center">Algorithm</th>
<th valign="top" align="center">Output</th>
</tr>
</tbody>
<tbody>
<tr>
<td valign="top" align="center">DF-ParPINN-1a</td>
<td valign="top" align="center">High-velocity field (or low-velocity field) of time slice to be solved</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1b</td>
<td valign="top" align="center">High-velocity field (or low-velocity field) of time slice to be solved</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-12</td>
<td valign="top" align="center">High-velocity field (or low-velocity field) of time slice to be solved</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1a3</td>
<td valign="top" align="center">High-velocity field (or low-velocity field) of time slice to be solved</td>
</tr>
<tr>
<td valign="top" align="center">DF-ParPINN-1b3</td>
<td valign="top" align="center">High-velocity field (or low-velocity field) of time slice to be solved</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The detailed settings of five algorithms are shown in <xref ref-type="table" rid="T10">
<bold>Table&#xa0;10</bold>
</xref>:</p>
<table-wrap id="T10" position="float">
<label>Table&#xa0;10</label>
<caption>
<p>Detailed settings of five algorithms (ablation experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Algorithm</th>
<th valign="top" align="center">Training instances</th>
<th valign="top" align="center">Testing instances</th>
<th valign="top" align="center">Epochs</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">DF-ParPINN-1a</td>
<td valign="middle" align="center">100000</td>
<td valign="middle" align="center">10000</td>
<td valign="middle" align="center">5000</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1b</td>
<td valign="middle" align="center">100000</td>
<td valign="middle" align="center">10000</td>
<td valign="middle" align="center">5000</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-12</td>
<td valign="middle" align="center">100000</td>
<td valign="middle" align="center">10000</td>
<td valign="middle" align="center">5000</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1a3</td>
<td valign="middle" align="center">100000</td>
<td valign="middle" align="center">10000</td>
<td valign="middle" align="center">5000</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1b3</td>
<td valign="middle" align="center">100000</td>
<td valign="middle" align="center">10000</td>
<td valign="middle" align="center">5000</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Both the training set and the test set of the five algorithms belong to the same data set, both follow the principle of random selection, and the data contained in both are not repeated.</p>
<p>DF-ParPINN-1a or DF-ParPINN-1a3 do not select data from datasets of the time slice to be solved and datasets of all previous time slices according to the 95000:5000 allocation rule, but more focus on selecting data from datasets of the time slices to be solved. For the high-velocity field (the low-velocity field) of the time slice to be solved, the algorithm first selected 50000 datasets from the high-velocity field (the low-velocity field) of the time slice to be solved, then selected 50000 datasets from high-velocity fields (low-velocity fields) of all previous time slices, a total of 100000 datasets were selected as training sets, and selected 10000 datasets from the high-velocity field (the low-velocity field) of the time slice to be solved as test sets. DF-ParPINN-1a3 also uses different servers to solve high-velocity and low-velocity fields.</p>
<p>DF-ParPINN-1b or DF-ParPINN-1b3 do not select data from datasets of the time slice to be solved and datasets of all previous time slices according to the 95000:5000 allocation rule, and do not focus on selecting data from datasets of the time slices to be solved. For the high-velocity field (the low-velocity field) of the time slice to be solved, the algorithm selected directly 100000 datasets from all high-velocity fields (all low-velocity fields) of all time slices as training sets, and selected 10000 datasets from the high-velocity field (the low-velocity field) of the time slice to be solved as test sets.DF-ParPINN-1b3 also uses different servers to solve high-velocity and low-velocity fields.</p>
<p>DF-ParPINN-12 selects data from datasets of the time slice to be solved and datasets of all previous time slices according to the 95000:5000 allocation rule. For the high-velocity field (the low-velocity field) of the time slice to be solved, the algorithm first selected 5000 datasets from the high-velocity field (the low-velocity field) of the time slice to be solved, then selected 95000 datasets from high-velocity fields (low-velocity fields) of all previous time slices, a total of 100000 datasets were selected as training sets, and selected 10000 datasets from the high-velocity field (the low-velocity field) of the time slice to be solved as test sets. DF-ParPINN-1a3 does not use different servers to solve high-velocity and low-velocity fields.</p>
<p>In solving mBL equation, we still use relative error to measure the accuracy of the velocity potential field solved by the five algorithms. For DF-ParPINN, the relative error of the velocity potential field of the time slice to be solved is shown in <xref ref-type="disp-formula" rid="eq22">Equation 22</xref>).</p>
</sec>
<sec id="s4_4_2">
<label>4.4.2</label>
<title>Experimental results</title>
<p>After the above settings, five algorithms are trained separately on the same mBL equation data set, and partial time slice data is selected for testing. With the addition of DF-ParPINN, the relative errors of the six algorithms are shown in <xref ref-type="table" rid="T11">
<bold>Table&#xa0;11</bold>
</xref>:</p>
<table-wrap id="T11" position="float">
<label>Table&#xa0;11</label>
<caption>
<p>Relative errors of the six algorithms (ablation experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Algorithm</th>
<th valign="middle" align="center">t=750s</th>
<th valign="middle" align="center">t=1500s</th>
<th valign="middle" align="center">t=2250s</th>
<th valign="middle" align="center">t=3000s</th>
<th valign="middle" align="center">t=3750s</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">DF-ParPINN-1a or DF-ParPINN-1a3</td>
<td valign="middle" align="center">0.3466</td>
<td valign="middle" align="center">0.3134</td>
<td valign="middle" align="center">0.2916</td>
<td valign="middle" align="center">0.2954</td>
<td valign="middle" align="center">0.2898</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1b or DF-ParPINN-1b3</td>
<td valign="middle" align="center">0.5511</td>
<td valign="middle" align="center">0.5572</td>
<td valign="middle" align="center">0.5024</td>
<td valign="middle" align="center">0.5394</td>
<td valign="middle" align="center">0.5143</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>DF-ParPINN or DF-ParPINN-12</bold>
</td>
<td valign="middle" align="center">
<bold>0.1056</bold>
</td>
<td valign="middle" align="center">
<bold>0.1275</bold>
</td>
<td valign="middle" align="center">
<bold>0.1048</bold>
</td>
<td valign="middle" align="center">
<bold>0.1129</bold>
</td>
<td valign="middle" align="center">
<bold>0.12</bold>
</td>
</tr>
</tbody>
<tbody>
<tr>
<th valign="middle" align="center">Algorithms</th>
<th valign="middle" align="center">t=4500s</th>
<th valign="middle" align="center">t=5250s</th>
<th valign="middle" align="center">t=6000s</th>
<th valign="middle" align="center">t=6750s</th>
<th valign="middle" align="center">t=7500s</th>
</tr>
</tbody>
<tbody>
<tr>
<td valign="middle" align="center">DF-ParPINN-1a or DF-ParPINN-1a3</td>
<td valign="middle" align="center">0.3012</td>
<td valign="middle" align="center">0.3199</td>
<td valign="middle" align="center">0.3321</td>
<td valign="middle" align="center">0.3463</td>
<td valign="middle" align="center">0.3558</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1b or DF-ParPINN-1b3</td>
<td valign="middle" align="center">0.5099</td>
<td valign="middle" align="center">0.5212</td>
<td valign="middle" align="center">0.5278</td>
<td valign="middle" align="center">0.5401</td>
<td valign="middle" align="center">0.5518</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>DF-ParPINN or DF-ParPINN-12</bold>
</td>
<td valign="middle" align="center">
<bold>0.1601</bold>
</td>
<td valign="middle" align="center">
<bold>0.1861</bold>
</td>
<td valign="middle" align="center">
<bold>0.2298</bold>
</td>
<td valign="middle" align="center">
<bold>0.252</bold>
</td>
<td valign="middle" align="center">
<bold>0.2894</bold>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="fnT11_1">
<p>Bold representsthe lowest relative errors.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The solution time of the six algorithms is shown in <xref ref-type="table" rid="T12">
<bold>Table&#xa0;12</bold>
</xref>:</p>
<table-wrap id="T12" position="float">
<label>Table&#xa0;12</label>
<caption>
<p>Solution time of the six algorithms (ablation experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Algorithm</th>
<th valign="top" align="center">t=750s</th>
<th valign="top" align="center">t=1500s</th>
<th valign="top" align="center">t=2250s</th>
<th valign="top" align="center">t=3000s</th>
<th valign="top" align="center">t=3750s</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">DF-ParPINN-1a</td>
<td valign="middle" align="center">0.0542s</td>
<td valign="middle" align="center">0.0309s</td>
<td valign="middle" align="center">0.0294s</td>
<td valign="middle" align="center">0.0312s</td>
<td valign="middle" align="center">0.0377s</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1b</td>
<td valign="middle" align="center">0.0285s</td>
<td valign="middle" align="center">0.0264s</td>
<td valign="middle" align="center">0.0336s</td>
<td valign="middle" align="center">0.0264s</td>
<td valign="middle" align="center">0.0269s</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-12</td>
<td valign="middle" align="center">0.0514s</td>
<td valign="middle" align="center">0.0344s</td>
<td valign="middle" align="center">0.0303s</td>
<td valign="middle" align="center">0.0402s</td>
<td valign="middle" align="center">0.0286s</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1a3</td>
<td valign="middle" align="center">0.0312s</td>
<td valign="middle" align="center">0.0258s</td>
<td valign="middle" align="center">0.0159s</td>
<td valign="middle" align="center">0.0168s</td>
<td valign="middle" align="center">0.0193s</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1b3</td>
<td valign="middle" align="center">0.0143s</td>
<td valign="middle" align="center">0.0136s</td>
<td valign="middle" align="center">0.0205s</td>
<td valign="middle" align="center">0.0136s</td>
<td valign="middle" align="center">0.0138s</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>DF-ParPINN</bold>
</td>
<td valign="middle" align="center">
<bold>0.0258s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0232s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0167s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0259s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0155s</bold>
</td>
</tr>
</tbody>
<tbody>
<tr>
<th valign="middle" align="center">Algorithms</th>
<th valign="middle" align="center">t=4500s</th>
<th valign="middle" align="center">t=5250s</th>
<th valign="middle" align="center">t=6000s</th>
<th valign="middle" align="center">t=6750s</th>
<th valign="middle" align="center">t=7500s</th>
</tr>
</tbody>
<tbody>
<tr>
<td valign="middle" align="center">DF-ParPINN-1a</td>
<td valign="middle" align="center">0.0399s</td>
<td valign="middle" align="center">0.0384s</td>
<td valign="middle" align="center">0.0332s</td>
<td valign="middle" align="center">0.0318s</td>
<td valign="middle" align="center">0.0313s</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1b</td>
<td valign="middle" align="center">0.0283s</td>
<td valign="middle" align="center">0.0317s</td>
<td valign="middle" align="center">0.0666s</td>
<td valign="middle" align="center">0.0804s</td>
<td valign="middle" align="center">0.0285s</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-12</td>
<td valign="middle" align="center">0.0359s</td>
<td valign="middle" align="center">0.0273s</td>
<td valign="middle" align="center">0.0295s</td>
<td valign="middle" align="center">0.0403</td>
<td valign="middle" align="center">0.0323s</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1a3</td>
<td valign="middle" align="center">0.0260s</td>
<td valign="middle" align="center">0.0230s</td>
<td valign="middle" align="center">0.0167s</td>
<td valign="middle" align="center">0.0159s</td>
<td valign="middle" align="center">0.0161s</td>
</tr>
<tr>
<td valign="middle" align="center">DF-ParPINN-1b3</td>
<td valign="middle" align="center">0.0145s</td>
<td valign="middle" align="center">0.0180s</td>
<td valign="middle" align="center">0.0494s</td>
<td valign="middle" align="center">0.0668s</td>
<td valign="middle" align="center">0.0148</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>DF-ParPINN</bold>
</td>
<td valign="middle" align="center">
<bold>0.0199s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0142s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0155s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0235s</bold>
</td>
<td valign="middle" align="center">
<bold>0.0175s</bold>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="fnT12_1">
<p>Bold representsthe lowest relative errors.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>It can be clearly seen from <xref ref-type="table" rid="T11">
<bold>Table&#xa0;11</bold>
</xref> that compared with DF-ParPINN-1a, DF-ParPINN-1b, DF-ParPINN1a3, and DF-ParPINN-1b3, DF-ParPINN and DF-ParPINN-12 have same absolute accuracy advantages in solving mBL equation, which proves that DF-ParPINN is the most effective. It also can be clearly seen from <xref ref-type="table" rid="T12">
<bold>Table&#xa0;12</bold>
</xref> that the average solution time of DF-ParPINN, DF-ParPINN-1a, DF-ParPINN-1b, DF-ParPINN-12, DF-ParPINN-1a3 and DF-ParPINN-1b3 is 0.0198s, 0.0358s, 0.0207s, 0.0350s and 0.0239s respectively, and the average solution time of DF-ParPINN is the shortest, which proves that DF-ParPINN is the most efficient.</p>
</sec>
</sec>
<sec id="s4_5">
<label>4.5</label>
<title>Depth study</title>
<sec id="s4_5_1">
<label>4.5.1</label>
<title>Experimental setup</title>
<p>Unlike PINN, PIRNN, cPINN, and DeepONet, which use only one optimizer for training, DF-ParPINN can use both LBFGS and Adam optimizers for deep training. First use LBFGS efficient training, when the epochs reach 10000, the loss no longer decreases. Then use Adam to continue training, until the loss is almost no longer decreasing.</p>
</sec>
<sec id="s4_5_2">
<label>4.5.2</label>
<title>Experimental results</title>
<p>Taking the velocity potential field at t=7500s (51st time slice) of mBL equation as an example, the depth training of DF-ParPINN was conducted. The training set is consistent with the description in 4.2.1, while the test set changes to all 400762 datasets of high-velocity field at t=7500s and all 123526 datasets of low-velocity field at t=7500s. The relative errors in different training stages are shown in <xref ref-type="table" rid="T13">
<bold>Table&#xa0;13</bold>
</xref>:</p>
<table-wrap id="T13" position="float">
<label>Table&#xa0;13</label>
<caption>
<p>Relative errors in different training stages (depth experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">epochs=10000</th>
<th valign="top" align="center">epochs=50000</th>
<th valign="top" align="center">epochs=100000</th>
<th valign="top" align="center">epochs=200000</th>
<th valign="top" align="center">epochs=300000</th>
<th valign="top" align="center">epochs=400000</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">0.2772</td>
<td valign="top" align="center">0.14</td>
<td valign="top" align="center">0.1278</td>
<td valign="top" align="center">0.1193</td>
<td valign="top" align="center">0.1141</td>
<td valign="top" align="center">0.1104</td>
</tr>
</tbody>
<tbody>
<tr>
<th valign="top" align="center">epochs=500000</th>
<th valign="top" align="center">epochs=600000</th>
<th valign="top" align="center">epochs=700000</th>
<th valign="top" align="center">epochs=800000</th>
<th valign="top" align="center">epochs=900000</th>
<th valign="top" align="center">epochs=1000000</th>
</tr>
</tbody>
<tbody>
<tr>
<td valign="top" align="center">0.1076</td>
<td valign="top" align="center">0.1055</td>
<td valign="top" align="center">0.1034</td>
<td valign="top" align="center">0.1003</td>
<td valign="top" align="center">0.0987</td>
<td valign="top" align="center">0.0966</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The solution time in different training stages is shown in <xref ref-type="table" rid="T14">
<bold>Table&#xa0;14</bold>
</xref>:</p>
<table-wrap id="T14" position="float">
<label>Table&#xa0;14</label>
<caption>
<p>Solution time in different training stages (depth experiments).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<td valign="top" align="center">epochs=10000</td>
<th valign="top" align="center">epochs=50000</th>
<th valign="top" align="center">epochs=100000</th>
<th valign="top" align="center">epochs=200000</th>
<th valign="top" align="center">epochs=300000</th>
<th valign="top" align="center">epochs=400000</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">0.1311s</td>
<td valign="top" align="center">0.1218s</td>
<td valign="top" align="center">0.1210s</td>
<td valign="top" align="center">0.1188s</td>
<td valign="top" align="center">0.1187s</td>
<td valign="top" align="center">0.1182s</td>
</tr>
</tbody>
<tbody>
<tr>
<th valign="top" align="center">epochs=500000</th>
<th valign="top" align="center">epochs=600000</th>
<th valign="top" align="center">epochs=700000</th>
<th valign="top" align="center">epochs=800000</th>
<th valign="top" align="center">epochs=900000</th>
<th valign="top" align="center">epochs=1000000</th>
</tr>
</tbody>
<tbody>
<tr>
<td valign="top" align="center">0.1198s</td>
<td valign="top" align="center">0.1197s</td>
<td valign="top" align="center">0.1196s</td>
<td valign="top" align="center">0.1197s</td>
<td valign="top" align="center">0.1195s</td>
<td valign="top" align="center">0.1312s</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Finally, after deep training 1000000 epochs, the velocity potential field t=7500s solved by DF-ParPINN is shown in the left part of <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>, and the velocity potential field t=7500s solved by the pseudo-spectral method is shown in the right part of <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>:</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Velocity potential field at t=7500s solved by two algorithms.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-11-1309775-g007.tif"/>
</fig>
<p>Comparing the left and right parts of <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>, the velocity potential field solved by DF-ParPINN after deep training 1000000 epochs almost fits the velocity potential field solved by the pseudo-spectral method, which further proves DF-ParPINN is very effective. It also can be clearly seen from <xref ref-type="table" rid="T14">
<bold>Table&#xa0;14</bold>
</xref> that the average solution time of DF-ParPINN after deep training is still no more than 0.5s, much faster than 9.4 minutes of the pseudo-spectral method, which proves that DF-ParPINN is very efficient.</p>
</sec>
</sec>
</sec>
<sec id="s5" sec-type="discussion">
<label>5</label>
<title>Discussion</title>
<sec id="s5_1">
<label>5.1</label>
<title>Compared with advanced deep learning PDE solvers</title>
<p>mBL equation is a high-dimensional non-convex function with three-dimensional spatiotemporal variables, and high-dimensional non-convex optimization problems are NP-hard problems that are difficult to solve accurately. Therefore, PINN is easy to fall into the local optimal solution when solving mBL equations, so it is difficult to obtain the exact solution, so the overall accuracy of PINN is not ideal.</p>
<p>Compared with PINN, PIRNN uses RNN to replace the DNN in PINN. The circular structure of RNN allows information to be passed between different time steps, captures long-term dependencies, and exploits contextual information. These make RNN better model the timing relationship of velocity potential fields in different time slices, and then improve the solving accuracy, so the overall accuracy of PIRNN is higher than that of PINN.</p>
<p>Compared with PINN, cPINN uses the same spatial domain partitioning strategy for velocity potential fields in different time slices, and divides the overall velocity potential field into two parts: the overall high-velocity field and the overall low-velocity field, which have different spatial characteristics. Therefore, first solving the overall high-velocity field and the overall low-velocity field, then combining them can reduce the difficulty of solving, and then improve the solving accuracy, so the overall accuracy of cPINN is higher than that of PINN.</p>
<p>DeepONet does not use the corresponding physical information to assist in solving mBL equations, and the complex high-dimensional characteristics of mBL equations are very challenging for DeepONet neural operators. As a result, it is difficult for DeepONet to accurately capture all the details and features of mBL equation, so the overall accuracy of DeepONet is lower than other algorithms.</p>
<p>DF-ParPINN uses three modules: the temporal-spatial division module of the overall velocity potential field, the data rational selection module of multiple time slices, and the parallel computation module of high-velocity and low-velocity fields. These modules improve the PINN, to a certain extent, and solve the following three problems that exist when the PINN solves PDEs: difficult to solve complex PDEs with high-dimensional non-convex properties, difficult to transfer the physical information of boundary points and initial points, and difficult to train the automatic derivative network quickly at a low cost. Therefore, DF-ParPINN greatly improves the accuracy of solving the mBL equation, so the overall accuracy of DF-ParPINN is higher than that of other algorithms.</p>
</sec>
<sec id="s5_2">
<label>5.2</label>
<title>Compared with DF-ParPINN with different modules</title>
<p>DF-ParPINN-1a or DF-ParPINN-1a3 uses the temporal-spatial division module of overall velocity potential field, but uses only the data focus submodule of the data rational selection module of multiple time slices. Because the amount of data selected from the velocity potential field of the time slice to be solved is the same as the velocity potential fields of all previous time slices, the physical information of the velocity potential field of the time slice to be solved is not utilized to the maximum extent, so their accuracy is not ideal.</p>
<p>Compared with DF-ParPINN-1a, DF-ParPINN-1a3 also uses the parallel computation module of highvelocity fields and low-velocity fields, replacing the serial computation of a single server used by the DF-ParPINN-1a with parallel computation of multiple servers, which greatly reduces the training time and significantly reduces the solution time.</p>
<p>DF-ParPINN-1b or DF-ParPINN-1b3 uses the temporal-spatial division module of overall velocity potential field, but does not use the data rational selection module of multiple time slices. Due to the lack of focused and reasonable distribution of training data, the physical information of velocity potential fields of all previous time slices is overused, so their accuracy is not ideal.</p>
<p>Compared with DF-ParPINN-1b, DF-ParPINN-1b3 also uses the parallel computation module of highvelocity fields and low-velocity fields, replacing the serial computation of a single server used by the DF-ParPINN-1b with parallel computation of multiple servers, which greatly reduces the training time and significantly reduces the solution time.</p>
<p>Compared with DF-ParPINN, DF-ParPINN-12 just doesn&#x2019;t use the parallel computation module of high-velocity fields and low-velocity fields, instead using a single server for serial computation. Therefore, the solution accuracy of both is the same, but the training time of DF-ParPINN-12 is much larger than that of DF-ParPINN, and the solution time is significantly larger than that of DF-ParPINN.</p>
<p>DF-ParPINN uses all three modules, and to a certain extent solves the three problems that exist when PINN solves PDE, so the accuracy of DF-ParPINN is the highest.</p>
</sec>
<sec id="s5_3">
<label>5.3</label>
<title>Compared with DF-ParPINN after deep training</title>
<p>DF-ParPINN trained only 5000 epochs using the LBFGS optimizer, and the training loss only converges to a local minimum, so the accuracy of DF-ParPINN is not very low.</p>
<p>DF-ParPINN after deep training uses LBFGS and Adam two optimizers to train more than 10000 epochs, and when epochs reach 1000000 the training loss almost converges to the global minimum, so the accuracy of DF-ParPINN after deep training is close to ideal.</p>
</sec>
<sec id="s5_4">
<label>5.4</label>
<title>Limitations of DF-ParPINN</title>
<p>First, DF-ParPINN needs to perform the temporal-spatial division of the PDE. If there are too many time slices of the PDE or the space field shape of each time slice is irregular, it is difficult to perform the temporal-spatial division.</p>
<p>Secondly, DF-ParPINN needs to perform the data rational selection of different time slices, which depends on the temporal-spatial division of the PDE. If the time dimension reduction is unsuccessful, it is difficult to perform the data rational selection.</p>
<p>Finally, DF-ParPINN needs to perform the parallel computation of different types of fields, which also depends on the temporal-spatial division of the PDE, and if the spatial division is not successful, it is difficult to perform the parallel computation.</p>
<p>Therefore, some very complex high-dimensional PDEs in real-world applications have no regular shape, the current DF-ParPINN has difficulty solving them.</p>
</sec>
</sec>
<sec id="s6" sec-type="conclusions">
<label>6</label>
<title>Conclusion</title>
<p>In order to solve mBL equation, a high-dimensional PDE with complex structures, quickly and accurately, and achieve a new breakthrough in solving complex PDE of the physical ocean field by using deep learning technology, we propose &#x201c;DF-ParPINN: parallel PINN based on velocity potential field division and single time slice focus&#x201d;. DF-ParPINN consists of three modules: temporal-spatial division module of overall velocity potential field, rational selection module of multiple time slices data, and parallel computation module of high-velocity fields and low-velocity fields, each of them respectively realizes the optimization of the high-dimensional non-convex equation, the deep transmission of effective physical information, the low cost and fast training of the network, to varying degrees. The core of DF-ParPINN is parallel physics-informed neural networks of different servers, they are used separately to solve the high-velocity field and low-velocity field. The experimental results show that the solution time of DF-ParPINN is no more than 0.5s, and its accuracy is much higher than that of PINN, PIRNN, cPINN, and DeepONet. Moreover, the relative error of DF-ParPINN after deep training 1000000 epochs can be reduced to less than 0.1. With the help of neural operators and other methods, continue to improve DF-ParPINN, so that it can solve more complex mBL equations more accurately and quickly, which will be our future research direction.</p>
</sec>
<sec id="s7" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s8" sec-type="author-contributions">
<title>Author contributions</title>
<p>JC: Conceptualization, Data curation, Formal analysis, Methodology, Software, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. CY: Conceptualization, Resources, Validation, Writing &#x2013; review &amp; editing. JX: Funding acquisition, Methodology, Resources, Validation, Writing &#x2013; review &amp; editing. PB: Data curation, Software, Writing &#x2013; review &amp; editing. ZW: Funding acquisition, Resources, Writing &#x2013; review &amp; editing.</p>
</sec>
</body>
<back>
<sec id="s9" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This research was supported in part by the Key Research and Development Projects of Shandong Province (2019JMRH0109).</p>
</sec>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Abel</surname> <given-names>G. P.</given-names>
</name>
<name>
<surname>Roca</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Peraire</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Sarrate</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2013</year>). <source>Defining Quality Measures for Validation and Generation of High-Order Tetrahedral Meshes</source> (<publisher-loc>Hoboken</publisher-loc>: <publisher-name>John Wiley and Sons Ltd</publisher-name>).</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Benney</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Luke</surname> <given-names>J. C.</given-names>
</name>
</person-group> (<year>1964</year>). <article-title>On the interactions of permanent waves of finite amplitude</article-title>. <source>Stud. Appl. Mathematics</source>. <volume>43</volume> (<issue>1-4</issue>), <fpage>309</fpage>&#x2013;<lpage>313</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sapm1964431309</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>X. H.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Pang</surname> <given-names>Y. F.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Gong</surname> <given-names>C. Y.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Developing a new mesh quality evaluation method based on convolutional neural network</article-title>. <source>Eng. Appl. Comput. Fluid Mechanics</source> <volume>14</volume>, <fpage>391</fpage>&#x2013;<lpage>400</lpage>. doi: <pub-id pub-id-type="doi">10.1080/19942060.2020.1720820</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Arnulf</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Weinan</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Solving high-dimensional partial differential equations using deep learning</article-title>. <source>Proc. Natl. Acad. Sci</source>. <volume>115</volume> (<issue>34</issue>), <fpage>8505</fpage>&#x2013;<lpage>8510</lpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.1718942115</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jagtap</surname> <given-names>A. D.</given-names>
</name>
<name>
<surname>Kharazmi</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Karniadakis</surname> <given-names>G. E.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Conservative physics-informed neural networks on discrete domains for conservation laws: Applications to forward and inverse problems</article-title>. <source>Comput. Methods Appl. Mechanics Eng.</source> <volume>365</volume>, <fpage>113028</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cma.2020.113028</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Kadomtsev</surname> <given-names>B. B.</given-names>
</name>
<name>
<surname>Petviashvili</surname> <given-names>V. I.</given-names>
</name>
</person-group> (<year>1970</year>). <source>On the stability of solitarywaves inweakly dispersive media</source>. (<publisher-name>Russian Academy of Sciences, SPB</publisher-name>)</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Katz</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Sankaran</surname> <given-names>V.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Mesh quality effects on the accuracy of cfd solutions on unstructured meshes</article-title>. <source>J. Comput. Phys.</source> <volume>230</volume>, <fpage>7670</fpage>&#x2013;<lpage>7686</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jcp.2011.06.023</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Ai for science: Innovate the future together - 2022 zhongguancun forum series activities &#x201c;science intelligence summit&#x201d; held</article-title>. <source>Zhongguancun</source> <volume>2</volume>, <fpage>40</fpage>&#x2013;<lpage>41</lpage>.</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>C. S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Physics-informed neural networks: Recent advances and prospects</article-title>. <source>Comput. Sci</source>. <volume>49</volume>(<issue>4</issue>), <fpage>254</fpage>&#x2013;<lpage>262</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.11896/jsjkx.210500158</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lu</surname> <given-names>J. F.</given-names>
</name>
<name>
<surname>Guan</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2004</year>). <source>Numerical Solving Methods of Partial Differential Equations</source>. <edition>2nd</edition> (<publisher-loc>Beijing</publisher-loc>: <publisher-name>Tsinghua University Press</publisher-name>).</citation>
</ref>
<ref id="B11">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Karniadakis</surname> <given-names>G. E.</given-names>
</name>
</person-group> (<year>2019</year>). <source>Deeponet: Learning nonlinear operators for identifying differential equations based on the universal approximation theorem of operators</source>. <publisher-name>ArXiv, ITH</publisher-name>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname> <given-names>Z. B.</given-names>
</name>
<name>
<surname>Qu</surname> <given-names>J. H.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>H.</given-names>
</name>
<name>
<surname>He</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>B. J.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Q. L.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Surrogate modeling for physical fields of heat transfer processes based on physics-informed neural network</article-title>. <source>CIESC J</source>. <volume>72</volume> (<issue>3</issue>), <fpage>1496</fpage>&#x2013;<lpage>1503</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.11949/0438-1157.20201879</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Molinet</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Saut</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Tzvetkov</surname> <given-names>N.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Global well-posedness for the kp-ii equation on the background of a non-localized solution</article-title>. <source>Commun. Math. Phys.</source> <volume>28</volume>, <fpage>653</fpage>&#x2013;<lpage>676</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.anihpc.2011.04.004</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nabian</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Meidani</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A deep learning solution approach for highdimensional random differential equations - sciencedirect</article-title>. <source>Probabilistic Eng. Mechanics</source> <volume>57</volume>, <fpage>14</fpage>&#x2013;<lpage>25</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.probengmech.2019.05.001</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ockendon</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Howison</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lacey</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Movchan</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2003</year>). <source>Applied Partial Differential Equations</source> (<publisher-loc>New York</publisher-loc>: <publisher-name>Oxford University Press</publisher-name>).</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raissi</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Karniadakis</surname> <given-names>G. E.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Hidden physics models: Machine learning of nonlinear partial differential equations</article-title>. <source>J. Comput. Phys.</source> <volume>357</volume>, <fpage>125</fpage>&#x2013;<lpage>141</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jcp.2017.11.039</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raissi</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Perdikaris</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Karniadakis</surname> <given-names>G. E.</given-names>
</name>
</person-group> (<year>2017</year>a). <article-title>Numerical gaussian processes for time-dependent and non-linear partial differential equations</article-title>. <source>Siam J. Sci. Computing</source> <volume>40</volume>, <fpage>A172</fpage>&#x2013;<lpage>A198</lpage>. doi: <pub-id pub-id-type="doi">10.1137/17M1120762</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Raissi</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Perdikaris</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Karniadakis</surname> <given-names>G. E.</given-names>
</name>
</person-group> (<year>2017</year>b). <source>Physics informed deep learning (part I): Data-driven solutions of nonlinear partial differential equations</source>. <publisher-name>ArXiv, ITH</publisher-name>.</citation>
</ref>
<ref id="B19">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Raissi</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Perdikaris</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Karniadakis</surname> <given-names>G. E.</given-names>
</name>
</person-group> (<year>2017</year>c). <source>Physics informed deep learning (part II): Data-driven discovery of nonlinear partial differential equations</source>. <publisher-name>ArXiv, ITH</publisher-name>.</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raissi</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Perdikaris</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Karniadakis</surname> <given-names>G. E.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Physics-informed neural networks: A deep learning framework for solving forward and inverse problems involving nonlinear partial differential equations</article-title>. <source>J. Comput. Phys.</source> <volume>378</volume>, <fpage>686</fpage>&#x2013;<lpage>707</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jcp.2018.10.045</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<collab>Science</collab>
</person-group> (<year>2016</year>). <article-title>Science publishes 125 cutting-edge questions in science</article-title>. <source>Field Vision</source> <volume>2</volume>, <fpage>54</fpage>&#x2013;<lpage>55</lpage>.</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shao</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lei</surname> <given-names>Y. M.</given-names>
</name>
<name>
<surname>Lan</surname> <given-names>H. Q.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Traveltime calculation for complex models based on physicsinformed neural networks</article-title>. <source>Prog. Geophysics</source>. <volume>37</volume> (<issue>5</issue>), <fpage>1840</fpage>&#x2013;<lpage>1853</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.6038/pg2022FF0474</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname> <given-names>Z. C.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>The third scientific method &#x2013; scientific calculation in the computer age</article-title>. <source>Encyclopedic Knowledge</source> <volume>3</volume>, <fpage>9</fpage>&#x2013;<lpage>11</lpage>.</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Deep-learning-based inverse modeling approaches: A subsurface flow example</article-title>. <source>John Wiley Sons Ltd</source>. <volume>126</volume> (<issue>2</issue>), <elocation-id>e2020JB020549</elocation-id>. doi: <pub-id pub-id-type="doi">10.1029/2020JB020549</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Weinan</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Jentzen</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Deep learning-based numerical methods for high-dimensional parabolic partial differential equations and backward stochastic differential equations</article-title>. <volume>5</volume>(<issue>4</issue>), <fpage>349</fpage>&#x2013;<lpage>380</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s40304-017-0117-6</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Yion</surname> <given-names>W. T. G.</given-names>
</name>
<name>
<surname>Dang</surname> <given-names>K. L. N. Q.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Physics-informed machine learning for mpc: Application to a batch crystallization process</article-title>. <source>Chem. Eng. Res. Design</source> <volume>192</volume>, <fpage>556</fpage>&#x2013;<lpage>569</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cherd.2023.02.048</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Dl-pde: Deep-learning based data-driven discovery of partial differential equations from discrete and noisy data</article-title>. <source>Commun. Comput. Phys.</source> <volume>29</volume>, <fpage>698</fpage>&#x2013;<lpage>728</lpage>. doi: <pub-id pub-id-type="doi">10.4208/cicp.OA-2020-0142</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yuan</surname> <given-names>C. X.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>On diffraction and oblique interactions of horizontally two-dimensional internal solitary waves</article-title>. <source>J. Fluid Mechanics</source>. <volume>936</volume>, <fpage>A20</fpage>. doi: <pub-id pub-id-type="doi">10.1017/jfm.2022.60</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zheng</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>Y. Y.</given-names>
</name>
<name>
<surname>Feudal</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Viscous regularization pinn algorithm for shallow water wave equations</article-title>. <source>Chin. J. Comput. Phys</source>. <volume>40</volume> (<issue>3</issue>), <fpage>314</fpage>&#x2013;<lpage>324</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.19596/j.cnki.1001-246x.8592</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>