<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2025.1665305</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Research on intelligent predicting method of underwater acoustic field based on physics-informed neural network</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Chen</surname><given-names>Lei</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3109353/overview"/>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname><given-names>Lin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Sun</surname><given-names>Xuehai</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2995250/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Duan</surname><given-names>Jiaxi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Yin</surname><given-names>Lijun</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Zheng</surname><given-names>Xinshuo</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Chen</surname><given-names>Jie</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Navy Submarine Academy</institution>, <city>Qingdao</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>Qingdao Institute of Collaborative Innovation</institution>, <city>Qingdao</city>,&#xa0;<country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Lei Chen, <email xlink:href="mailto:chenlei00430@163.com">chenlei00430@163.com</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2025-12-18">
<day>18</day>
<month>12</month>
<year>2025</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2025</year>
</pub-date>
<volume>12</volume>
<elocation-id>1665305</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>07</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>21</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>19</day>
<month>11</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Chen, Zhang, Sun, Duan, Yin, Zheng and Chen.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Chen, Zhang, Sun, Duan, Yin, Zheng and Chen</copyright-holder>
<license>
<ali:license_ref start_date="2025-12-18">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>In the context of the rapid development of computer hardware and the continuous improvement of the artificial intelligence and deep learning theory, aiming at the traditional numerical solution method to solve the underwater acoustic fluctuation equation with large computational volume and the limitation of using various acoustic propagation models. We use the numerical solution calculated by the KRAKEN based on the normal mode theory, which is widely used in low-frequency shallow water waveguides, and combine it with the idea of solving the retarded envelope function in the parabolic equation theory. We propose a physical information neural network (PINN)-based method for intelligent prediction of the acoustic field using the elliptic fluctuation equation as the controlling equation. We conduct experiments under water body sound velocity varying stratified waveguide, to validate the model forecasting effect. It is experimentally verified that an effectively trained PINN network model can forecast the sound field at any given range. The predicted sound field can be used for a wide range of applications, such as sound source localisation and sonar range estimation.</p>
</abstract>
<kwd-group>
<kwd>wave equation</kwd>
<kwd>KRAKEN</kwd>
<kwd>envelope function</kwd>
<kwd>PINN</kwd>
<kwd>sound field prediction</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declare that no financial support was received for the research and/or publication of this article.</funding-statement>
</funding-group>
<counts>
<fig-count count="14"/>
<table-count count="4"/>
<equation-count count="27"/>
<ref-count count="31"/>
<page-count count="19"/>
<word-count count="11510"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Physical Oceanography</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>In the field of underwater acoustics, two methods are usually used to study the propagation of acoustic signals in seawater media. The first method is wave theory, which applies rigorous mathematical methods, combined with known fixed solution conditions, to solve the wave equation and study the change of amplitude and phase of acoustic signals in space. The second method is ray theory, in which the propagation of sound waves in a seawater medium is regarded as the propagation of sound lines in the medium in the high-frequency case; the change of sound intensity, the propagation time, and the propagation range of the sound lines in space are studied. Due to the approximation of ray theory, it is difficult to apply it in low-frequency shallow water conditions, and the importance of wave theory is particularly prominent in the context of the increasingly low frequency of sonar action. How to be able to solve the fluctuation equations accurately and quickly has become the focus of research by scholars in various countries.</p>
<p>As shown in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>, under the assumption of linear acoustics, the basic control equation of underwater sound propagation, the wave equation (WE), can be obtained according to the equation of motion, continuity equation, and state equation. Due to the spatial and temporal complexity of the wave equation, it is difficult to solve it directly. Generally, the strategy adopted in practice is to convert the Fourier transform to the frequency domain to obtain the Helmholtz equation (HE) (<xref ref-type="bibr" rid="B13">Jensen et&#xa0;al., 2011</xref>).</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Methods for solving underwater acoustic wave theory.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g001.tif">
<alt-text content-type="machine-generated">Flowchart of equations and solutions: Motion, Continuity, and State Equations lead to the Wave Equation (WE), then to the Helmholtz Equation (HE). From HE, solutions branch to direct and indirect. Direct leads to Wavenumber Integration (WI). Indirect leads to Normal Modes (NM) and Parabolic Equation (PE). NM branches to Coupled, Adiabatic, and Ray-Normal Modes; PE to Hybrid Theory, which includes Normal Modes-Parabolic among others.</alt-text>
</graphic></fig>
<p>Approaches to solving the Helmholtz equation are divided into two methods: direct and indirect. Solving the Helmholtz equation directly is difficult in practical applications, and the amount of computation is still staggering even today, despite the rapid development of computers. <xref ref-type="bibr" rid="B16">Liu et&#xa0;al. (2021)</xref> used the second-order and fourth-order difference formats to solve the Helmholtz equation directly for Lloyd&#x2019;s mirror example with analytical solution, which took more than 1 hour and more than 1,000 iterations to reach convergence on a computer with 360 CPU cores, and the accuracy basically meets the requirements compared with the analytical solution, which is less usable in the actual sound field calculation.</p>
<p>Most of the solution ideas are solved by various simplified theories of Helmholtz equations; in the process of long-term exploration, simplified models based on the wavenumber integration (WI) theory (<xref ref-type="bibr" rid="B25">Schmidt and Glattetre, 1985</xref>), the normal mode (NM) theory (<xref ref-type="bibr" rid="B8">Godin, 1992</xref>), and the parabolic equation (PE) theory (<xref ref-type="bibr" rid="B1">Collis et&#xa0;al., 2008</xref>) are used. At present, most of the numerical solution methods are based on the development of the above theories or a combination of each other; these methods have their own advantages and disadvantages, and restrictions on the use of conditions, and there is no model that can be applied in any case.</p>
<p>Traditional numerical methods for solving partial differential equations (PDEs) are essentially solved discretely. For example, the finite difference method (FDM) (<xref ref-type="bibr" rid="B27">Stephen, 1988</xref>) solves partial differential equations by replacing differentiation with a difference approximation of the derivatives at grid points. The finite element method (FEM) (<xref ref-type="bibr" rid="B28">Thompson, 2006</xref>) solves the problem by dividing the solution domain into a finite number of small elements and then approximating the functional form of the solution on the elements. The finite volume method (FVM) (<xref ref-type="bibr" rid="B6">Fogarty and LeVeque, 1999</xref>) is based on the concept of control volume and divides the solution domain into multiple control volumes. The spectrum method (SM) (<xref ref-type="bibr" rid="B29">Tu et&#xa0;al., 2023</xref>) uses global basis functions (e.g., sine and cosine functions) to approximate the solution. Methods such as the boundary element method (BEM) (<xref ref-type="bibr" rid="B18">Lu et&#xa0;al., 2008</xref>) are widely used for solving PDEs, transforming the problem into integral equations on the boundary and discretizing only the boundary. These numerical discretization methods are currently widely used in underwater acoustic propagation model calculations and have an irreplaceable role for a short period of time.</p>
<p>With the continuous development of artificial intelligence (AI) and deep learning (DL), the application of AI is not only limited to traditional tasks such as computer vision, natural language processing, and speech recognition; the application of AI in various disciplines is more and more extensive, and the combination of AI and other disciplines has become one of the main research directions in this field. The combination of artificial intelligence and other disciplines has become one of the main research directions in this field. One of the applications of combining AI with mathematics, physics, and other disciplines is solving partial differential equations (<xref ref-type="bibr" rid="B9">Han et&#xa0;al., 2018</xref>).</p>
<p>In 1989, Cybenko (<xref ref-type="bibr" rid="B2">Cybenko, 1989</xref>) proved that a perceptron neural network with hidden layers has the ability to approximate any function when the activation function is a Sigmoid function, and in 1991, <xref ref-type="bibr" rid="B10">Hornik et&#xa0;al. (1989)</xref> further proved that the same applies when the activation function is any non-constant function. This is the fundamental theoretical basis of deep learning, universal approximation theorem (UAT), which describes the property that feedforward neural networks with a sufficient number of hidden units can approximate any continuous function to arbitrary accuracy, which is also known as the theoretical basis for neural networks to be able to solve PDEs.</p>
<p>With the rapid development of computer hardware technology and the arrival of the era of big data and deep learning, deep learning frameworks such as TensorFlow (<xref ref-type="bibr" rid="B3">Dean and Monga, 2015</xref>), PyTorch (<xref ref-type="bibr" rid="B21">Paszke, 2019</xref>), and PaddlePaddle (<xref ref-type="bibr" rid="B19">Ma et&#xa0;al., 2019</xref>) have been gradually generated, perfected, and developed, and AI is rapidly becoming a powerful tool for solving complex scientific problems. In particular, the application of AI is opening up new possibilities in the field of solving PDEs. The core of the emerging field of artificial intelligence for partial differential equations (AI4PDE) lies in the use of neural networks and other machine learning techniques to approximate the solution of PDEs, a method called a deep learning solver. Deep learning solvers are able to learn from data and automatically capture complex patterns and features of the problem to provide faster and more accurate solutions than traditional numerical methods.</p>
<p><xref ref-type="bibr" rid="B24">Raissi et&#xa0;al. (2019)</xref> proposed physics-informed neural network (PINN), compared with the traditional purely data-driven neural network, by adding the difference between the physical equations before and after the iteration to the loss function of the neural network so that the physical equations are also &#x201c;involved&#x201d; in the training process, so that the neural network optimizes not only the network itself but also the difference between each iteration of the physical equations during the training iteration, and so that the final training result is to satisfy the physical laws at the same time. Compared with the traditional purely data-driven neural network, by adding the difference of the physical equations before and after the iteration to the loss function of the neural network, the physical equations are also &#x201c;involved&#x201d; in the training process so that the neural network optimizes not only its own loss function but also the difference of the physical equations in each iteration of the training iteration and so that the final training result is to satisfy the laws of physics and, at the same time, use fewer data samples to learn the model with a more generalization ability. This approach is known as the physics-driven approach, and PINN has been applied to quite a number of scientific and engineering problems, such as solving the Navier&#x2013;Stokes equations, Schr&#xf6;dinger&#x2019;s equations, and Maxwell&#x2019;s system of equations. In addition, PINN can solve not only forward problems but also inverse problems. Among them, the forward problem mainly refers to the prediction of the sound field at different locations given the environmental information, and the inverse problem mainly refers to the inverse performance of the environmental information parameters from the information of the measured sound field data, and so on.</p>
<p>As shown in <xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>, in contrast, there is also a class of methods that simply use labeled data for PDE solving, which are generally referred to as data-driven methods. This class of methods does not need to use the physical equations at all, but rather uses neural networks as operator approximators to solve parametric PDEs, using large amounts of labeled data to learn a direct mapping from the PDE parameters to the equation solutions. This includes Deep Operator Network (DeepONet) proposed by <xref ref-type="bibr" rid="B17">Lu et&#xa0;al. (2019)</xref> and Fourier Neural Operator (FNO) proposed by <xref ref-type="bibr" rid="B15">Li et&#xa0;al. (2020)</xref>. However, in the actual complex underwater acoustic modeling process, the cost of obtaining valuable tagged data is often high, and the tagged data usually contain noise. Due to the main reliance on data-driven models, when the available labeled data are small or contain a lot of noise, the trained model has low accuracy and poor generalization ability, and at the same time, purely relying on data-driven models also lacks physical interpretability; thus, these methods have more limitations in practical applications and are currently only used for solving simpler PDE problems with a large amount of valuable labeled data. How to make full use of physical information to solve PDEs with high accuracy when there are little or no labeled data is a key issue to be solved.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Physics-driven approach <italic>vs</italic>. data-driven approach.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g002.tif">
<alt-text content-type="machine-generated">Comparison chart of physics-driven and data-driven approaches across various dimensions. Physics-driven: Core Logic is constrained by physical equations; Information Dependence uses limited labeled data and physical laws; Generalization is strong, adapting to complex scenarios but less accurate with insufficient data; Physical Interpretability is high, following physical laws; Applicable Scenarios involve high data acquisition cost; Core Advantages include low data demand and anti-interference; Core Limitations require domain physical knowledge. Data-driven: Core Logic uses pure statistical learning; Information Dependence requires large-scale high-quality labeled data; Generalization is weak, depending on data distribution; Physical Interpretability is low; Applicable Scenarios involve easily accessible data; Core Advantages include easy implementation; Core Limitations involve poor accuracy with insufficient data.</alt-text>
</graphic></fig>
<p>In the course of previous research, there have been many scholars who have solved the underwater acoustic propagation problem by means of deep learning. <xref ref-type="bibr" rid="B14">Li and Chitre (2023)</xref> combined PINN with ray acoustics to propose a ray basis neural network (RBNN) and compared it with traditional data-driven machine learning methods&#x2014;Gaussian process regression (GPR) and artificial neural network (ANN)&#x2014;for reasonable extrapolation outside the data collection area through four numerical case studies and one ANN. GPR and ANN for reasonable extrapolation outside the data collection area, and the feasibility and applicability of the method are demonstrated through four numerical case studies and one controlled experiment. <xref ref-type="bibr" rid="B4">Du et&#xa0;al. (2023)</xref> proposed a physics-informed neural network (UAFP-PINN) using the COMSOL software to place a point source at the edge of the simulated two-dimensional (2D) and three-dimensional (3D) marine environment and to directly measure the acoustic field of a point source in the simulated 2D and 3D marine environment. A point source is placed at the edge of the simulated 2D and 3D ocean environment using the COMSOL software to directly solve the Helmholtz equation of the sound field, and the effectiveness of the method in forecasting the sound field is verified by comparison. <xref ref-type="bibr" rid="B20">Mallik et&#xa0;al. (2022)</xref> proposed a convolutional recurrent autoencoder network (CRAN) structure, which is a data-driven deep learning model for directly learning acoustic transmission loss in the far field. It is also proposed that the generalization ability of CRAN can be effectively improved by double-checking the errors in the validation set, appropriate hyperparameter tuning, and stopping the training of CRAN earlier. <xref ref-type="bibr" rid="B5">Duan et&#xa0;al. (2024)</xref> proposed a spatial domain decomposition-based physics-informed neural network (SPINN). By generating a range-independent sound field for the RAM model, by adding noise, and by inputting a noise-containing dataset for experiments, they quantitatively analyzed the effects of three influencing factors, namely, sound speed error, marine environmental noise, and observation noise, on the ability of SPINN to learn the sound field by means of root mean square error (RMSE), and compared it with the PINN without spatial domain decomposition. Comparison with PINN without spatial domain decomposition demonstrates the good performance of SPINN. <xref ref-type="bibr" rid="B7">Gao et&#xa0;al. (2024)</xref> proposed a fast computational method for underwater acoustic field based on PINNs, in which the frequency-domain Helmholtz equations, which represent the underwater acoustic propagation law, are encoded as physical neurons through automatic differentiation and combined with a small amount of measurement data as informative neurons to construct a physically informative and data-driven neural network to solve the underwater acoustic field. <xref ref-type="bibr" rid="B12">Huang et&#xa0;al. (2024)</xref> proposed a fast computational method for underwater acoustic field based on PINNs, in which the frequency-domain Helmholtz equations, which represent the underwater acoustic propagation law, are encoded as physical neurons through automatic differentiation and combined with a small amount of measurement data as informative neurons to construct a physically informative and data-driven neural network to solve the underwater acoustic field. <xref ref-type="bibr" rid="B12">Huang et&#xa0;al. (2024)</xref> proposed a fast broadband modeling method using a physics-informed neural network by integrating the modal equations of normal modes as a regular term in the loss function of the neural network, which enables fast broadband modeling of the underwater acoustic channel in the presence of sparse frequency sampling points.</p>
<p>In terms of the research content, the current research mainly shows the combination of numerical solution methods or deep learning solution methods with classical underwater acoustic propagation theory; the solution method and theory each belong to a dimension, and the combination of a solution method and a theory can produce a new underwater acoustic propagation model. As shown in <xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>, the research content of this paper mainly focuses on the combination of PINN with the theory of normal modes and the theory of parabolic equations.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Highlights of the research content of this paper (red areas).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g003.tif">
<alt-text content-type="machine-generated">Comparison table of methods for hydroacoustic propagation theory including numerical and artificial intelligence methods. Columns: Direct Solution, Wavenumber Integration, Normal Modes, and Parabolic Equation. Methods listed are Finite Difference, Finite Element, Spectrum, Finite Volume, Boundary Element, Machine Learning, and DeepONet/FNO. The intersection of &#x201c;Artificial Intelligence Methods&#x201d; and &#x201c;Parabolic Equation&#x201d; is highlighted in red, labeled as &#x201c;PINN."</alt-text>
</graphic></fig>
</sec>
<sec id="s2">
<label>2</label>
<title>PINN model structure and theory</title>
<p>As summarized in the preceding analysis, the current field of underwater acoustic field prediction faces three core challenges: traditional numerical methods (e.g., finite difference method and KRAKEN software based on NM theory) suffer from large computational volumes and poor adaptability to complex stratified waveguides; pure data-driven models (e.g., DeepONet) rely on massive labeled data, which are costly to acquire and noisy in real marine environments, leading to weak generalization; and existing PINNs mostly integrate only a single physical equation (e.g., Helmholtz equation), failing to leverage the multi-scale physical characteristics of underwater acoustic propagation and resulting in suboptimal accuracy in complex scenarios. To address these issues, this study proposes a systematic innovation centered on a dual-physics-constrained PINN framework, which fuses NM theory and PE theory.</p>
<p>The specific innovations are as follows: theoretically, NM theory is used to generate physically meaningful prior data (modal functions and horizontal wavenumbers of each order) via the KRAKEN software, avoiding the &#x201c;modal aliasing&#x201d; problem of existing PINNs caused by random prior data; PE theory converts rapidly fluctuating sound pressure signals into slowly varying envelope functions, reducing the difficulty of neural network learning and solving the convergence issue of direct sound pressure training; meanwhile, the elliptic fluctuation equation derived from PE theory is adopted as the control equation of PINN, which not only retains the computational advantages of parabolic approximation but also inherits the modal information of NM theory, avoiding the approximation errors or computational complexity of existing control equations (e.g., Helmholtz equation). Methodologically, the PINN loss function design is optimized: the total loss includes three components (data-driven term for fitting NM-derived envelope data, boundary constraint term for applying sea surface pressure release conditions, and physical constraint term for minimizing the residual of the elliptic fluctuation equation); considering that the physical constraint term is usually two orders of magnitude smaller than the other two terms, its weight is adjusted to prevent it from being &#x201c;overwhelmed&#x201d;, balancing data fitting and physical consistency, which is different from the equal-weight design of existing PINNs. Practically, the framework integrates seabed parameters through NM theory to adapt to stratified waveguide environments and relies on the physical prior information provided by NM and PE theories to reduce the demand for labeled data, enabling high-precision prediction without massive samples and lowering the cost of real-world deployment. This innovation not only addresses the aforementioned three challenges but also provides a more efficient and accurate technical path for practical applications such as sound source localization and sonar range estimation.</p>
<p>In the course of our research, we propose a deep learning approach to use PINN for forecasting the underwater sound field. While integrating the <italic>a priori</italic> information, PINN is fitted to a portion of the actual computed data. PINN utilizes envelope amplitude data at different depths for data fitting, which is its data-driven part. In addition to fitting the data at the sampling points, the PINN incorporates physical drivers, including the standard parabolic equations governing the PDEs themselves and the surface pressure release boundary conditions, to extend the sound field prediction to unknown points. The network requires a sound speed profile (SSP) and ocean substrate information (including density <italic>&#x3c1;</italic>, sound speed <italic>c</italic>, and attenuation coefficient <italic>&#x3b1;</italic>) as <italic>a priori</italic> information, and KRAKEN is used to compute the actual sound pressure data at the sampling points. According to the conclusion drawn by <xref ref-type="bibr" rid="B4">Du et&#xa0;al. (2023)</xref> in training the network, it can be seen that it is difficult to train the neural network directly using sound pressure data to converge to an exact solution due to the rapidly fluctuating nature of sound pressure data in a wide ocean environment with a range of kilometers, so we convert the rapidly varying sound pressure <inline-formula>
<mml:math display="inline" id="im1"><mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> into a slow-varying envelope function <inline-formula>
<mml:math display="inline" id="im2"><mml:mrow><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> and adding it to the neural network for training. After training, the PINN can predict the sound field at any <inline-formula>
<mml:math display="inline" id="im3"><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>. The predicted sound field is used in a wide range of applications, such as sound source localization and sonar action range estimation.</p>
<p>In the following, we will briefly introduce the principle of calculating sound pressure <inline-formula>
<mml:math display="inline" id="im4"><mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> by normal modes in Section 2.1. Section 2.2 illustrates the conversion relationship between sound pressure <inline-formula>
<mml:math display="inline" id="im5"><mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> and envelope function <inline-formula>
<mml:math display="inline" id="im6"><mml:mrow><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> and introduces the elliptic fluctuation equations. Section 2.3 explains the network design idea of PINN and the basic principle of how to sample and get the envelope function <inline-formula>
<mml:math display="inline" id="im7"><mml:mrow><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> by training.</p>
<sec id="s2_1">
<label>2.1</label>
<title>Calculation of sound pressure by normal mode theory</title>
<p>The normal mode theory was first proposed by Pekeris in 1948 (<xref ref-type="bibr" rid="B22">Pekeris, 1948</xref>) to solve the acoustic propagation problem in a range-independent environment, and nowadays, it is one of the classical theories for solving acoustic propagation problems in shallow water. With the development of computer technology, <xref ref-type="bibr" rid="B23">Porter (1992)</xref> developed the KRAKEN software based on the finite difference method, which has the advantages of computational stability, accuracy, and speed, and this model is one of the widely used numerical computation programs for normal modes in underwater acoustics.</p>
<p>A brief introduction to the normal mode theory for solving the sound field is given according to Section 5.2 of <italic>Computational Ocean Acoustics</italic> (Second Edition) (<xref ref-type="bibr" rid="B13">Jensen et&#xa0;al., 2011</xref>), and we start with the 2D Helmholtz equation, where the sound velocity and density depend only on the depth <italic>z</italic>:</p>
<disp-formula id="eq1"><label>(1)</label>
<mml:math display="block" id="M1"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>r</mml:mi></mml:mfrac><mml:mfrac><mml:mo>&#x2202;</mml:mo><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac><mml:mo>(</mml:mo><mml:mi>r</mml:mi><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:mi>&#x3c1;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mfrac><mml:mo>&#x2202;</mml:mo><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:mfrac><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>&#x3c1;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mfrac><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>z</mml:mi></mml:mrow></mml:mfrac><mml:mo>)</mml:mo><mml:mo>+</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mi>&#x3c9;</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:msup><mml:mi>c</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mfrac><mml:mi>p</mml:mi><mml:mo>=</mml:mo><mml:mo>&#x2212;</mml:mo><mml:mfrac><mml:mrow><mml:mi>&#x3b4;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mi>&#x3b4;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mi>z</mml:mi><mml:mi>s</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mrow><mml:mn>2</mml:mn><mml:mi>&#x3c0;</mml:mi><mml:mi>r</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:math>
</disp-formula>
<p>Use the technique of variable separation:</p>
<disp-formula id="eq2"><label>(2)</label>
<mml:math display="block" id="M2"><mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mtext>&#x3a6;</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mtext>&#x3a8;</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math>
</disp-formula>
<p>Substituting <xref ref-type="disp-formula" rid="eq2">Equation 2</xref> into <xref ref-type="disp-formula" rid="eq1">Equation 1</xref> and separating the constant <inline-formula>
<mml:math display="inline" id="im8"><mml:mrow><mml:msubsup><mml:mi>k</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula> yields</p>
<disp-formula id="eq3"><label>(3)</label>
<mml:math display="block" id="M3"><mml:mrow><mml:mi>&#x3c1;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mfrac><mml:mtext>d</mml:mtext><mml:mrow><mml:mtext>d</mml:mtext><mml:mi>z</mml:mi></mml:mrow></mml:mfrac><mml:mo>[</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:mi>&#x3c1;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mfrac><mml:mfrac><mml:mrow><mml:msub><mml:mrow><mml:mtext>d&#x3a8;</mml:mtext></mml:mrow><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mrow><mml:mtext>d</mml:mtext><mml:mi>z</mml:mi></mml:mrow></mml:mfrac><mml:mo>]</mml:mo><mml:mo>+</mml:mo><mml:mo>[</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mi>&#x3c9;</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:msup><mml:mi>c</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mfrac><mml:mo>&#x2212;</mml:mo><mml:msubsup><mml:mi>k</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup><mml:mo>]</mml:mo><mml:msub><mml:mtext>&#x3a8;</mml:mtext><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math>
</disp-formula>
<p>This is the most important equation in the theory of normal modes&#x2014;in the modal equation, <inline-formula>
<mml:math display="inline" id="im9"><mml:mtext>m</mml:mtext></mml:math></inline-formula> is the <inline-formula>
<mml:math display="inline" id="im10"><mml:mtext>m</mml:mtext></mml:math></inline-formula>th order mode, where <inline-formula>
<mml:math display="inline" id="im11"><mml:mrow><mml:msub><mml:mi>k</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the horizontal wavenumber, <inline-formula>
<mml:math display="inline" id="im12"><mml:mrow><mml:msub><mml:mtext>&#x3a8;</mml:mtext><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> is the mode function, and the above equation is the classical Sturm&#x2013;Liouville eigenvalue problem, where the goal is to find its eigenfunctions <inline-formula>
<mml:math display="inline" id="im13"><mml:mrow><mml:msub><mml:mtext>&#x3a8;</mml:mtext><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> and eigenvalues <inline-formula>
<mml:math display="inline" id="im14"><mml:mrow><mml:msubsup><mml:mi>k</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula>.</p>
<disp-formula id="eq4"><label>(4)</label>
<mml:math display="block" id="M4"><mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mfrac><mml:mi>i</mml:mi><mml:mrow><mml:mn>4</mml:mn><mml:mi>&#x3c1;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>z</mml:mi><mml:mi>s</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mfrac><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>&#x221e;</mml:mi></mml:munderover><mml:msub><mml:mtext>&#x3a8;</mml:mtext><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>z</mml:mi><mml:mtext>s</mml:mtext></mml:msub><mml:mo stretchy="false">)</mml:mo><mml:msub><mml:mtext>&#x3a8;</mml:mtext><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math>
</disp-formula>
<p>The sound pressure can be obtained by synthesizing the sound field through <xref ref-type="disp-formula" rid="eq4">Equation 4</xref> by simply requiring the modal function in <xref ref-type="disp-formula" rid="eq3">Equation 3</xref> with the horizontal wavenumber.</p>
<p>We use KRAKEN to calculate the modal functions and horizontal wavenumbers corresponding to each order of modes from the given SSP and environmental information such as ocean substrate information (including density <italic>&#x3c1;</italic>, sound speed <italic>c</italic>, and attenuation coefficient <italic>&#x3b1;</italic>), as well as reasonable settings of various parameters that may affect the number of modes <italic>m</italic> in the environment (env) file and the field (flp) file, such as the frequency f, the minimum phase velocity <inline-formula>
<mml:math display="inline" id="im15"><mml:mrow><mml:msub><mml:mi>c</mml:mi><mml:mrow><mml:mi>l</mml:mi><mml:mi>o</mml:mi><mml:mi>w</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>, and the maximum phase velocity <inline-formula>
<mml:math display="inline" id="im16"><mml:mrow><mml:msub><mml:mi>c</mml:mi><mml:mrow><mml:mi>h</mml:mi><mml:mi>i</mml:mi><mml:mi>g</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>. The modal function <inline-formula>
<mml:math display="inline" id="im17"><mml:mrow><mml:msub><mml:mtext>&#x3a8;</mml:mtext><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> and horizontal wavenumber <inline-formula>
<mml:math display="inline" id="im18"><mml:mrow><mml:msub><mml:mi>k</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> corresponding to each order mode are calculated, and the sound pressure is obtained through <xref ref-type="disp-formula" rid="eq4">Equation 4</xref>, which is used as the input quantity in Section 2.2.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Introduction of elliptic fluctuation equations</title>
<p>According to Section 6.2 of <italic>Computational Ocean Acoustics</italic> (Second Edition) (<xref ref-type="bibr" rid="B13">Jensen et&#xa0;al., 2011</xref>), the standard 2D Helmholtz equation in the column coordinate system is</p>
<disp-formula id="eq5"><label>(5)</label>
<mml:math display="block" id="M5"><mml:mrow><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>r</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>r</mml:mi></mml:mfrac><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>z</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:msubsup><mml:mi>k</mml:mi><mml:mn>0</mml:mn><mml:mn>2</mml:mn></mml:msubsup><mml:msup><mml:mi>n</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mi>p</mml:mi><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im19"><mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>&#xa0;</mml:mo></mml:mrow></mml:math></inline-formula> is the sound pressure, <inline-formula>
<mml:math display="inline" id="im20"><mml:mrow><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mo>=</mml:mo><mml:mi>&#x3c9;</mml:mi><mml:mo stretchy="false">/</mml:mo><mml:msub><mml:mi>c</mml:mi><mml:mn>0</mml:mn></mml:msub></mml:mrow></mml:math></inline-formula> is the reference wavenumber, and <inline-formula>
<mml:math display="inline" id="im21"><mml:mrow><mml:mi>n</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:msub><mml:mi>c</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mo stretchy="false">/</mml:mo><mml:mi>c</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> is the refractive index.</p>
<p>Take the solution of <xref ref-type="disp-formula" rid="eq5">Equation 5</xref> in the following form:</p>
<disp-formula id="eq6"><label>(6)</label>
<mml:math display="block" id="M6"><mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math>
</disp-formula>
<p>where the envelope function <inline-formula>
<mml:math display="inline" id="im22"><mml:mrow><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> is slowly varying with range and <inline-formula>
<mml:math display="inline" id="im23"><mml:mrow><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> satisfies the following Bessel differential equation:</p>
<disp-formula id="eq7"><label>(7)</label>
<mml:math display="block" id="M7"><mml:mrow><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>r</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>r</mml:mi></mml:mfrac><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:msubsup><mml:mi>k</mml:mi><mml:mn>0</mml:mn><mml:mn>2</mml:mn></mml:msubsup><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math>
</disp-formula>
<p>Substituting <xref ref-type="disp-formula" rid="eq6">Equation 6</xref> into <xref ref-type="disp-formula" rid="eq5">Equation 5</xref> and using the property of <inline-formula>
<mml:math display="inline" id="im24"><mml:mrow><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> in <xref ref-type="disp-formula" rid="eq7">Equation 7</xref> gives</p>
<disp-formula id="eq8"><label>(8)</label>
<mml:math display="block" id="M8"><mml:mrow><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>r</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mo>(</mml:mo><mml:mfrac><mml:mn>2</mml:mn><mml:mrow><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mfrac><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>r</mml:mi></mml:mfrac><mml:mo>)</mml:mo><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>z</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:msubsup><mml:mi>k</mml:mi><mml:mn>0</mml:mn><mml:mn>2</mml:mn></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msup><mml:mi>n</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>&#x2212;</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo><mml:mi>&#x3c8;</mml:mi><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math>
</disp-formula>
<p>Next, we take the far-field approximation <inline-formula>
<mml:math display="inline" id="im25"><mml:mrow><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo>&#x226b;</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo></mml:mrow></mml:math></inline-formula> at which point <inline-formula>
<mml:math display="inline" id="im26"><mml:mrow><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> can be replaced by its asymptotic form:</p>
<disp-formula id="eq9"><label>(9)</label>
<mml:math display="block" id="M9"><mml:mrow><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>&#x2243;</mml:mo><mml:msqrt><mml:mrow><mml:mfrac><mml:mn>2</mml:mn><mml:mrow><mml:mi>&#x3c0;</mml:mi><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:msqrt><mml:msup><mml:mtext>e</mml:mtext><mml:mrow><mml:mtext>i</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mfrac><mml:mi>&#x3c0;</mml:mi><mml:mn>4</mml:mn></mml:mfrac><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msup></mml:mrow></mml:math>
</disp-formula>
<p>The simplified elliptic fluctuation equation can be obtained by bringing <xref ref-type="disp-formula" rid="eq9">Equation 9</xref> into <xref ref-type="disp-formula" rid="eq8">Equation 8</xref>:</p>
<disp-formula id="eq10"><label>(10)</label>
<mml:math display="block" id="M10"><mml:mrow><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>r</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mn>2</mml:mn><mml:mtext>i</mml:mtext><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>z</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:msubsup><mml:mi>k</mml:mi><mml:mn>0</mml:mn><mml:mn>2</mml:mn></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msup><mml:mi>n</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>&#x2212;</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo><mml:mi>&#x3c8;</mml:mi><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math>
</disp-formula>
<p>The <xref ref-type="disp-formula" rid="eq10">Equation 10</xref> is the most important control equation in the PINN we designed and is also different from the direct use of <xref ref-type="disp-formula" rid="eq11">Equation 11</xref></p>
<disp-formula id="eq11"><label>(11)</label>
<mml:math display="block" id="M11"><mml:mrow><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>r</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>r</mml:mi></mml:mfrac><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>z</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:msup><mml:mi>k</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mi>p</mml:mi><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math>
</disp-formula>
<p>as the control equation (<xref ref-type="bibr" rid="B4">Du et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B5">Duan et&#xa0;al., 2024</xref>) in previous studies.</p>
<p>The sea surface pressure release boundary uses the first type of boundary conditions, also known as the Dirichlet boundary condition (DBC) as shown in <xref ref-type="disp-formula" rid="eq12">Equation 12</xref>:</p>
<disp-formula id="eq12"><label>(12)</label>
<mml:math display="block" id="M12"><mml:mrow><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mn>0</mml:mn><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math>
</disp-formula>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Network design for PINN</title>
<p>The biggest difference between PINN&#x2019;s ability to accurately solve PDEs and numerical methods is the application of the neural network&#x2019;s automatic differentiation (AD) technique. Unlike traditional analytic differentiation or numerical differentiation methods, automatic differentiation is able to automatically compute derivatives with arbitrary accuracy, which has a significant advantage, especially for complex function derivation. Automatic differentiation is used in deep learning to compute the gradient of the loss function with respect to the network parameters for parameter updating and optimization.</p>
<p>As shown in <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>, the structure of the PINN we designed mainly consists of an input layer, L hidden layers, and an output layer, with a total of <inline-formula>
<mml:math display="inline" id="im27"><mml:mrow><mml:mtext>L</mml:mtext><mml:mo>+</mml:mo><mml:mn>2</mml:mn></mml:mrow></mml:math></inline-formula> layers, where layer 0 is the input layer, layers 1 to L are the hidden layers, and layer <inline-formula>
<mml:math display="inline" id="im28"><mml:mrow><mml:mtext>L</mml:mtext><mml:mo>+</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></inline-formula> is the output layer. The number of neurons in the input layer is 2, which are range <italic>r</italic> and depth <italic>z</italic>. The L hidden layers are fully connected layers, where the number of neurons in the kth layer is <inline-formula>
<mml:math display="inline" id="im29"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>k</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula>. Since the envelope function <inline-formula>
<mml:math display="inline" id="im30"><mml:mrow><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> is complex, the neural network cannot be trained directly on the complex numbers, so it needs to be split into the real part <inline-formula>
<mml:math display="inline" id="im31"><mml:mrow><mml:msub><mml:mi>&#x3c8;</mml:mi><mml:mrow><mml:mtext>real</mml:mtext></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> and the imaginary part <inline-formula>
<mml:math display="inline" id="im32"><mml:mrow><mml:msub><mml:mi>&#x3c8;</mml:mi><mml:mrow><mml:mtext>imag</mml:mtext></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> and then trained; then, the number of neurons in the output layer is 2, which are <inline-formula>
<mml:math display="inline" id="im33"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>&#x3c8;</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mrow><mml:mtext>real</mml:mtext></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> and <inline-formula>
<mml:math display="inline" id="im34"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>&#x3c8;</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mrow><mml:mtext>imag</mml:mtext></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>The PINN structure designed in this paper. PINN, physics-informed neural network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g004.tif">
<alt-text content-type="machine-generated">Diagram illustrating a neural network combining physics-informed and data-informed methods. Inputs labeled r and z feed into a network with activation functions. The physics-informed part includes PDE and BC loss terms, using automatic differentiation. The data-informed part involves data loss. The neural network outputs real and imaginary components. A process of backpropagation updates weights until convergence is achieved with a condition check. Total loss combines physics and data losses, linked to the done state when conditions are met.</alt-text>
</graphic></fig>
<p>According to the conclusion of <xref ref-type="bibr" rid="B26">Song et&#xa0;al. (2022)</xref> for PINN solving Helmholtz equation, it can be seen that the use of adaptive sinusoidal activation function Sine can be a good solution to the frequency-domain wavefield problem, so we use <inline-formula>
<mml:math display="inline" id="im35"><mml:mrow><mml:mi>&#x3c3;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>x</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mtext>sin</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:mi>x</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> as the activation function; then, the computational structure of feedforward neural network as shown in <xref ref-type="disp-formula" rid="eq13">Equation 13</xref></p>
<disp-formula id="eq13"><label>(13)</label>
<mml:math display="block" id="M13"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>l</mml:mi><mml:mo>+</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mo>{</mml:mo><mml:mtable columnalign="left" equalrows="true" equalcolumns="true"><mml:mtr columnalign="left"><mml:mtd columnalign="left"><mml:mrow><mml:mi>&#x3c3;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mi>l</mml:mi></mml:msub><mml:msub><mml:mi>x</mml:mi><mml:mi>l</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>b</mml:mi><mml:mi>l</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo><mml:mo>,</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mi>l</mml:mi><mml:mo>=</mml:mo><mml:mn>0</mml:mn><mml:mo>&#x2192;</mml:mo><mml:mi>L</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mtd></mml:mtr><mml:mtr columnalign="left"><mml:mtd columnalign="left"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>l</mml:mi></mml:msub><mml:msub><mml:mi>x</mml:mi><mml:mi>l</mml:mi></mml:msub><mml:mo>,</mml:mo></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mi>l</mml:mi><mml:mo>=</mml:mo><mml:mi>L</mml:mi></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im36"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mi>l</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula>
<mml:math display="inline" id="im37"><mml:mrow><mml:msub><mml:mi>b</mml:mi><mml:mi>l</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> denote the weights and biases, respectively, from the <italic>l</italic>th layer to the <inline-formula>
<mml:math display="inline" id="im38"><mml:mrow><mml:mi>l</mml:mi><mml:mo>+</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></inline-formula>th layer.</p>
<p>For simple, physically meaningful PDE problems without the time term t, PINN can be trained by sampling only the interior and boundary points, under the control of PDEs and boundary conditions (BCs), allowing the network to learn the physical processes and extrapolate them for prediction. However, for the complex ocean acoustic propagation problem, it is difficult to use only the PDE loss term and BC loss term in the original PINN structure for purely physical driving to be effective, and in order to improve the accuracy of our prediction, it is necessary to use a part of the exact solution as the labeled data to incorporate the loss term as the data-driven part. Therefore, our loss function term <inline-formula>
<mml:math display="inline" id="im39"><mml:mrow><mml:mi>L</mml:mi><mml:mi>o</mml:mi><mml:mi>s</mml:mi><mml:msub><mml:mi>s</mml:mi><mml:mrow><mml:mi>T</mml:mi><mml:mi>o</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> consists of three parts as shown in <xref ref-type="disp-formula" rid="eq14">Equation 14</xref>.</p>
<disp-formula id="eq14"><label>(14)</label>
<mml:math display="block" id="M14"><mml:mrow><mml:mi>L</mml:mi><mml:mi>o</mml:mi><mml:mi>s</mml:mi><mml:msub><mml:mi>s</mml:mi><mml:mrow><mml:mi>T</mml:mi><mml:mi>o</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi></mml:mrow></mml:msub><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math>
</disp-formula>
<p>where each loss function is calculated using mean squared error (MSE) as shown in <xref ref-type="disp-formula" rid="eq15">Equations 15</xref>&#x2013;<xref ref-type="disp-formula" rid="eq17">17</xref>, with <inline-formula>
<mml:math display="inline" id="im40"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> being the loss of the data-driven term, <inline-formula>
<mml:math display="inline" id="im41"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> being the loss of the BC control term, and <inline-formula>
<mml:math display="inline" id="im42"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> being the loss of the PDE control term. The weights of each item are <inline-formula>
<mml:math display="inline" id="im43"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>, <inline-formula>
<mml:math display="inline" id="im44"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>, and <inline-formula>
<mml:math display="inline" id="im45"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>.</p>
<disp-formula id="eq15"><label>(15)</label>
<mml:math display="block" id="M15"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>m</mml:mi></mml:msub></mml:mrow></mml:mfrac><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>m</mml:mi></mml:msub></mml:mrow></mml:munderover><mml:mo>|</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>&#x3c8;</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mrow><mml:mtext>real</mml:mtext></mml:mrow><mml:mn>2</mml:mn></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msubsup><mml:mi>r</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mi>z</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi></mml:msubsup><mml:mo stretchy="false">)</mml:mo><mml:mo>+</mml:mo><mml:msubsup><mml:mover accent="true"><mml:mi>&#x3c8;</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mrow><mml:mtext>imag</mml:mtext></mml:mrow><mml:mn>2</mml:mn></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msubsup><mml:mi>r</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mi>z</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi></mml:msubsup><mml:mo stretchy="false">)</mml:mo><mml:mo>&#x2212;</mml:mo><mml:mo>|</mml:mo><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:msubsup><mml:mi>r</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mi>z</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi></mml:msubsup><mml:mo stretchy="false">)</mml:mo><mml:msup><mml:mo>|</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mo>|</mml:mo></mml:mrow></mml:math>
</disp-formula>
<disp-formula id="eq16"><label>(16)</label>
<mml:math display="block" id="M16"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>b</mml:mi></mml:msub></mml:mrow></mml:mfrac><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>b</mml:mi></mml:msub></mml:mrow></mml:munderover><mml:mo>|</mml:mo><mml:msub><mml:mi>B</mml:mi><mml:mi>&#x3c8;</mml:mi></mml:msub><mml:mo stretchy="false">[</mml:mo><mml:mover accent="true"><mml:mi>&#x3c8;</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mo>(</mml:mo><mml:msubsup><mml:mi>r</mml:mi><mml:mi>i</mml:mi><mml:mi>b</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:mn>0</mml:mn><mml:mo>)</mml:mo><mml:mo stretchy="false">]</mml:mo><mml:msup><mml:mo>|</mml:mo><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:math>
</disp-formula>
<disp-formula id="eq17"><label>(17)</label>
<mml:math display="block" id="M17"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>p</mml:mi></mml:msub></mml:mrow></mml:mfrac><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>p</mml:mi></mml:msub></mml:mrow></mml:munderover><mml:mo>|</mml:mo><mml:msub><mml:mi>N</mml:mi><mml:mi>&#x3c8;</mml:mi></mml:msub><mml:mo stretchy="false">[</mml:mo><mml:mover accent="true"><mml:mi>&#x3c8;</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mo>(</mml:mo><mml:msubsup><mml:mi>r</mml:mi><mml:mi>i</mml:mi><mml:mi>p</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mi>z</mml:mi><mml:mi>i</mml:mi><mml:mi>p</mml:mi></mml:msubsup><mml:mo>)</mml:mo><mml:mo stretchy="false">]</mml:mo><mml:msup><mml:mo>|</mml:mo><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im46"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>m</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the number of sampling points of the exact solution data, and <inline-formula>
<mml:math display="inline" id="im47"><mml:mrow><mml:msubsup><mml:mrow><mml:mo>{</mml:mo><mml:msubsup><mml:mi>r</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mi>z</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi></mml:msubsup><mml:mo>}</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>m</mml:mi></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula> is the set <inline-formula>
<mml:math display="inline" id="im48"><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> of coordinate values of its input network. <inline-formula>
<mml:math display="inline" id="im49"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>b</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the number of equally spaced sampling points at the soft boundary of the sea surface, and <inline-formula>
<mml:math display="inline" id="im50"><mml:mrow><mml:msubsup><mml:mrow><mml:mo>{</mml:mo><mml:msubsup><mml:mi>r</mml:mi><mml:mi>i</mml:mi><mml:mi>b</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:mn>0</mml:mn><mml:mo>}</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>b</mml:mi></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula> is the set <inline-formula>
<mml:math display="inline" id="im51"><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mn>0</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> of coordinate values of its input network. <inline-formula>
<mml:math display="inline" id="im52"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>p</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the number of random sampling points inside the computational domain, and <inline-formula>
<mml:math display="inline" id="im53"><mml:mrow><mml:msubsup><mml:mrow><mml:mo>{</mml:mo><mml:msubsup><mml:mi>r</mml:mi><mml:mi>i</mml:mi><mml:mi>p</mml:mi></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mi>z</mml:mi><mml:mi>i</mml:mi><mml:mi>p</mml:mi></mml:msubsup><mml:mo>}</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>p</mml:mi></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula> is the set <inline-formula>
<mml:math display="inline" id="im54"><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> of coordinate values of its input network. <inline-formula>
<mml:math display="inline" id="im55"><mml:mrow><mml:msub><mml:mi>B</mml:mi><mml:mi>&#x3c8;</mml:mi></mml:msub><mml:mo stretchy="false">[</mml:mo><mml:mo>&#xb7;</mml:mo><mml:mo stretchy="false">]</mml:mo></mml:mrow></mml:math></inline-formula> and <inline-formula>
<mml:math display="inline" id="im56"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>&#x3c8;</mml:mi></mml:msub><mml:mo stretchy="false">[</mml:mo><mml:mo>&#xb7;</mml:mo><mml:mo stretchy="false">]</mml:mo></mml:mrow></mml:math></inline-formula> denote the differential operators for the boundary and inside the computational domain for the envelope function <inline-formula>
<mml:math display="inline" id="im57"><mml:mrow><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>, respectively, and the specifics can be expressed by <xref ref-type="disp-formula" rid="eq18">Equations 18</xref>&#x2013;<xref ref-type="disp-formula" rid="eq20">20</xref>:</p>
<disp-formula id="eq18"><label>(18)</label>
<mml:math display="block" id="M18"><mml:mrow><mml:msub><mml:mi>B</mml:mi><mml:mi>&#x3c8;</mml:mi></mml:msub><mml:mo stretchy="false">[</mml:mo><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mn>0</mml:mn><mml:mo stretchy="false">)</mml:mo><mml:mo stretchy="false">]</mml:mo><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:math>
</disp-formula>
<disp-formula id="eq19"><label>(19)</label>
<mml:math display="block" id="M19"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>&#x3c8;</mml:mi></mml:msub><mml:mo stretchy="false">[</mml:mo><mml:msub><mml:mi>&#x3c8;</mml:mi><mml:mrow><mml:mtext>real</mml:mtext></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo stretchy="false">]</mml:mo><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>r</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mn>2</mml:mn><mml:mi>i</mml:mi><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>z</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:msubsup><mml:mi>k</mml:mi><mml:mn>0</mml:mn><mml:mn>2</mml:mn></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msup><mml:mi>n</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>&#x2212;</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo><mml:mi>&#x3c8;</mml:mi></mml:mrow></mml:math>
</disp-formula>
<disp-formula id="eq20"><label>(20)</label>
<mml:math display="block" id="M20"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>&#x3c8;</mml:mi></mml:msub><mml:mo stretchy="false">[</mml:mo><mml:msub><mml:mi>&#x3c8;</mml:mi><mml:mrow><mml:mtext>imag</mml:mtext></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo stretchy="false">]</mml:mo><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>r</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>&#x2212;</mml:mo><mml:mn>2</mml:mn><mml:mi>i</mml:mi><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>r</mml:mi></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:mfrac><mml:mrow><mml:msup><mml:mo>&#x2202;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mi>&#x3c8;</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msup><mml:mi>z</mml:mi><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac><mml:mo>+</mml:mo><mml:msubsup><mml:mi>k</mml:mi><mml:mn>0</mml:mn><mml:mn>2</mml:mn></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msup><mml:mi>n</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>&#x2212;</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo><mml:mi>&#x3c8;</mml:mi></mml:mrow></mml:math>
</disp-formula>
<p>When <inline-formula>
<mml:math display="inline" id="im58"><mml:mrow><mml:mi>L</mml:mi><mml:mi>o</mml:mi><mml:mi>s</mml:mi><mml:msub><mml:mi>s</mml:mi><mml:mrow><mml:mi>T</mml:mi><mml:mi>o</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is less than the critical condition value <inline-formula>
<mml:math display="inline" id="im59"><mml:mi>&#x2208;</mml:mi></mml:math></inline-formula> set in advance or when the number of training rounds Epoch reaches the maximum value set in advance, the training is stopped, and the model parameters are saved; otherwise, backpropagation (BP) is continued, and the model parameters are updated.</p>
<p>When using the trained model for sound field prediction, the parameters of the model are loaded, and the range <inline-formula>
<mml:math display="inline" id="im60"><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> of the test set is set reasonably; the real and imaginary parts <inline-formula>
<mml:math display="inline" id="im61"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>&#x3c8;</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mrow><mml:mtext>real</mml:mtext></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> and <inline-formula>
<mml:math display="inline" id="im62"><mml:mrow><mml:msub><mml:mover accent="true"><mml:mi>&#x3c8;</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mrow><mml:mi>i</mml:mi><mml:mi>m</mml:mi><mml:mi>a</mml:mi><mml:mi>g</mml:mi></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> respectively, of the envelope function of the test set in range <inline-formula>
<mml:math display="inline" id="im63"><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> are obtained by model prediction and synthesized to obtain the envelope function, which is then converted to obtain the sound pressure <inline-formula>
<mml:math display="inline" id="im64"><mml:mrow><mml:mover accent="true"><mml:mi>&#x3c8;</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> by <xref ref-type="disp-formula" rid="eq21">Equation 21</xref> and plotted by <xref ref-type="disp-formula" rid="eq22">Equation 22</xref> for the one-dimensional (1D) and 2D transmission loss (TL) to validate the accuracy of the method and the effectiveness of the prediction. TL is compared with the numerical solutions calculated by KRAKEN to verify the accuracy of the method and the validity of the forecast.</p>
<disp-formula id="eq21"><label>(21)</label>
<mml:math display="block" id="M21"><mml:mrow><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mover accent="true"><mml:mi>&#x3c8;</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math>
</disp-formula>
<disp-formula id="eq22"><label>(22)</label>
<mml:math display="block" id="M22"><mml:mrow><mml:mtext>TL</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mo>&#x2212;</mml:mo><mml:mn>20</mml:mn><mml:mtext>&#xa0;log&#xa0;</mml:mtext><mml:mo>|</mml:mo><mml:mover accent="true"><mml:mi>p</mml:mi><mml:mo>&#x2dc;</mml:mo></mml:mover><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>|</mml:mo></mml:mrow></mml:math>
</disp-formula>
</sec>
</sec>
<sec id="s3">
<label>3</label>
<title>Research content and analysis</title>
<sec id="s3_1">
<label>3.1</label>
<title>Isovelocity waveguide with constant velocity of sound in the water column</title>
<p>For the water body sound velocity invariant isovelocity waveguide, we take a kind of Pekeris shallow sea waveguide environment with sedimentary layer added as an example and set the water depth as 100 m, the seafloor as an acoustic semi-infinite space covered with a layer of 20-m-thick sedimentary layer, the sound velocity profile as isoacoustic velocity invariant, the depth of the source as 25 m, and the frequency as 100 Hz. Specific environment parameter information is shown in <xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref>.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Environmental parameters of the Pekeris shallow water waveguide added to the sediment layer.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g005.tif">
<alt-text content-type="machine-generated">Graph depicting sound speed versus depth. The depth range is zero to one hundred meters. Two zones are highlighted: a layer from eighty to one hundred meters with properties &#x3c1;&#x2081; = 1.7 g/cm&#xb3;, &#x3b1;&#x2081; = 0.2 dB/&#x3bb;, C&#x2081; = 1600 m/s, &#x394;H = 20.0 m, and a half-space below one hundred meters with &#x3c1;&#x221e; = 2.0 g/cm&#xb3;, &#x3b1;&#x221e; = 0.2 dB/&#x3bb;, C&#x221e; = 2000 m/s.</alt-text>
</graphic></fig>
<p>The specific parameters are shown in <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>. The receiver depth range is determined based on the acoustic stratification characteristics of shallow-sea water, avoiding interference from bubble scattering near the sea surface (z &lt; 10 m) and strong absorption by sediments at the seabed (z &gt; 90 m). Meanwhile, three key depths (25, 50, and 75 m) are selected: 25 m is in the surface layer, slightly affected by sea surface reflection; 50 m is in the middle layer, where propagation is stable with little modal interference; 75 m is in the bottom layer, slightly affected by reflection from seabed sediments. These depths are used to comprehensively verify the model&#x2019;s performance in different propagation environments.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Experimental parameter description table.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Parameter category</th>
<th valign="middle" align="center">Parameter name</th>
<th valign="middle" align="center">Value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="2" align="center">Source parameters</td>
<td valign="middle" align="center">Source depth</td>
<td valign="middle" align="center">25 m</td>
</tr>
<tr>
<td valign="middle" align="center">Source frequency</td>
<td valign="middle" align="center">100 Hz</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">Receiver parameters</td>
<td valign="middle" align="center">Receiver depth range</td>
<td valign="middle" align="center">10&#x2013;90 m</td>
</tr>
<tr>
<td valign="middle" align="center">Key receiver depths</td>
<td valign="middle" align="center">25, 50, 75 m</td>
</tr>
<tr>
<td valign="middle" align="center">Spatial range</td>
<td valign="middle" align="center">Propagation distance range</td>
<td valign="middle" align="center">1,000&#x2013;9,000 m</td>
</tr>
<tr>
<td valign="middle" align="center">Environmental parameters</td>
<td valign="middle" align="center">Seabed sediment thickness</td>
<td valign="middle" align="center">20 m</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Firstly, using the KRAKEN software, the environment (env) file is set reasonably, and the phase velocity range is set to 0&#x2013;5,000 m/s. A total of 15-order modes are excited for the synthesis of the sound field, and the horizontal wavenumbers <inline-formula>
<mml:math display="inline" id="im65"><mml:mrow><mml:msub><mml:mi>k</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> and mode functions <inline-formula>
<mml:math display="inline" id="im66"><mml:mrow><mml:msub><mml:mtext>&#x3a8;</mml:mtext><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> are shown in <xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6a&#x2013;c</bold></xref>.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Pekeris waveguide for synthesis of sound field with horizontal wavenumber <inline-formula>
<mml:math display="inline" id="im67"><mml:mrow><mml:msub><mml:mi>k</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> and modal function <inline-formula>
<mml:math display="inline" id="im68"><mml:mrow><mml:msub><mml:mtext>&#x3a8;</mml:mtext><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>. <bold>(a)</bold> Scatterplot of real and imaginary parts of horizontal wavenumber <inline-formula>
<mml:math display="inline" id="im69"><mml:mrow><mml:msub><mml:mi>k</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>. <bold>(b)</bold> Pseudo-color map of modal function <inline-formula>
<mml:math display="inline" id="im70"><mml:mrow><mml:msub><mml:mtext>&#x3a8;</mml:mtext><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> (real part). <bold>(c)</bold> Plot of the real and imaginary parts of the modal function <inline-formula>
<mml:math display="inline" id="im71"><mml:mrow><mml:msub><mml:mtext>&#x3a8;</mml:mtext><mml:mi>m</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g006.tif">
<alt-text content-type="machine-generated">Three visualizations of KRAKEN-Pekeris at 100 Hz: (a) Scatter plot showing Imaginary k vs. Real k with points along a curve. (b) Colorful heatmap depicting Depth vs. Mode index with a range of vivid colors. (c) Series of plots showing depth variations for modes one to fifteen, each with distinct wave patterns.</alt-text>
</graphic></fig>
<p>Since <xref ref-type="disp-formula" rid="eq8">Equation 8</xref> adopts the far-field approximation <inline-formula>
<mml:math display="inline" id="im72"><mml:mrow><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo>&#x226b;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></inline-formula> and combines with the actual sound field forecasting application requirements, a part of the receiving points are set to calculate the exact solution as the labeled data to be used for data driving. By setting the field (flp) file, set the receiving area <italic>r</italic> range of 2,000&#x2013;8,000 m, every interval of 10 m to take a point, a total number of points <inline-formula>
<mml:math display="inline" id="im73"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>r</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> = 601. <italic>Z</italic> range is 10&#x2013;90 m, every interval of 10 m to take a point, with a total number of points <inline-formula>
<mml:math display="inline" id="im74"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>Z</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> = 9. The total number of sampling points nr * nz of the exact solution data is 5,409. The generated sound pressure <inline-formula>
<mml:math display="inline" id="im75"><mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> is transformed into an envelope function through <xref ref-type="disp-formula" rid="eq23">Equation 23</xref>; the total number of sampling points <inline-formula>
<mml:math display="inline" id="im76"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>r</mml:mi></mml:msub><mml:mo>*</mml:mo><mml:msub><mml:mi>N</mml:mi><mml:mi>z</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is 5,409. The generated sound pressure data <inline-formula>
<mml:math display="inline" id="im77"><mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> are transformed into the envelope function <inline-formula>
<mml:math display="inline" id="im78"><mml:mrow><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>:</p>
<disp-formula id="eq23"><label>(23)</label>
<mml:math display="block" id="M23"><mml:mrow><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo stretchy="false">/</mml:mo><mml:msubsup><mml:mi>H</mml:mi><mml:mn>0</mml:mn><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>k</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mi>r</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math>
</disp-formula>
<p>This equation is obtained by reasoning from <xref ref-type="disp-formula" rid="eq6">Equation 6</xref>. The envelope function <inline-formula>
<mml:math display="inline" id="im79"><mml:mrow><mml:mi>&#x3c8;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> is then split into real part <inline-formula>
<mml:math display="inline" id="im80"><mml:mrow><mml:msub><mml:mi>&#x3c8;</mml:mi><mml:mrow><mml:mtext>real</mml:mtext></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> and imaginary part <inline-formula>
<mml:math display="inline" id="im81"><mml:mrow><mml:msub><mml:mi>&#x3c8;</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>m</mml:mi><mml:mi>a</mml:mi><mml:mi>g</mml:mi></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> to be used as input for the training set of the neural network.</p>
<p>According to the description of PINN training in Section 2.3, the sampling area inside the computational domain is set in the range of 1,000&#x2013;9,000 m for <italic>r</italic> and 0.1&#x2013;100 m for <italic>z</italic>. Considering the complexity of the problem, the GPU memory size limitation, the length of the training model, and the accuracy requirement, the number of random sampling points inside the computational domain is set to be <inline-formula>
<mml:math display="inline" id="im82"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>p</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> = 5,000. The sampling area <italic>r</italic> was set to range from 1,000 to 9,000 m at the soft boundary of the sea surface, <italic>z</italic> was set to 0 m, and the number of equally spaced sampling points was set to <inline-formula>
<mml:math display="inline" id="im83"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>b</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> = 200.</p>
<p>According to the findings of <xref ref-type="bibr" rid="B4">Du et&#xa0;al. (2023)</xref>, it can be seen that the weight settings of the three loss function sources have a significant impact on whether the model training is successful or not, and we are guided by their findings to set the weights of the loss function as <inline-formula>
<mml:math display="inline" id="im84"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi></mml:mrow></mml:msub><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:mn>1</mml:mn><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></inline-formula>.</p>
<p>The experimental training is run on Aurora supercomputing server nodes with four NVIDIA Tesla V100 32GB graphics cards. The deep learning framework and version used is TensorFlow 2.5, and the optimizer used is Adam with a learning rate of 0.001. The number of hidden layers, L = 5, is used with a fully connected layer, and the number of neurons in each layer, <inline-formula>
<mml:math display="inline" id="im85"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>k</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> = 100.</p>
<p>During the test, the random sampling area <italic>r</italic> is set to range from 1,000 to 9,000 m, and <italic>z</italic> is set to range from 0 to 100 m. By setting the field (flp) file in advance, the results calculated by KRAKEN in the same area are obtained for comparison to verify the accuracy of the method and the effectiveness of the prediction.</p>
<p>When the number of training rounds is 12,000, the model is saved, and a forecast is made, as shown in <xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref>, plotting the PINN forecast against the KRAKEN numerically calculated 2D transmission loss.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Epoch = 12,000, &#x3bb;<italic><sub>Mass</sub></italic>:&#x3bb;<italic><sub>BC</sub></italic>:&#x3bb;<italic><sub>PDE</sub></italic> = 1:1:1, PINN <italic>vs</italic>. KRAKEN 2D transmission loss pseudo-color maps with errors. <bold>(a)</bold> PINN forecast result. <bold>(b)</bold> KRAKEN calculation result. <bold>(c)</bold> Error between the two results. PINN, physics-informed neural network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g007.tif">
<alt-text content-type="machine-generated">Three side-by-side heatmaps illustrate transmission loss and error. The first panel shows Transmission Loss (PINN) with data ranging from zero to eighty. The second panel displays Transmission Loss (kraken) with a similar range. The third panel compares the Error of Transmission Loss, ranging from zero to ten, showing variations across depth and range using a color scale from blue to red. Each graph includes depth in meters on the y-axis and range in meters on the x-axis, marked with color bars indicating intensity levels.</alt-text>
</graphic></fig>
<p>It can be concluded that regions with a small number of accurate solutions, as labeled data, are forecasted with higher accuracy, and most of the regional forecasts are basically comparable to the accuracy of the KRAKEN numerical solutions with an error of 0 dB (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7c</bold></xref>, red part). In contrast, simply relying only on purely physical drive, in the internal and boundary random sampling point region, can only roughly reflect the trend of the transmission loss; the accuracy of the error is larger, and it is only suitable for use when the accuracy requirements are not high. It also quantitatively proves the reasonableness of the design of the network structure of this paper in Section 2.3. Relying solely on the physical process for extrapolation is less effective, while the accuracy of the forecast results is significantly improved after adding the data-driven process, which shows the importance of relying on high-quality labeled data for the data-driven deep learning of the complex ocean dynamics process.</p>
<p>Setting the reception depth to 25, 50, and 75 m plots the PINN prediction against the 1D transmission loss calculated from KRAKEN values, as shown in <xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8</bold></xref>.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Epoch = 12,000, &#x3bb;<italic><sub>Mass</sub></italic>:&#x3bb;<italic><sub>BC</sub></italic>:&#x3bb;<italic><sub>PDE</sub></italic> = 1:1:1, PINN <italic>vs</italic>. KRAKEN 1D transmission loss. <bold>(a)</bold> Comparison of 1D transmission loss at a reception depth of 25 m. <bold>(b)</bold> Comparison of 1D transmission loss at a reception depth of 50 m. <bold>(c)</bold> Comparison of 1D transmission loss at a reception depth of 75 m. PINN, physics-informed neural network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g008.tif">
<alt-text content-type="machine-generated">Three line graphs compare transmission loss at depths of twenty-five, fifty, and seventy-five meters. Each graph plots the range in meters on the x-axis against transmission loss in decibels on the y-axis. The red dashed line represents &#x201c;PINN,&#x201d; and the black solid line represents &#x201c;kraken.&#x201d; Patterns show variations in alignment and divergence at different ranges and depths.</alt-text>
</graphic></fig>
<p>According to the results, it can be seen that PINN has poor learning ability for some extreme points, but good learning ability for some slow-change regions. Since the transmission loss curve at 50 m is smoother than that at 25 and 75 m, and the variation is smaller, PINN learns well, and basically agrees with the results of KRAKEN&#x2019;s calculation in the range of 2,000&#x2013;8,000 m except for some extreme points.</p>
<p>Based on the results, we believe that the poor results may be due to model underfitting, so we grow the number of training rounds to 50,000, with other conditions remaining unchanged, and again compare the 1D and 2D transmission loss.</p>
<p>At this point, the model is saved, and a forecast is made, as shown in <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref>, plotting the PINN forecast against the KRAKEN numerically calculated 2D transmission loss.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>Epoch = 50,000, &#x3bb;<italic><sub>Mass</sub></italic>:&#x3bb;<italic><sub>BC</sub></italic>:&#x3bb;<italic><sub>PDE</sub></italic> = 1:1:1, PINN <italic>vs</italic>. KRAKEN 2D transmission loss pseudo-color maps with errors. <bold>(a)</bold> PINN forecast result. <bold>(b)</bold> KRAKEN calculation result. <bold>(c)</bold> Error between the two results. PINN, physics-informed neural network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g009.tif">
<alt-text content-type="machine-generated">Three heatmap graphs illustrating transmission loss in water over depth and range, each with a color scale. The first graph (a) shows data using the PINN method; the second (b) uses the kraken method. The third graph (c) displays the error between the two methods, highlighting differences.</alt-text>
</graphic></fig>
<p>As can be seen from <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9c</bold></xref>, compared to <xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7c</bold></xref>, the sound field prediction is significantly better, especially at the region where the accurate unlabeled data are not driven, and simply driven by physics alone, it can be seen that when the number of training times is not enough, the model will be underfitted, and it is difficult to predict the accurate results at the prediction place, which puts a higher demand on the computing power of the GPU.</p>
<p>Setting the reception depth to 25, 50, and 75 m plots the PINN prediction against the 1D transmission loss calculated numerically by KRAKEN, as shown in <xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref>.</p>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>Epoch = 50,000, &#x3bb;<italic><sub>Mass</sub></italic>:&#x3bb;<italic><sub>BC</sub></italic>:&#x3bb;<italic><sub>PDE</sub></italic> = 1:1:1, PINN <italic>vs</italic>. KRAKEN 1D transmission loss. <bold>(a)</bold> Comparison of 1D transmission loss at a reception depth of 25 m. <bold>(b)</bold> Comparison of 1D transmission loss at a reception depth of 50 m. <bold>(c)</bold> Comparison of 1D transmission loss at a reception depth of 75 m. PINN, physics-informed neural network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g010.tif">
<alt-text content-type="machine-generated">Three line graphs compare TL in decibels at depths of twenty-five, fifty, and seventy-five meters over a range of one thousand to nine thousand meters. The red dashed line represents the PINN model, and the black solid line represents the Kraken model. The graphs show significant variations in transmission loss across different depths, with distinctive dips and peaks in each model's data.</alt-text>
</graphic></fig>
<p>As can be seen from <xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref>, compared with <xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8</bold></xref>, the prediction effect of the acoustic field is obviously better; especially at the ranges of 1,000&#x2013;2,000 and 8,000&#x2013;9,000 m, the error is obviously reduced, and the prediction accuracy is higher. However, for some extreme points, the model prediction effect is still poor, and it is necessary to gradually adjust the hyperparameters to train a better model to improve the prediction accuracy.</p>
<p>Next, a quantitative error analysis of the 1D transmission loss in <xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref> is performed to better analyze the experimental results, as shown in <xref ref-type="fig" rid="f11"><bold>Figure&#xa0;11</bold></xref>.</p>
<fig id="f11" position="float">
<label>Figure&#xa0;11</label>
<caption>
<p>Epoch = 50,000, &#x3bb;<italic><sub>Mass</sub></italic>:&#x3bb;<italic><sub>BC</sub></italic>:&#x3bb;<italic><sub>PDE</sub></italic> = 1:1:1, PINN <italic>vs</italic>. KRAKEN 1D transmission loss error analysis. <bold>(a)</bold> 1D transmission loss error at a reception depth of 25 m. <bold>(b)</bold> 1D transmission loss error at a reception depth of 50 m. <bold>(c)</bold> 1D transmission loss error at a reception depth of 75 m. PINN, physics-informed neural network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g011.tif">
<alt-text content-type="machine-generated">Three line graphs showing error of transmission loss in decibels versus range in meters. The graphs represent depths of twenty-five, fifty, and seventy-five meters. Erratic fluctuations are visible across different ranges, with peaks and troughs varying in each graph.</alt-text>
</graphic></fig>
<p>The 1D transmission loss error analysis in <xref ref-type="fig" rid="f11"><bold>Figure&#xa0;11</bold></xref> is able to analyze the model&#x2019;s forecasting effect, and the combined analysis with <xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref> shows that the forecast deviation is larger at some extreme points, which is caused by the neural network&#x2019;s difficulty in learning for the extreme points, but these extreme points account for a small proportion of the entire range of <italic>r</italic>. Combined with the needs of the practical application, the transmission loss gap at the vast majority of <italic>r</italic> is small, and the small undulation is carried out around the 0dB up and down fluctuations, proving the effectiveness of the model, which can be used for sound field prediction.</p>
<p>In the actual training process, we found that the size of <inline-formula>
<mml:math display="inline" id="im86"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is always about two orders of magnitude smaller than <inline-formula>
<mml:math display="inline" id="im87"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula>
<mml:math display="inline" id="im88"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>, so when synthesizing the total loss function <inline-formula>
<mml:math display="inline" id="im89"><mml:mrow><mml:mi>L</mml:mi><mml:mi>o</mml:mi><mml:mi>s</mml:mi><mml:msub><mml:mi>s</mml:mi><mml:mrow><mml:mi>T</mml:mi><mml:mi>o</mml:mi><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> in <xref ref-type="disp-formula" rid="eq14">Equation 14</xref>, the <inline-formula>
<mml:math display="inline" id="im90"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is easily overwhelmed by the other two terms because it is too small to be of much use. Therefore, we try to set the ratio of the three loss functions to <inline-formula>
<mml:math display="inline" id="im91"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi><mml:mo>&#xa0;</mml:mo></mml:mrow></mml:msub><mml:mo>:</mml:mo><mml:mo>&#xa0;</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:mn>1</mml:mn><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:mn>100</mml:mn></mml:mrow></mml:math></inline-formula>. Other parameters remain unchanged and still train 50,000 times. The model is saved, and a forecast is made, as shown in <xref ref-type="fig" rid="f12"><bold>Figure&#xa0;12</bold></xref>, plotting the PINN forecast against the KRAKEN numerically calculated 2D transmission loss.</p>
<fig id="f12" position="float">
<label>Figure&#xa0;12</label>
<caption>
<p>Epoch = 50,000, &#x3bb;<italic><sub>Mass</sub></italic>:&#x3bb;<italic><sub>BC</sub></italic>:&#x3bb;<italic><sub>PDE</sub></italic> = 1:1:100, PINN <italic>vs</italic>. KRAKEN 2D transmission loss pseudo-color maps with errors. <bold>(a)</bold> PINN forecast result. <bold>(b)</bold> KRAKEN calculation result. <bold>(c)</bold> Error between the two results. PINN, physics-informed neural network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g012.tif">
<alt-text content-type="machine-generated">Three heatmaps comparing transmission loss and error over depth and range. Left: Transmission Loss (PINN) with values from fifty to eighty. Middle: Transmission Loss (Kraken) with similar range. Right: Error of Transmission Loss showing values from zero to ten. Each axis labeled with depth in meters and range in meters.</alt-text>
</graphic></fig>
<p>As can be seen from <xref ref-type="fig" rid="f12"><bold>Figure&#xa0;12c</bold></xref>, compared to <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9c</bold></xref>, the sound field prediction becomes significantly better, especially at the region where no accurate unlabeled data drive is performed, and the region is simply driven by the physical drive alone, which can be seen that when adjusting the ratio between the three loss functions, the role of the <inline-formula>
<mml:math display="inline" id="im92"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is more clearly demonstrated, and the training of the internal random sampling points is more effective.</p>
<p>Setting the reception depth to 25, 50, and 75 m plots the PINN prediction against the 1D transmission loss calculated numerically by KRAKEN, as shown in <xref ref-type="fig" rid="f13"><bold>Figure&#xa0;13</bold></xref>.</p>
<fig id="f13" position="float">
<label>Figure&#xa0;13</label>
<caption>
<p>Epoch = 50,000, &#x3bb;<italic><sub>Mass</sub></italic>:&#x3bb;<italic><sub>BC</sub></italic>:&#x3bb;<italic><sub>PDE</sub></italic> = 1:1:100, PINN <italic>vs</italic>. KRAKEN 1D transmission loss. <bold>(a)</bold> Comparison of 1D transmission loss at a reception depth of 25 m. <bold>(b)</bold> Comparison of 1D transmission loss at a reception depth of 50 m. <bold>(c)</bold> Comparison of 1D transmission loss at a reception depth of 75 m. PINN, physics-informed neural network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g013.tif">
<alt-text content-type="machine-generated">Three line graphs compare transmission loss (TL) in decibels over range in meters at depths of 25, 50, and 75 meters. Each graph contrasts data sets labeled as &#x201c;PINN&#x201d; with a red dashed line and &#x201c;kraken&#x201d; with a solid black line, showing similar patterns across different ranges.</alt-text>
</graphic></fig>
<p>As can be seen from <xref ref-type="fig" rid="f13"><bold>Figure&#xa0;13</bold></xref>, compared with <xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref>, the prediction effect of the acoustic field is obviously better; especially in <italic>r</italic> ranges of 1,000&#x2013;2,000 and 8,000&#x2013;9,000 m, the error is obviously reduced, and the prediction accuracy is higher. However, for some extreme points, the model prediction effect is still poor, and it is necessary to gradually adjust each hyperparameter to train a better model to improve the prediction accuracy.</p>
<p>The variation of errors with propagation distance follows the acoustic propagation law of &#x201c;near-field mode excitation&#x2013;mid-field stable propagation&#x2013;far-field energy attenuation&#x201d; and forms a cross-influence with errors in the depth dimension:</p>
<p>1. Near field (1,000&#x2013;2,000 m): incomplete mode excitation and dynamics signal adjustment.</p>
<p>The near field is the excitation stage of normal modes, where the number of modes gradually increases from partial excitation to the full order (15 orders), and the signal fluctuation law changes continuously. However, PINN training relies on mid-field stable mode data, and its generalization ability for near-field dynamics signals is insufficient. Meanwhile, multipath interference in the near field is stronger, further amplifying the error.</p>
<p>2. Mid field (2,000&#x2013;8,000 m): stable modes and gentle attenuation, minimum error.</p>
<p>The mid-field is the stable propagation stage of normal modes. All 15 orders of modes are excited with fixed energy proportions, and sound waves propagate in the form of stable modal superposition. Energy attenuation only follows the spherical wave law, with a gentle rate and stable signal-to-noise ratio (SNR). This stable physical process is fully compatible with the learning characteristics of PINN, so the error at all depths in this interval is the smallest.</p>
<p>3. Far field (8,000&#x2013;9,000 m): cumulative energy attenuation and difficulty in capturing weak signals.</p>
<p>The far field is the energy attenuation stage of normal modes. In addition to spherical wave attenuation, the volume absorption effect of seawater emerges, causing the signal SNR to decrease significantly, below the threshold for effective fitting by PINN. Meanwhile, the energy proportion of high-order modes drops sharply, reducing the &#x201c;modal diversity&#x201d; of the signal. PINN is prone to the problem of gentle gradients when fitting weak signals + low-frequency fluctuations, leading to a slight increase in error.</p>
<p>Next, a quantitative error analysis of the 1D transmission loss in <xref ref-type="fig" rid="f13"><bold>Figure&#xa0;13</bold></xref> is performed to better analyze the experimental results, as shown in <xref ref-type="fig" rid="f14"><bold>Figure&#xa0;14</bold></xref>.</p>
<fig id="f14" position="float">
<label>Figure&#xa0;14</label>
<caption>
<p>Epoch = 50,000, &#x3bb;<italic><sub>Mass</sub></italic>:&#x3bb;<italic><sub>BC</sub></italic>:&#x3bb;<italic><sub>PDE</sub></italic> = 1:1:100, PINN <italic>vs</italic>. KRAKEN 1D transmission loss error analysis. <bold>(a)</bold> 1D transmission loss error at a reception depth of 25 m. <bold>(b)</bold> 1D transmission loss error at a reception depth of 50 m. <bold>(c)</bold> 1D transmission loss error at a reception depth of 75 m. PINN, physics-informed neural network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1665305-g014.tif">
<alt-text content-type="machine-generated">Three line graphs display the error of transmission loss in decibels (dB) versus range in meters (m) at depths of 25m, 50m, and 75m. Each graph shows fluctuations in error values, with more pronounced peaks and troughs as the range increases. All graphs span a range from 1000m to 9000m, with error values between -20dB and 20dB.</alt-text>
</graphic></fig>
<p>The 1D transmission loss error analysis in <xref ref-type="fig" rid="f14"><bold>Figure&#xa0;14</bold></xref> is able to analyze the forecasting effect of the model, and the combination of the analysis with <xref ref-type="fig" rid="f13"><bold>Figure&#xa0;13</bold></xref> shows that the forecast deviation is larger at some extreme points, which is caused by the difficulty of the neural network to learn the extreme points, but these extreme points account for a small percentage in the whole range, and in combination with the practical application requirements, the transmission loss gap at the vast majority of the points is small, and small ups and downs are carried out around 0-dB fluctuations, proving the effectiveness of the model, which can be used for sound field prediction.</p>
<p>To intuitively quantify the prediction accuracy of PINN, under the experimental conditions of Epoch = 50 000 and loss weight ratio <inline-formula>
<mml:math display="inline" id="im93"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi><mml:mo>&#xa0;</mml:mo></mml:mrow></mml:msub><mml:mo>:</mml:mo><mml:mo>&#xa0;</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi><mml:mo>&#xa0;</mml:mo></mml:mrow></mml:msub><mml:mo>:</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:mn>1</mml:mn><mml:mo>:</mml:mo><mml:mn>100</mml:mn></mml:mrow></mml:math></inline-formula>, four core indicators are selected: RMSE, mean absolute error (MAE), mean relative error (MRE), and correlation coefficient (R). These indicators are used to compare the predicted values of PINN with the numerical solutions (ground truth) of KRAKEN. The following sections first clarify the definition and calculation formulas of each indicator, then present quantitative results in <xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>, and finally analyze the significance of the indicators.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Quantitative error results from training epoch.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Training epoch</th>
<th valign="middle" align="center">Receiver depth</th>
<th valign="middle" align="center">RMSE (dB)</th>
<th valign="middle" align="center">MAE (dB)</th>
<th valign="middle" align="center">MRE (%)</th>
<th valign="middle" align="center">Correlation coefficient (R)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="4" align="left">12,000</td>
<td valign="middle" align="center">25 m</td>
<td valign="middle" align="center">2.8</td>
<td valign="middle" align="center">2.1</td>
<td valign="middle" align="center">7.2</td>
<td valign="middle" align="center">0.86</td>
</tr>
<tr>
<td valign="middle" align="center">50 m</td>
<td valign="middle" align="center">1.3</td>
<td valign="middle" align="center">0.9</td>
<td valign="middle" align="center">3.5</td>
<td valign="middle" align="center">0.94</td>
</tr>
<tr>
<td valign="middle" align="center">75 m</td>
<td valign="middle" align="center">2.5</td>
<td valign="middle" align="center">1.9</td>
<td valign="middle" align="center">6.0</td>
<td valign="middle" align="center">0.88</td>
</tr>
<tr>
<td valign="middle" align="center">Full-depth average</td>
<td valign="middle" align="center">2.2</td>
<td valign="middle" align="center">1.7</td>
<td valign="middle" align="center">5.6</td>
<td valign="middle" align="center">0.90</td>
</tr>
<tr>
<td valign="middle" rowspan="4" align="left">50,000</td>
<td valign="middle" align="center">25 m</td>
<td valign="middle" align="center">1.6</td>
<td valign="middle" align="center">1.2</td>
<td valign="middle" align="center">4.0</td>
<td valign="middle" align="center">0.93</td>
</tr>
<tr>
<td valign="middle" align="center">50 m</td>
<td valign="middle" align="center">0.7</td>
<td valign="middle" align="center">0.5</td>
<td valign="middle" align="center">2.0</td>
<td valign="middle" align="center">0.98</td>
</tr>
<tr>
<td valign="middle" align="center">75 m</td>
<td valign="middle" align="center">1.4</td>
<td valign="middle" align="center">1.0</td>
<td valign="middle" align="center">3.5</td>
<td valign="middle" align="center">0.95</td>
</tr>
<tr>
<td valign="middle" align="center">Full-depth average</td>
<td valign="middle" align="center">1.2</td>
<td valign="middle" align="center">0.9</td>
<td valign="middle" align="center">3.2</td>
<td valign="middle" align="center">0.96</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>RMSE, root mean square error; MAE, mean absolute error; MRE, mean relative error.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>All indicators are calculated based on transmission loss. The sample statistical rules are as follows:</p>
<list list-type="bullet">
<list-item>
<p>Single depth (25/50/75 m): The calculation interval covers the propagation distance from 1,000 to 9,000 m, with a total of 801 sample points, and the sample size N = 801.</p></list-item>
<list-item>
<p>Full-depth average: The average of indicators for nine depths from 10 to 90 m (with an interval of 10 m) is calculated, and the sample size for each depth is 801.</p></list-item>
</list>
<p>The specific calculation formulas are as follows:</p>
<p>&#x2022; RMSE (unit: dB) reflects the overall deviation between predicted values and ground truth; the smaller the value, the higher the accuracy. The calculation formula as shown in <xref ref-type="disp-formula" rid="eq24">Equation 24</xref></p>
<disp-formula id="eq24"><label>(24)</label>
<mml:math display="block" id="M24"><mml:mrow><mml:mi>R</mml:mi><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:msqrt><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>N</mml:mi></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover></mml:mstyle><mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mtext>PINN</mml:mtext><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mtext>KRAKEN&#x2004;</mml:mtext><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:msqrt></mml:mrow></mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im94"><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mtext>PINN</mml:mtext><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the <inline-formula>
<mml:math display="inline" id="im95"><mml:mi>i</mml:mi></mml:math></inline-formula>th transmission loss value predicted by PINN and <inline-formula>
<mml:math display="inline" id="im96"><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mtext>KRAKEN</mml:mtext><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the <italic>i</italic>th ground truth transmission loss calculated by KRAKEN.</p>
<p>&#x2022; MAE (unit: dB) reflects the mean absolute deviation between predicted values and ground truth and has strong resistance to extreme value interference. The calculation formula as shown in <xref ref-type="disp-formula" rid="eq25">Equation 25</xref></p>
<disp-formula id="eq25"><label>(25)</label>
<mml:math display="block" id="M25"><mml:mrow><mml:mi>M</mml:mi><mml:mi>A</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>N</mml:mi></mml:mfrac><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:mo>|</mml:mo><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mtext>PINN</mml:mtext><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mtext>KRAKEN&#x2004;</mml:mtext><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo></mml:mrow></mml:math>
</disp-formula>
<p>&#x2022; MRE (unit: %) reflects the relative proportion of errors (eliminating the influence of TL magnitude), facilitating comparison across depths/distances. The calculation formula as shown in <xref ref-type="disp-formula" rid="eq26">Equation 26</xref></p>
<disp-formula id="eq26"><label>(26)</label>
<mml:math display="block" id="M26"><mml:mrow><mml:mi>M</mml:mi><mml:mi>R</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:mo>(</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>N</mml:mi></mml:mfrac><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:mfrac><mml:mrow><mml:mo>|</mml:mo><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">P</mml:mi><mml:mi mathvariant="normal">I</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">R</mml:mi><mml:mi mathvariant="normal">A</mml:mi><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">E</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">R</mml:mi><mml:mi mathvariant="normal">A</mml:mi><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">E</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac><mml:mo>)</mml:mo><mml:mo>&#xd7;</mml:mo><mml:mn>100</mml:mn></mml:mrow></mml:math>
</disp-formula>
<p>&#x2022; Correlation coefficient (R) reflects the linear correlation between predicted values and ground truth, with a value range of [0, 1]. The closer it is to 1, the better the fitting consistency. The calculation formula as shown in <xref ref-type="disp-formula" rid="eq27">Equation 27</xref></p>
<disp-formula id="eq27"><label>(27)</label>
<mml:math display="block" id="M27"><mml:mrow><mml:mi>R</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:mrow><mml:msubsup><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:msubsup></mml:mrow></mml:mstyle><mml:mo stretchy="false">(</mml:mo><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">P</mml:mi><mml:mi mathvariant="normal">I</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mover accent="true"><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">P</mml:mi><mml:mi mathvariant="normal">I</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">&#xaf;</mml:mo></mml:mover><mml:mo stretchy="false">)</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">R</mml:mi><mml:mi mathvariant="normal">A</mml:mi><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">E</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mover accent="true"><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">R</mml:mi><mml:mi mathvariant="normal">A</mml:mi><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">E</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">&#xaf;</mml:mo></mml:mover><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mrow><mml:msqrt><mml:mrow><mml:mstyle displaystyle="true"><mml:mrow><mml:msubsup><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:msubsup></mml:mrow></mml:mstyle><mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">P</mml:mi><mml:mi mathvariant="normal">I</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mover accent="true"><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">P</mml:mi><mml:mi mathvariant="normal">I</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">&#xaf;</mml:mo></mml:mover><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:msqrt><mml:mo>&#xd7;</mml:mo><mml:msqrt><mml:mrow><mml:mstyle displaystyle="true"><mml:msubsup><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:msubsup></mml:mstyle><mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">R</mml:mi><mml:mi mathvariant="normal">A</mml:mi><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">E</mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mo>,</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mover accent="true"><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">R</mml:mi><mml:mi mathvariant="normal">A</mml:mi><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">K</mml:mi><mml:mi mathvariant="normal">E</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">&#xaf;</mml:mo></mml:mover><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:msqrt></mml:mrow></mml:mfrac></mml:mrow></mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im97"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mtext>PINN</mml:mtext></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">&#xaf;</mml:mo></mml:mover></mml:mrow></mml:math></inline-formula> is the mean value of TL predicted by PINN and <inline-formula>
<mml:math display="inline" id="im98"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mtext>KRAKEN&#x2004;</mml:mtext></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">&#xaf;</mml:mo></mml:mover></mml:mrow></mml:math></inline-formula> is the mean value of TL calculated by KRAKEN.</p>
<p>The variation of errors with depth is essentially the transmission of sea surface/seabed boundary effects to the model fitting results through signal complexity, specifically manifested as follows:</p>
<p>1. Surface layer at 25 m: multipath interference at the sea surface aggravates signal fluctuation.</p>
<p>At a depth of 25 m, close to the sea surface (only 25 m), sound waves form multipath interference of direct waves and sea surface reflected waves due to the sea surface pressure-release boundary. The acoustic pressure signal after interference exhibits a significant increase in fluctuation frequency and extreme point density, reducing its adaptability to the fully connected layers and activation function of PINN. The network is prone to vanishing gradients for high-frequency non-stationary fluctuations, leading to fitting deviations at extreme points, especially in the near-field region. Additionally, the surface water body is affected by potential wind-wave disturbances, resulting in lower signal phase stability than in the middle layer, further amplifying prediction deviations.</p>
<p>2. Middle layer at 50 m: stable propagation without boundary interference.</p>
<p>At a depth of 50 m, located in the middle of the water body and far from both the sea surface (50 m) and the seabed (including a 20-m sediment interface), it is a &#x201c;clean area&#x201d; with minimal boundary interference. The 15th-order normal modes have a uniform energy distribution at this depth, with no obvious modal superposition or cancellation. The acoustic pressure signal fluctuates gently and has a high SNR, fully matching the learning capability of PINN. Therefore, the prediction results at this depth have the highest coincidence with the numerical solution of KRAKEN, and the overall error is the smallest.</p>
<p>3. Bottom layer at 75 m: signal distortion caused by seabed sediments.</p>
<p>At a depth of 75 m, close to the seabed sediment interface (only 25 m), it is significantly affected by the acoustic impedance difference between sediments and water. On the one hand, normal modes (especially high-order ones) undergo modal conversion at the interface, breaking the original energy distribution and causing the signal fluctuation law to deviate from a stable state. On the other hand, sediments have a higher attenuation coefficient, leading to rapid energy loss of sound waves and a decrease in SNR in the far-field region. The combined effect of these two factors increases signal complexity, reducing PINN&#x2019;s fitting accuracy for weak signals and non-stationary fluctuations.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Hyperparameter configuration and sensitivity analysis</title>
<p>The hyperparameter configuration of the model in this study is based on the characteristics of the physical problem, literature references, and verification via the control variable method. The core hyperparameters and their selection principles are as follows:</p>
<list list-type="bullet">
<list-item>
<p>Activation function: The sine function (<inline-formula>
<mml:math display="inline" id="im99"><mml:mrow><mml:mi>&#x3c3;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>x</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mtext>sin&#xa0;</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:mi>x</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>) is selected. Referring to the research conclusions of <xref ref-type="bibr" rid="B26">Song et&#xa0;al. (2022)</xref>, this function exhibits significantly better fitting performance for frequency-domain wavefield PDE problems compared to commonly used functions, such as ReLU and Sigmoid, and can effectively avoid the vanishing gradient problem.</p></list-item>
<list-item>
<p>Optimizer and learning rate: The Adam optimizer (with a learning rate of 0.001) is adopted, which is widely used in deep learning for solving PDE problems (<xref ref-type="bibr" rid="B24">Raissi et&#xa0;al., 2019</xref>). Pre-experiment verification shows that when the learning rate is higher than 0.01, training tends to oscillate and diverge; when the learning rate is lower than 0.0001, the convergence speed is extremely slow (stable error cannot be achieved even after 50,000 iterations).</p></list-item>
<list-item>
<p>Network structure parameters: For the number of hidden layers (<inline-formula>
<mml:math display="inline" id="im100"><mml:mrow><mml:mi>L</mml:mi><mml:mo>=</mml:mo><mml:mn>5</mml:mn></mml:mrow></mml:math></inline-formula>) and the number of neurons per layer (<inline-formula>
<mml:math display="inline" id="im101"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn>100</mml:mn></mml:mrow></mml:math></inline-formula>), combinations of <inline-formula>
<mml:math display="inline" id="im102"><mml:mrow><mml:mi>L</mml:mi><mml:mo>=</mml:mo><mml:mn>3</mml:mn><mml:mo stretchy="false">/</mml:mo><mml:mn>5</mml:mn><mml:mo stretchy="false">/</mml:mo><mml:mn>7</mml:mn></mml:mrow></mml:math></inline-formula> and <inline-formula>
<mml:math display="inline" id="im103"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:mn>50</mml:mn><mml:mo stretchy="false">/</mml:mo><mml:mn>100</mml:mn><mml:mo stretchy="false">/</mml:mo><mml:mn>150</mml:mn></mml:mrow></mml:math></inline-formula> are tested using the control variable method. When <inline-formula>
<mml:math display="inline" id="im104"><mml:mrow><mml:mi>L</mml:mi><mml:mo>&lt;</mml:mo><mml:mn>5</mml:mn></mml:mrow></mml:math></inline-formula>, the model&#x2019;s fitting ability is insufficient; when <inline-formula>
<mml:math display="inline" id="im105"><mml:mrow><mml:mi>L</mml:mi><mml:mo>&gt;</mml:mo><mml:mn>5</mml:mn></mml:mrow></mml:math></inline-formula> or <inline-formula>
<mml:math display="inline" id="im106"><mml:mrow><mml:msub><mml:mi>N</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:mo>&gt;</mml:mo><mml:mn>100</mml:mn></mml:mrow></mml:math></inline-formula>, the model exhibits overfitting. The configuration of five hidden layers with 100 neurons achieves an optimal balance between accuracy and generalization ability.</p></list-item>
<list-item>
<p>Loss function weights: The selection of the core hyperparameter <inline-formula>
<mml:math display="inline" id="im107"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi></mml:mrow></mml:msub><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> needs to balance data fitting and physical constraints, and its sensitivity will be analyzed in detail in the following content.</p></list-item>
</list>
<p>Four groups of comparative experiments are designed (50,000 training epochs) to test the impact of different weight ratios on model performance.</p>
<p>The results are shown in <xref ref-type="table" rid="T3"><bold>Table&#xa0;3</bold></xref>.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Results of loss weight sensitivity analysis.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center"><inline-formula>
<mml:math display="inline" id="im108"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi><mml:mo>&#xa0;</mml:mo></mml:mrow></mml:msub><mml:mo>:</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula></th>
<th valign="middle" align="center">RMSE (dB)</th>
<th valign="middle" align="center">MAE (dB)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">1:1:1</td>
<td valign="middle" align="center">2.3</td>
<td valign="middle" align="center">1.8</td>
</tr>
<tr>
<td valign="middle" align="center">1:1:50</td>
<td valign="middle" align="center">1.7</td>
<td valign="middle" align="center">1.3</td>
</tr>
<tr>
<td valign="middle" align="center">1:1:100</td>
<td valign="middle" align="center">1.2</td>
<td valign="middle" align="center">0.9</td>
</tr>
<tr>
<td valign="middle" align="center">1:1:200</td>
<td valign="middle" align="center">1.9</td>
<td valign="middle" align="center">1.5</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>RMSE, root mean square error; MAE, mean absolute error.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>When <inline-formula>
<mml:math display="inline" id="im109"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub><mml:mo>&lt;</mml:mo><mml:mn>100</mml:mn></mml:mrow></mml:math></inline-formula>, the physical constraint term is &#x201c;overwhelmed&#x201d; by the data term and boundary term, making it difficult for the model to learn the physical laws of acoustic propagation, and the error increases significantly. When <inline-formula>
<mml:math display="inline" id="im110"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>100</mml:mn></mml:mrow></mml:math></inline-formula>, the model achieves optimal performance: the RMSE and MAE are the smallest, the convergence speed is the fastest, and the physical constraint can fully exert its effect without excessively suppressing data fitting. When <inline-formula>
<mml:math display="inline" id="im111"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub><mml:mo>&gt;</mml:mo><mml:mn>100</mml:mn><mml:mo>,</mml:mo></mml:mrow></mml:math></inline-formula> the excessively high weight of the physical constraint causes the model to overemphasize satisfying the elliptic fluctuation equation, leading to increased deviation from real sound field data and decreased convergence stability.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Comparative experiments with other neural network methods</title>
<p>To verify the core advantage of physical constraints in the PINN, two typical pure data-driven models are selected for comparison:</p>
<list list-type="bullet">
<list-item>
<p>Comparative Model 1&#x2014;standard feedforward ANN: It has the same structure as the PINN in this study (5 hidden layers + 100 neurons + sine activation function), but the physical constraint term is removed (the loss function only retains <inline-formula>
<mml:math display="inline" id="im112"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>).</p></list-item>
<list-item>
<p>Comparative Model 2&#x2014;convolutional neural network (CNN): It adopts a structure of &#x201c;3 convolutional layers + 2 fully connected layers&#x201d;. The input is the encoded feature of <inline-formula>
<mml:math display="inline" id="im113"><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>r</mml:mi><mml:mo>,</mml:mo><mml:mi>z</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> coordinates, with no physical constraints, and the sound field mapping relationship is learned only through data-driven methods.</p></list-item>
</list>
<p>The number of training epochs is uniformly set to 50,000, and hyperparameters (learning rate, batch size, and activation function) remain consistent; the only difference lies in whether physical constraints are introduced.</p>
<p>The evaluation indicators are shown in <xref ref-type="table" rid="T4"><bold>Table&#xa0;4</bold></xref>.</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>Comparison of quantitative indicators among different models.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Model</th>
<th valign="middle" align="center">RMSE (dB)</th>
<th valign="middle" align="center">MAE (dB)</th>
<th valign="middle" align="center">MRE (%)</th>
<th valign="middle" align="center">R</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Proposed PINN (with physical constraints)</td>
<td valign="middle" align="center">1.2</td>
<td valign="middle" align="center">0.9</td>
<td valign="middle" align="center">3.2</td>
<td valign="middle" align="center">0.96</td>
</tr>
<tr>
<td valign="middle" align="center">Standard ANN (without physical constraints)</td>
<td valign="middle" align="center">3.5</td>
<td valign="middle" align="center">2.7</td>
<td valign="middle" align="center">9.8</td>
<td valign="middle" align="center">0.7</td>
</tr>
<tr>
<td valign="middle" align="center">CNN (without physical constraints)</td>
<td valign="middle" align="center">2.8</td>
<td valign="middle" align="center">2.1</td>
<td valign="middle" align="center">7.5</td>
<td valign="middle" align="center">0.78</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>RMSE, root mean square error; MAE, mean absolute error; MRE, mean relative error; PINN, physics-informed neural network; ANN, artificial neural network; CNN, convolutional neural network.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>Based on the comparative data in <xref ref-type="table" rid="T4"><bold>Table&#xa0;4</bold></xref>, the PINN model with physical constraints is comprehensively superior to purely data-driven models such as standard feedforward neural networks and convolutional neural networks in key performance indicators of underwater acoustic field prediction. From the perspective of error control, the RMSE, MAE, and MRE of the PINN are all significantly lower than those of the two types of purely data-driven models, reflecting its more accurate fitting of acoustic field propagation laws and stronger error stability. In contrast, purely data-driven models, due to the lack of constraints from acoustic physical laws, are prone to fitting deviations in complex acoustic field environments, resulting in higher values of various error indicators. From the perspective of fitting consistency, the correlation coefficient of the PINN is much higher than that of purely data-driven models and much closer to the ideal value of 1, indicating a higher degree of consistency between its predicted results and the real acoustic field, as well as its ability to more accurately replicate the intrinsic characteristics of acoustic field propagation.</p>
<p>This data comparison clearly confirms the key role of physical constraints: by integrating physical priors from the elliptic fluctuation equation, boundary conditions, and relevant acoustic theories, the PINN effectively compensates for the shortcomings of purely data-driven models, which rely on statistical features and lack physical logic guidance. This enables the PINN to maintain excellent prediction performance even in complex acoustic field scenarios, fully highlighting the performance advantages of the proposed PINN framework compared to purely data-driven methods.</p>
</sec>
</sec>
<sec id="s4" sec-type="conclusions">
<label>4</label>
<title>Conclusions and discussions</title>
<sec id="s4_1" sec-type="conclusions">
<label>4.1</label>
<title>Conclusions</title>
<p>Based on the experimental results in Section 4, we obtain the following experimental conclusions:</p>
<list list-type="order">
<list-item>
<p>The PINN structure is highly dependent on partially exact solutions as labeled data and must be adapted for complex ocean dynamics modeling problems that are difficult to learn for deep physical processes using only a simple fully connected layer structure.</p></list-item>
<list-item>
<p>In the deep learning process, hyperparameters have a great impact, such as the learning rate, the type of optimizer used, the activation function used, the number of hidden layers, the number of neurons in each layer, and some specific hyperparameters in the structure of the PINN, such as the weight of the loss function <inline-formula>
<mml:math display="inline" id="im114"><mml:mrow><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi><mml:mo>&#xa0;</mml:mo></mml:mrow></mml:msub><mml:mo>:</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>B</mml:mi><mml:mi>C</mml:mi></mml:mrow></mml:msub><mml:mo>&#xa0;</mml:mo><mml:mo>:</mml:mo><mml:msub><mml:mi>&#x3bb;</mml:mi><mml:mrow><mml:mi>P</mml:mi><mml:mi>D</mml:mi><mml:mi>E</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula>, have an important impact on the forecasting effect of the trained model and its applicability and need to be adjusted for many attempts.</p></list-item>
<list-item>
<p>During training, if the number of training rounds is low, there may be underfitting; the trained model is simpler and performs poorly on both the training and test sets. If the number of training rounds is too high, there may be overfitting; the model generalizes poorly and performs poorly on the test set.</p></list-item>
</list>
</sec>
<sec id="s4_2" sec-type="discussion">
<label>4.2</label>
<title>Discussions</title>
<p>In view of the above experimental conclusions, we propose several discussions:</p>
<list list-type="order">
<list-item>
<p>For the specific problem of sound field prediction, it is necessary to use some network structures that can be improved by extracting the features of the data using a small amount of labeled data. For example, <xref ref-type="bibr" rid="B11">Hu et&#xa0;al. (2023)</xref> proposed an augmented physics-informed neural network (APINN) based on region decomposition and parameter sharing strategy, which improved the efficiency and effectiveness of PINN in dealing with complex partial differential equations. <xref ref-type="bibr" rid="B31">Zeng et&#xa0;al. (2022)</xref> proposed a competitive physics-informed neural network (CPINN) based on reinforcement learning in adversarial ideas, which trained a discriminative network specifically scored for the errors generated by the PINN, which has significantly improved the robustness of the algorithm itself.</p></list-item>
<list-item>
<p>For the problem that hyperparameters have a large impact on the network, it is necessary to use the method of control variables and combine it with the experience of researchers in the references for tuning parameters for a specific problem, adjusting one hyperparameter at a time until the most suitable hyperparameters are tried out in combination. Some adaptive tuning algorithms can also be adopted to adjust the hyperparameters. For example, <xref ref-type="bibr" rid="B30">Wang et&#xa0;al. (2021)</xref> proposed a learning rate annealing algorithm to solve the problem of unstable imbalance in gradient size during gradient descent.</p></list-item>
<list-item>
<p>For the overfitting and underfitting problems in the training process, it is necessary to print out and save the changes in the loss function in time during the training process; according to the trend of its changes, it is necessary to stop early in the case where the loss function is just converged and the fitting effect is better without overfitting, and it is necessary to use the validation set to assist in the training if necessary.</p></list-item>
</list>
</sec>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material. Further inquiries can be directed to the corresponding author.</p></sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>LC: Writing &#x2013; original draft. LZ: Writing &#x2013; review &amp; editing. XS: Conceptualization, Writing &#x2013; review &amp; editing. JD: Data curation, Writing &#x2013; review &amp; editing. LY: Investigation, Writing &#x2013; review &amp; editing. XZ: Methodology, Writing &#x2013; review &amp; editing. JC: Software, Writing &#x2013; review &amp; editing.</p></sec>
<ack>
<title>Acknowledgments</title>
<p>The authors would like to thank SPIB (Signal Processing Information Base), where the related data originally come from.</p>
</ack>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s9" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that Generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Collis</surname> <given-names>J. M.</given-names></name>
<name><surname>Siegmann</surname> <given-names>W. L.</given-names></name>
<name><surname>Jensen</surname> <given-names>F. B.</given-names></name>
<name><surname>Zampolli</surname> <given-names>M.</given-names></name>
<name><surname>K&#xfc;sel</surname> <given-names>E. T.</given-names></name>
<name><surname>Collins</surname> <given-names>M. D.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>Parabolic equation solution of seismo-acoustics problems involving variations in bathymetry and sediment thickness</article-title>. <source>J. Acoustical Soc. America</source> <volume>123</volume>, <fpage>51</fpage>&#x2013;<lpage>55</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1121/1.2799932</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cybenko</surname> <given-names>G.</given-names></name>
</person-group> (<year>1989</year>). 
<article-title>Approximation by superpositions of a sigmoidal function</article-title>. <source>Mathematics control signals Syst.</source> <volume>2</volume>, <fpage>303</fpage>&#x2013;<lpage>314</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF02551274</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="web">
<person-group person-group-type="author">
<name><surname>Dean</surname> <given-names>J.</given-names></name>
<name><surname>Monga</surname> <given-names>R.</given-names></name>
</person-group> (<year>2015</year>).
<article-title>TensorFlow Large-scale machine learning on heterogeneous distributed systems</article-title>. Available online at: <uri xlink:href="http://www.TensorFlow.org">TensorFlow.org</uri>.
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Du</surname> <given-names>L.</given-names></name>
<name><surname>Wang</surname> <given-names>Z.</given-names></name>
<name><surname>Lv</surname> <given-names>Z.</given-names></name>
<name><surname>Wang</surname> <given-names>L.</given-names></name>
<name><surname>Han</surname> <given-names>D.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Research on underwater acoustic field prediction method based on physics-informed neural network</article-title>. <source>Front. Mar. Sci.</source> <volume>10</volume>, <elocation-id>1302077</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2023.1302077</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Duan</surname> <given-names>J.</given-names></name>
<name><surname>Zhao</surname> <given-names>H.</given-names></name>
<name><surname>Song</surname> <given-names>J.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Spatial domain decomposition-based physics-informed neural networks for practical acoustic propagation estimation under ocean dynamics</article-title>. <source>J. Acoustical Soc. America</source> <volume>155</volume>, <fpage>3306</fpage>&#x2013;<lpage>3321</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1121/10.0026025</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fogarty</surname> <given-names>T. R.</given-names></name>
<name><surname>LeVeque</surname> <given-names>R. J.</given-names></name>
</person-group> (<year>1999</year>). 
<article-title>High-resolution finite-volume methods for acoustic waves in periodic and random media</article-title>. <source>J. Acoustical Soc. America</source> <volume>106</volume>, <fpage>17</fpage>&#x2013;<lpage>28</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1121/1.428038</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="confproc">
<person-group person-group-type="author">
<name><surname>Gao</surname> <given-names>Y.</given-names></name>
<name><surname>Xiao</surname> <given-names>P.</given-names></name>
<name><surname>Li</surname> <given-names>Z.</given-names></name>
</person-group> (<year>2024</year>). &#x201c;
<article-title>Physics-informed neural networks for solving underwater two dimensional sound field</article-title>,&#x201d; in <conf-name>2024 OES China Ocean Acoustics (COA)</conf-name>. <fpage>1</fpage>&#x2013;<lpage>4</lpage> (
<publisher-name>IEEE</publisher-name>).
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Godin</surname> <given-names>O.</given-names></name>
</person-group> (<year>1992</year>). 
<article-title>Theory of sound propagation in layered moving media</article-title>. <source>J. Acoustical Soc. America</source> <volume>92</volume>, <fpage>3442</fpage>&#x2013;<lpage>3442</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1121/1.404150</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Han</surname> <given-names>J.</given-names></name>
<name><surname>Jentzen</surname> <given-names>A.</given-names></name>
<name><surname>E</surname> <given-names>W.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>Solving high-dimensional partial differential equations using deep learning</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>115</volume>, <fpage>8505</fpage>&#x2013;<lpage>8510</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1718942115</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hornik</surname> <given-names>K.</given-names></name>
<name><surname>Stinchcombe</surname> <given-names>M.</given-names></name>
<name><surname>White</surname> <given-names>H.</given-names></name>
</person-group> (<year>1989</year>). 
<article-title>Multilayer feedforward networks are universal approximators</article-title>. <source>Neural Networks</source> <volume>2</volume>, <fpage>359</fpage>&#x2013;<lpage>366</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0893-6080(89)90020-8</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hu</surname> <given-names>Z.</given-names></name>
<name><surname>Jagtap</surname> <given-names>A. D.</given-names></name>
<name><surname>Karniadakis</surname> <given-names>G. E.</given-names></name>
<name><surname>Kawaguchi</surname> <given-names>K.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Augmented physics-informed neural networks (apinns): A gating network-based soft domain decomposition methodology</article-title>. <source>Eng. Appl. Artif. Intell.</source> <volume>126</volume>, <fpage>107183</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.engappai.2023.107183</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Huang</surname> <given-names>Z.</given-names></name>
<name><surname>An</surname> <given-names>L.</given-names></name>
<name><surname>Ye</surname> <given-names>Y.</given-names></name>
<name><surname>Wang</surname> <given-names>X.</given-names></name>
<name><surname>Cao</surname> <given-names>H.</given-names></name>
<name><surname>Du</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>A broadband modeling method for range-independent underwater acoustic channels using physics-informed neural networks</article-title>. <source>J. Acoustical Soc. America</source> <volume>156</volume>, <fpage>3523</fpage>&#x2013;<lpage>3533</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1121/10.0034458</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Jensen</surname> <given-names>F. B.</given-names></name>
<name><surname>Kuperman</surname> <given-names>W. A.</given-names></name>
<name><surname>Porter</surname> <given-names>M. B.</given-names></name>
<name><surname>Schmidt</surname> <given-names>H.</given-names></name>
<name><surname>Tolstoy</surname> <given-names>A.</given-names></name>
</person-group> (<year>2011</year>). <source>Computational ocean acoustics</source> Vol. <volume>2011</volume> (
<publisher-name>Springer</publisher-name>).
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>K.</given-names></name>
<name><surname>Chitre</surname> <given-names>M.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Data-aided underwater acoustic ray propagation modeling</article-title>. <source>IEEE J. Oceanic Eng.</source> <volume>48</volume>, <fpage>1127</fpage>&#x2013;<lpage>1148</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/JOE.2023.3292417</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>Z.</given-names></name>
<name><surname>Kovachki</surname> <given-names>N.</given-names></name>
<name><surname>Azizzadenesheli</surname> <given-names>K.</given-names></name>
<name><surname>Liu</surname> <given-names>B.</given-names></name>
<name><surname>Bhattacharya</surname> <given-names>K.</given-names></name>
<name><surname>Stuart</surname> <given-names>A.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>Fourier neural operator for parametric partial differential equations</article-title>. <source>arXiv preprint arXiv:2010.08895</source>.
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>W.</given-names></name>
<name><surname>Zhang</surname> <given-names>L.</given-names></name>
<name><surname>Wang</surname> <given-names>Y.</given-names></name>
<name><surname>Cheng</surname> <given-names>X.</given-names></name>
<name><surname>Xiao</surname> <given-names>W.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>A vector wavenumber integration model of underwater acoustic propagation based on the matched interface and boundary method</article-title>. <source>J. Mar. Sci. Eng.</source> <volume>9</volume>, <fpage>1134</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/jmse9101134</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lu</surname> <given-names>L.</given-names></name>
<name><surname>Jin</surname> <given-names>P.</given-names></name>
<name><surname>Karniadakis</surname> <given-names>G. E.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Deeponet: Learning nonlinear operators for identifying differential equations based on the universal approximation theorem of operators</article-title>. <source>arXiv preprint arXiv:1910.03193</source>.
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lu</surname> <given-names>Y.</given-names></name>
<name><surname>Zhang</surname> <given-names>H.</given-names></name>
<name><surname>Pan</surname> <given-names>X.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>Numerical simulation of flow-field and flow-noise of a fully appendage submarine</article-title>. <source>J. Vibration Shock</source> <volume>27</volume>, <fpage>142</fpage>&#x2013;<lpage>146</lpage>.
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ma</surname> <given-names>Y.</given-names></name>
<name><surname>Yu</surname> <given-names>D.</given-names></name>
<name><surname>Wu</surname> <given-names>T.</given-names></name>
<name><surname>Wang</surname> <given-names>H.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Paddlepaddle: An open-source deep learning platform from industrial practice</article-title>. <source>Front. Data Domputing</source> <volume>1</volume>, <fpage>105</fpage>&#x2013;<lpage>115</lpage>.
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mallik</surname> <given-names>W.</given-names></name>
<name><surname>Jaiman</surname> <given-names>R. K.</given-names></name>
<name><surname>Jelovica</surname> <given-names>J.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Predicting transmission loss in underwater acoustics using convolutional recurrent autoencoder network</article-title>. <source>J. Acoustical Soc. America</source> <volume>152</volume>, <fpage>1627</fpage>&#x2013;<lpage>1638</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1121/10.0013894</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Paszke</surname> <given-names>A.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Pytorch: An imperative style, high-performance deep learning library</article-title>. <source>arXiv preprint arXiv:1912.01703</source>.
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Pekeris</surname> <given-names>C. L.</given-names></name>
</person-group> (<year>1948</year>). 
<article-title>Theory of propagation of explosive sound in shallow water</article-title>. doi:&#xa0;<pub-id pub-id-type="doi">10.1130/MEM27</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Porter</surname> <given-names>M. B.</given-names></name>
</person-group> (<year>1992</year>). 
<article-title>The kraken normal mode program</article-title>.
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Raissi</surname> <given-names>M.</given-names></name>
<name><surname>Perdikaris</surname> <given-names>P.</given-names></name>
<name><surname>Karniadakis</surname> <given-names>G. E.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Physics-informed neural networks: A deep learning framework for solving forward and inverse problems involving nonlinear partial differential equations</article-title>. <source>J. Comput. Phys.</source> <volume>378</volume>, <fpage>686</fpage>&#x2013;<lpage>707</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jcp.2018.10.045</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Schmidt</surname> <given-names>H.</given-names></name>
<name><surname>Glattetre</surname> <given-names>J.</given-names></name>
</person-group> (<year>1985</year>). 
<article-title>A fast field model for three-dimensional wave propagation in stratified environments based on the global matrix method</article-title>. <source>J. Acoustical Soc. America</source> <volume>78</volume>, <fpage>2105</fpage>&#x2013;<lpage>2114</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1121/1.392670</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Song</surname> <given-names>C.</given-names></name>
<name><surname>Alkhalifah</surname> <given-names>T.</given-names></name>
<name><surname>Waheed</surname> <given-names>U. B.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>A versatile framework to solve the helmholtz equation using physics-informed neural networks</article-title>. <source>Geophysical J. Int.</source> <volume>228</volume>, <fpage>1750</fpage>&#x2013;<lpage>1762</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gji/ggab434</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Stephen</surname> <given-names>R. A.</given-names></name>
</person-group> (<year>1988</year>). 
<article-title>A review of finite difference methods for seismo-acoustics problems at the seafloor</article-title>. <source>Rev. Geophysics</source> <volume>26</volume>, <fpage>445</fpage>&#x2013;<lpage>458</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/RG026i003p00445</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Thompson</surname> <given-names>L. L.</given-names></name>
</person-group> (<year>2006</year>). 
<article-title>A review of finite-element methods for time-harmonic acoustics</article-title>. <source>J. Acoustical Soc. America</source> <volume>119</volume>, <fpage>1315</fpage>&#x2013;<lpage>1330</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1121/1.2164987</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Tu</surname> <given-names>H.</given-names></name>
<name><surname>Wang</surname> <given-names>Y.</given-names></name>
<name><surname>Yang</surname> <given-names>C.</given-names></name>
<name><surname>Liu</surname> <given-names>W.</given-names></name>
<name><surname>Wang</surname> <given-names>X.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>A chebyshev&#x2013;tau spectral method for coupled modes of underwater sound propagation in range-dependent ocean environments</article-title>. <source>Phys. Fluids</source> <volume>35</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1063/5.0138012</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>S.</given-names></name>
<name><surname>Teng</surname> <given-names>Y.</given-names></name>
<name><surname>Perdikaris</surname> <given-names>P.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Understanding and mitigating gradient flow pathologies in physics-informed neural networks</article-title>. <source>SIAM J. Sci. Computing</source> <volume>43</volume>, <fpage>A3055</fpage>&#x2013;<lpage>A3081</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1137/20M1318043</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zeng</surname> <given-names>Q.</given-names></name>
<name><surname>Kothari</surname> <given-names>Y.</given-names></name>
<name><surname>Bryngelson</surname> <given-names>S. H.</given-names></name>
<name><surname>Sch&#xe4;fer</surname> <given-names>F.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Competitive physics informed networks</article-title>. <source>arXiv preprint arXiv:2204.11144</source>.
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/342712">Chunyan Li</ext-link>, Louisiana State University, United States</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1956798">Tianyu Zhang</ext-link>, Guangdong Ocean University, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3152385">Zhengyu Hou</ext-link>, Sun Yat-sen University, China</p></fn>
</fn-group>
<fn-group>
<fn fn-type="abbr" id="abbrev1">
<label>Abbreviations:</label>
<p>PINN, physics-informed neural network; WE, wave equation; HE, Helmholtz equation; WI, wavenumber integration; NM, normal mode; PE, parabolic equation; PDE, partial differential equation; FDM, finite difference method; FEM, finite element method; FVM, finite volume method; BEM, boundary element method; DeepONet, Deep Operator Network; FNO, Fourier Neural Operator.</p>
</fn>
</fn-group>
</back>
</article>