<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Clim.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Climate</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Clim.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2624-9553</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fclim.2026.1776202</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>A physical-environment-driven multi-stream deep neural network for short-term heavy precipitation potential identification</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Jie</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2914602"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>An</surname>
<given-names>Jingjing</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yao</surname>
<given-names>Chen</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wu</surname>
<given-names>Zhaoye</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1507001"/>
<role>reviewer</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Huimin</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhou</surname>
<given-names>Xiaoye</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Gaoping</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wu</surname>
<given-names>Ruijiao</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Anhui Provincial Meteorological Observatory</institution>, <city>Hefei</city>, <state>Anhui</state>, <country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>Anhui Provincial Meteorological Information Centre</institution>, <city>Hefei</city>, <state>Anhui</state>, <country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>&#x002A;</label>Correspondence: Jingjing An, <email xlink:href="mailto:anjingjing@amo.mobi">anjingjing@amo.mobi</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-04">
<day>04</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>8</volume>
<elocation-id>1776202</elocation-id>
<history>
<date date-type="received">
<day>27</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>14</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2026 Liu, An, Yao, Wu, Li, Zhou, Liu and Wu.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Liu, An, Yao, Wu, Li, Zhou, Liu and Wu</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-04">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Accurate identification of short-term heavy precipitation (STHP), governed by multiscale atmospheric processes, is critical for effective disaster prevention and mitigation. Conventional statistical methods often fail to capture the complex nonlinear relationships inherent in multidimensional atmospheric systems, whereas deep learning (DL) approaches exhibit significant advantages in multi-factor fusion. However, existing DL architectures typically process heterogeneous inputs through single-branch networks, resulting in feature redundancy, and suffer from limited interpretability&#x2014;the &#x201C;black box&#x201D; problem&#x2014;that undermines operational reliability. To address these challenges, this study proposes a physics-driven multi-stream deep neural network (MSDNN) framework, complemented by interpretability analysis using the integrated gradients (IG) method. Using observational data from 976 meteorological stations in Anhui Province and ERA5 reanalysis data from 2021 to 2024, we categorized 71 environmental physical variables into five distinct input streams according to physical characteristics: water vapor conditions, dynamic conditions, thermal instability, composite indices, and height layer properties. The split-merge architecture of MSDNN enables integrated processing of these five feature categories, achieving accurate identification of STHP. Results show that the MSDNN model achieved a threat score (TS) of 0.851 and a Matthews correlation coefficient (MCC) of 0.844 on the test set, significantly outperforming both conventional ensemble learning methods (LightGBM, Random forest) and single-branch deep neural network (DNN). IG-based attribution analysis revealed that dynamic factors contributed most substantially to model performance (45%), followed by thermal (25%), vertical structure (15%), moisture-related (10%), and composite indices (5%). Furthermore, this study identified critical nonlinear thresholds: contribution polarity reversal at 80% relative humidity (700&#x202F;hPa), strong sensitivity to upward vertical velocity (500&#x202F;hPa). These quantified feature interactions provide data-driven physical insights into precipitation triggering mechanisms, elucidating the synergistic roles of moisture transport, dynamic lifting, and thermal instability. The MSDNN-IG framework establishes a technical pathway for severe convective weather identification that harmonizes accuracy with physical transparency, enhancing both the credibility and practical utility of AI methods in operational warning systems.</p>
</abstract>
<kwd-group>
<kwd>atmospheric physical variables</kwd>
<kwd>integrated gradients (IG)</kwd>
<kwd>machine learning</kwd>
<kwd>potential identification</kwd>
<kwd>short-term heavy precipitation (STHP)</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This research was funded by the Science and Technology Innovation Tackling Key Problems of Anhui Province &#x201C;Technology R&#x0026;D and application of a high-resolution precipitation-runoff forecasting model for the Lianjiang river basin&#x201D; (202523p09050001); Natural Science Foundation of Anhui Province &#x201C;Research on key technologies for strong convection forecast and early warning under complex terrain conditions&#x201D; (2408055UQ002); China Meteorological Administration innovative development project &#x201C;Research on the application of &#x2018;Feng Lei&#x2019; model in short-term landslide meteorological risk forecasting&#x201D; (CXFZ2025Q008).</funding-statement>
</funding-group>
<counts>
<fig-count count="6"/>
<table-count count="5"/>
<equation-count count="9"/>
<ref-count count="53"/>
<page-count count="17"/>
<word-count count="10090"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Climate Monitoring</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Short-term heavy precipitation (STHP) refers to high-intensity precipitation events occurring over a short period, typically lasting 1&#x2013;6&#x202F;h, with rainfall rates generally exceeding 20&#x202F;mm/h&#x202F;s (<xref ref-type="bibr" rid="ref41">Xu et al., 2023</xref>). These events are closely associated with deep convective systems and exhibit strong locality and temporal abruptness (<xref ref-type="bibr" rid="ref28">Ravuri et al., 2021</xref>; <xref ref-type="bibr" rid="ref5">Chiappa et al., 2024</xref>; <xref ref-type="bibr" rid="ref54">Zhou et al., 2023</xref>). STHP frequently triggers secondary disasters such as urban waterlogging, flash floods, landslides, and debris flows, posing severe threats to socioeconomic development and public safety (<xref ref-type="bibr" rid="ref42">Yan et al., 2024</xref>; <xref ref-type="bibr" rid="ref23">Llasat et al., 2021</xref>). Against the background of global warming, STHP events have shown a significant increase in both frequency and intensity, particularly in urbanized regions (<xref ref-type="bibr" rid="ref11">Fowler et al., 2021</xref>). A study by <xref ref-type="bibr" rid="ref5">Chiappa et al. (2024)</xref> further reported a rising trend in extreme short-term summer precipitation across the central and eastern United States between 2003 and 2023, attributing this trend primarily to the influence of mesoscale convective systems (MCSs). Consequently, elucidating the influence mechanisms of environmental physical fields on MCSs is critical for improving the identification and early warning capabilities for such high-impact weather events.</p>
<p>The occurrence of STHP involves complex interactions among multiple atmospheric physical variables, especially the synergistic effects of thermal, moisture, and dynamic processes (<xref ref-type="bibr" rid="ref36">Tian et al., 2015</xref>; <xref ref-type="bibr" rid="ref4">Bhowmik et al., 2008</xref>). Variations in key parameters&#x2014;such as temperature, humidity, and wind profiles across different atmospheric layers&#x2014;often act as direct precursors to STHP events. Understanding the nonlinear relationships and spatiotemporal variability of these physical variables is thus essential for accurate STHP identification. To translate these physical principles into operational applications, numerical weather prediction (NWP) systems, specifically convection-permitting models, have become the cornerstone by explicitly simulating multiscale atmospheric dynamics (<xref ref-type="bibr" rid="ref3">Bauer et al., 2015</xref>; <xref ref-type="bibr" rid="ref34">Sun et al., 2014</xref>). However, the representation of extreme precipitation in NWP remains hindered by sensitivities in convective parameterizations and initial condition uncertainties, which often lead to spatial and temporal displacements in rainfall identification (<xref ref-type="bibr" rid="ref44">Yano et al., 2018</xref>). To compensate for these dynamical modeling deficiencies, previous studies have primarily relied on statistical approaches (e.g., significance testing, multiple regression) combined with radiosonde observations or reanalysis datasets to analyze typical STHP cases, identify triggering mechanisms, and derive threshold values for key parameters, such as convective available potential energy (CAPE), vertical wind shear, and lower- to mid-tropospheric humidity, within specific spatiotemporal contexts (<xref ref-type="bibr" rid="ref31">Shen et al., 2016</xref>; <xref ref-type="bibr" rid="ref49">Zhang et al., 2021</xref>). Nevertheless, these methods depend heavily on expert knowledge for case selection and subjective interpretation, limiting their capacity to extract nuanced patterns and subtle discriminative features from large-scale datasets (<xref ref-type="bibr" rid="ref38">Wang et al., 2020</xref>). Moreover, conventional statistical techniques are inherently constrained in modeling complex multi-physical interactions, failing to adequately capture the underlying relationships among multidimensional variables and accurately characterize their intrinsic dynamical couplings.</p>
<p>In recent years, artificial intelligence (AI) algorithms have become important tools for mining petabyte-scale meteorological datasets to support modern synoptic forecasting and identification (<xref ref-type="bibr" rid="ref52">Zheng et al., 2015</xref>; <xref ref-type="bibr" rid="ref29">Reichstein et al., 2019</xref>). Ensemble learning methods, including Random forest (RF), support vector machines (SVM), and extreme gradient boosting (XGBoost), have shown particular promise in extreme precipitation identification. By integrating multi-source observations such as surface measurements, radiosonde data, NWP outputs, and satellite/radar retrievals, these methods effectively identify thermodynamic and kinematic signatures characteristic of STHP. As a result, they consistently outperform both raw dynamical models and conventional statistical approaches in terms of skill scores and extreme event detection (<xref ref-type="bibr" rid="ref30">Retsch et al., 2022</xref>; <xref ref-type="bibr" rid="ref21">Li et al., 2024a</xref>; <xref ref-type="bibr" rid="ref14">Hess and Boers, 2022</xref>; <xref ref-type="bibr" rid="ref26">Nie et al., 2023</xref>). Deep learning (DL) architectures further extend these capabilities by capturing complex nonlinear relationships within multidimensional physical fields. <xref ref-type="bibr" rid="ref53">Zhou et al. (2019)</xref> developed a six-layer convolutional neural network (CNN) trained on NCEP reanalysis data that effectively classifies multiple severe convective weather types&#x2014;including STHP, hail, and thunderstorm gales&#x2014;surpassing both RF and SVM in skill score. <xref ref-type="bibr" rid="ref47">Zhang et al. (2024)</xref> developed a hybrid architecture that integrates convolutional neural network (CNN)-based spatial feature extraction with a bidirectional long short-term memory (BiLSTM) network and an attention mechanism (CNN-BiLSTM-AM). When applied to ERA5 reanalysis data, this architecture demonstrates superior probability of detection and threat scores for 1&#x2013;6&#x202F;h convective forecasts. At the global scale, AI-based weather prediction systems such as GraphCast and Pangu-Weather generate high-resolution (0.25&#x00B0;) resolution forecasts of temperature, humidity, and vertical wind shear within minutes, providing efficient preliminary assessment of convective potential up to 10&#x202F;days in advance (<xref ref-type="bibr" rid="ref10">Feldmann et al., 2024</xref>).</p>
<p>Although AI techniques have demonstrated preliminary success in identifying environmental physical fields associated with STHP, several critical challenges remain unresolved. First, the physical mechanisms driving STHP require the synergistic interaction of thermal instability, abundant moisture supply, dynamic lifting, and appropriate vertical wind shear (<xref ref-type="bibr" rid="ref51">Zhao et al., 2025</xref>). Given the distinct categorical characteristics and physical mechanisms represented by these environmental variables, the prevailing practice of undifferentiated input into unified architectures requires critical re-examination. Inspired by methodological advances in multimodal learning, we posit that implementing dedicated input pathways for heterogeneous feature categories could better preserve their intrinsic physical structures, thereby potentially enhancing the generalization capacity of STHP discrimination models (<xref ref-type="bibr" rid="ref20">Li et al., 2025</xref>; <xref ref-type="bibr" rid="ref17">Khan et al., 2025</xref>). Second, current research predominantly emphasizes identification accuracy, while paying insufficient attention to interpreting model decision mechanisms&#x2014;particularly the quantitative contribution of different physical variables to STHP occurrence. The imperative to unravel complex nonlinear transformations within deep neural networks, thereby demystifying their &#x201C;black-box&#x201D; nature, remains crucial for enhancing operational trustworthiness and guiding model refinement in STHP identification (<xref ref-type="bibr" rid="ref8">Du et al., 2019</xref>; <xref ref-type="bibr" rid="ref43">Yang et al., 2024</xref>). The integrated gradients (IG) method, which computes gradient integrals along the path from baseline to input, offers a promising approach for assigning quantitative importance scores to input features. This technique can identify key variables closely aligned with STHP physical mechanisms, thereby providing both scientific insight into deep convection triggering and practical guidance for identification performance.</p>
<p>To address these research gaps, this study develops a physics-aware multi-scale deep neural network (MSDNN) framework that explicitly incorporates categorized environmental physical features for STHP identification. Combined with the IG interpretability method, this study aims to establish an interpretable STHP identification system that clarifies the roles of different physical variables in convective initiation. The specific research objectives are as: (1) to construct an STHP identification framework based on the MSDNN architecture using ERA5 reanalysis data; (2) to enhance model interpretability through IG-based attribution analysis, quantifying the contributions and interactive effects of various physical features to STHP identification.</p>
</sec>
<sec id="sec2">
<label>2</label>
<title>Study area and data source</title>
<sec id="sec3">
<label>2.1</label>
<title>Study area</title>
<p>This study focuses on Anhui Province in eastern China (116.5&#x00B0;&#x2013;119.5&#x00B0; E, 29.5&#x00B0;&#x2013;31.2&#x00B0; N) (<xref ref-type="fig" rid="fig1">Figure 1a</xref>), covering approximately 140,000 km<sup>2</sup>. Located within the core region of the East Asian monsoon, the province experiences an average annual precipitation exceeding 1,200&#x202F;mm, with pronounced spatiotemporal variability&#x2014;over 70% of the annual total occurs from May to September (<xref ref-type="fig" rid="fig1">Figure 1c</xref>) (<xref ref-type="bibr" rid="ref39">Wang et al., 2024</xref>; <xref ref-type="bibr" rid="ref40">Wu et al., 2022</xref>). As a transitional zone between northern and southern climate regimes, Anhui is influenced by both cold air masses from Siberia and warm, moist flows from the Pacific Ocean, resulting in a complex atmospheric circulation system. This climatic configuration fosters frequent severe convective weather, including STHP events with intensities reaching 80&#x2013;100&#x202F;mm per hour (<xref ref-type="bibr" rid="ref13">Hao et al., 2012</xref>).</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Location of the study area <bold>(a)</bold>, topography of the study area and the distribution of meteorological stations <bold>(b)</bold>, and the monthly average precipitation and its proportion in the whole year in the study area from 1991 to 2020 <bold>(c)</bold>.</p>
</caption>
<graphic xlink:href="fclim-08-1776202-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel (a) shows a map of China with Anhui Province highlighted in red and Beijing marked with a star. Panel (b) displays a detailed elevation map of Anhui Province with green areas indicating lower elevation and yellow-to-red for higher elevation, featuring meteorological stations as purple dots, administrative center Hefei in a circle, neighboring provinces labeled, and a lake marked in blue. Panel (c) presents a combination chart where bars represent the proportion of annual precipitation for each month, while a line graph indicates the monthly total precipitation in millimeters, highlighting a peak during June and July.</alt-text>
</graphic>
</fig>
<p>The topography of Anhui is markedly heterogeneous (<xref ref-type="fig" rid="fig1">Figure 1b</xref>). The Yangtze and Huaihe Rivers divide the province into three distinct subregions: the Huaibei Plain in the north, characterized by flat terrain and agricultural landscapes; the central Jianghuai Hilly Area, which includes the western Dabie Mountains; and the southern Jiangnan Region, dominated by the mountainous terrain of Southern Anhui. Orographic lifting in the Southern Anhui and Dabie Mountains significantly enhances local precipitation intensity and frequency (<xref ref-type="bibr" rid="ref18">Kim et al., 2022</xref>; <xref ref-type="bibr" rid="ref37">Tong et al., 2017</xref>), often inducing secondary hazards such as flash floods and landslides. These precipitation patterns also contribute considerable uncertainty to flood risks in the Yangtze and Huaihe River basins.</p>
<p>The interplay of complex geography and monsoonal climate supports diverse dynamic&#x2013;thermal coupling mechanisms for precipitation formation (<xref ref-type="fig" rid="fig1">Figure 1c</xref>). Combined with the high density of meteorological stations across the region (<xref ref-type="fig" rid="fig1">Figure 1b</xref>), Anhui Province offers an ideal natural laboratory for studying multi-scale physical processes of STHP in a climatic transition zone, thereby supporting improved early warning systems and regional disaster prevention strategies.</p>
</sec>
<sec id="sec4">
<label>2.2</label>
<title>Data sources</title>
<sec id="sec5">
<label>2.2.1</label>
<title>Observed precipitation data</title>
<p>Hourly precipitation data were obtained from 976 meteorological stations managed by the Anhui Provincial Meteorological Administration (<xref ref-type="fig" rid="fig1">Figure 1b</xref>), covering the period from March to September for the years 2021&#x2013;2024. The stations are distributed relatively uniformly across the study area, enabling effective characterization of mesoscale spatiotemporal precipitation variability. In accordance with operational and research conventions, STHP events were defined as those with hourly precipitation &#x2265;20&#x202F;mm. Samples meeting this criterion were labeled as positive (STHP events) sample, while the remainder were classified as negative (non-STHP) samples. To minimize the influence of localized, isolated heavy rainfall, positive samples were filtered following the method of <xref ref-type="bibr" rid="ref21">Li et al. (2024a)</xref>, requiring concurrent STHP occurrence at a minimum of five stations. This screening process yielded 12,082 validated positive samples. To address class imbalance in the dataset, 13,290 negative samples were selected from precipitation-free and light-precipitation records at 16 national-level manned meteorological stations.</p>
</sec>
<sec id="sec6">
<label>2.2.2</label>
<title>ERA5 reanalysis data</title>
<p>To represent the large-scale circulation and thermodynamic environment associated with STHP, this study employed the ERA5 reanalysis dataset from the European Centre for Medium-Range Weather Forecasts (ECMWF). Generated using the IFS Cycle 41R2 and a 4D-Var data assimilation system, ERA5 integrates multi-source global observations&#x2014;including satellite, surface, and radiosonde data&#x2014;and has been widely validated for reliably reproducing atmospheric evolution (<xref ref-type="bibr" rid="ref32">Soci et al., 2024</xref>; <xref ref-type="bibr" rid="ref22">Li et al., 2024b</xref>). Data were retrieved from the official ECMWF portal.<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref></p>
<p>Hourly reanalysis fields from March to September (2021&#x2013;2024) were selected, with a spatial resolution of 0.25&#x00B0;&#x202F;&#x00D7;&#x202F;0.25&#x00B0;, covering the study area and its surroundings. The dataset includes surface variables (e.g., 2-m temperature, 2-m dewpoint, 10-m winds, surface pressure) and multi-level meteorological elements (e.g., temperature, geopotential height, relative humidity, wind vectors). To ensure spatiotemporal consistency with station observations, all reanalysis data were aligned to synoptic hours and interpolated to station locations using the nearest-neighbor method, forming an integrated dataset for subsequent modeling and analysis.</p>
</sec>
<sec id="sec7">
<label>2.2.3</label>
<title>Extraction of multi-category atmospheric environmental physical variables</title>
<p>Based on the ERA5 reanalysis, 71 atmospheric environmental physical variables were systematically derived to comprehensively characterize the environmental conditions governing the development and occurrence of STHP. These variables span five core categories: moisture conditions, dynamic conditions, thermal conditions, composite indices, and vertical-level characteristics. Specifically, moisture conditions cover humidity distribution and moisture transport; dynamic conditions include dynamic lift and shear structures (key to convective triggering); thermal conditions involve foundational thermal properties; composite indices encompass convective available potential energy (CAPE), stability indices, and other integrated diagnostics; while vertical-level characteristics directly link to stratification features such as key temperature levels and condensation heights. This multi-dimensional variable system enables diversified representation of the physical processes underlying STHP initiation and evolution. The classification and distribution of the 71 variables are summarized in <xref ref-type="table" rid="tab1">Table 1</xref>, with detailed computational formulas provided in <xref ref-type="supplementary-material" rid="SM1">Supplementary Table S1</xref>.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Physical variables used in this study.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Category</th>
<th align="left" valign="top">Subcategory</th>
<th align="left" valign="top">Physical variables</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" rowspan="4">Humidity-related variables (HRV)</td>
<td align="left" valign="middle">Specific humidity</td>
<td align="left" valign="middle">500&#x202F;hPa specific humidity (specific_humidity_500), 700&#x202F;hPa specific humidity (specific_humidity_700), 850&#x202F;hPa specific humidity (specific_humidity_850)</td>
</tr>
<tr>
<td align="left" valign="middle">Relative humidity</td>
<td align="left" valign="middle">500&#x202F;hPa relative humidity (RH_500), 700&#x202F;hPa relative humidity (RH_700), 850&#x202F;hPa relative humidity (RH_850), 950&#x202F;hPa relative humidity (RH_950)</td>
</tr>
<tr>
<td align="left" valign="middle">Dew point temperature</td>
<td align="left" valign="middle">700&#x202F;hPa dew point temperature (td_level_700), 850&#x202F;hPa dew point temperature (td_level_850), 950&#x202F;hPa dew point temperature (td_level_950)</td>
</tr>
<tr>
<td align="left" valign="middle">Integrated humidity</td>
<td align="left" valign="middle">Precipitable water vapor (pwv)</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="7">Wind and vertical motion variables (WVV)</td>
<td align="left" valign="middle">Horizontal divergence</td>
<td align="left" valign="middle">500&#x202F;hPa divergence (divergence_500), 700&#x202F;hPa divergence (divergence_700), 850&#x202F;hPa divergence (divergence_850)</td>
</tr>
<tr>
<td align="left" valign="middle">Vorticity</td>
<td align="left" valign="middle">500&#x202F;hPa vorticity (vor_500), 700&#x202F;hPa vorticity (vor_700), 850&#x202F;hPa vorticity (vor_850), 950&#x202F;hPa vorticity (vor_950)</td>
</tr>
<tr>
<td align="left" valign="middle">Vertical speed</td>
<td align="left" valign="middle">500&#x202F;hPa vertical speed (vertical_speed_500), 700&#x202F;hPa vertical speed (vertical_speed_700), 850&#x202F;hPa vertical speed (vertical_speed_850), 950&#x202F;hPa vertical speed (vertical_speed_950)</td>
</tr>
<tr>
<td align="left" valign="middle">Wind speed difference and average</td>
<td align="left" valign="middle">Average wind speed at 6&#x202F;km altitude and on the ground (avg_6), Wind speed difference between 2&#x202F;km altitude and the ground (wdiff_speed_02), Wind speed difference between 6&#x202F;km altitude and the ground (wdiff_speed_06), Wind speed difference between 6&#x202F;km altitude and 3&#x202F;km altitude (wdiff_speed_36), Inflow Parameter (inflow)</td>
</tr>
<tr>
<td align="left" valign="middle">Wind direction difference</td>
<td align="left" valign="middle">Wind direction difference between 2&#x202F;km altitude and the ground (wdiff_dir_02), Wind direction difference between 6&#x202F;km altitude and the ground (wdiff_dir_06), Wind direction difference between 6&#x202F;km altitude and 3&#x202F;km altitude (wdiff_dir_36)</td>
</tr>
<tr>
<td align="left" valign="middle">Maximum wind speed</td>
<td align="left" valign="middle">Maximum wind speed above 500&#x202F;hPa (mxw_GH_500), Maximum wind speed below 500&#x202F;hPa (mxw_LE_500)</td>
</tr>
<tr>
<td align="left" valign="middle">Southwest wind component</td>
<td align="left" valign="middle">200&#x202F;hPa southwest wind component (sw_wind_200), 500&#x202F;hPa southwest wind component (sw_wind_500), 850&#x202F;hPa southwest wind component (sw_wind_850), 950&#x202F;hPa southwest wind component (sw_wind_950)</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Stability and energy indices (SEI)</td>
<td align="left" valign="middle">Common convective indices</td>
<td align="left" valign="middle">CAPE (cape_index), A index (a_index), K index (k_index), Li index (li_index), Best Lifted index (bli), SI index (si_index), Total index (tot_index), J index (j_index)</td>
</tr>
<tr>
<td align="left" valign="middle">Temperature-related parameters</td>
<td align="left" valign="middle">The temperature difference between 850&#x202F;hPa and 500&#x202F;hPa (t8_t5), 500&#x202F;hPa theta-e (theta_se_level_500), 700&#x202F;hPa theta-e (theta_se_level_700), 850&#x202F;hPa theta-e (theta_se_level_850), 950&#x202F;hPa theta-e (theta_se_level_950)</td>
</tr>
<tr>
<td align="left" valign="middle">Downward energy</td>
<td align="left" valign="middle">DCAPE (dcape)</td>
</tr>
<tr>
<td align="left" valign="middle">Stratification-related indices</td>
<td align="left" valign="middle">IC Index (ic), IL Index (il), ILC Index (ilc)</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Severe convection and storm indices (SSI)</td>
<td align="left" valign="middle">Severe convection warning indices</td>
<td align="left" valign="middle">Storm strength index (ssi_index), SWEAT index (sweat_index), Swiss index (swiss), Deep convection index (dci_index), Modified deep convection index (mdci)</td>
</tr>
<tr>
<td align="left" valign="middle">Helicity-related indices</td>
<td align="left" valign="middle">Energy helicity index (ehi), Surface helicity (heli0)</td>
</tr>
<tr>
<td align="left" valign="middle">Buoyancy parameters</td>
<td align="left" valign="middle">Bulk Richardson number (brn_index)</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Height and thickness variables (HTV)</td>
<td align="left" valign="middle">Characteristic heights</td>
<td align="left" valign="middle">The height of the 0&#x00B0;C level (temp0)</td>
</tr>
<tr>
<td align="left" valign="middle">Height difference and thickness</td>
<td align="left" valign="middle">The thickness of the air column between &#x2212;20&#x202F;&#x00B0;C and 0&#x202F;&#x00B0;C (dpt_thickness)</td>
</tr>
<tr>
<td align="left" valign="middle">LCL, CCL sub-parameters</td>
<td align="left" valign="middle">The height difference between Lifting Condensation Level (LCL) and Convective Condensation Level (CCL) (lcl_ccl_difference), LCL Pressure (lcl_p), LCL Temperature (lcl_t), LCL Height (lcl_h), CCL Pressure (ccl_p), CCL Temperature (ccl_t), CCL Dew Point Temperature (ccl_td), CCL Height (ccl_h)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
</sec>
<sec sec-type="methods" id="sec8">
<label>3</label>
<title>Methods</title>
<p><xref ref-type="fig" rid="fig2">Figure 2</xref> illustrates the comprehensive methodological framework of this study, which comprises two interconnected components. The first component focuses on developing the MSDNN architecture for high-accuracy STHP discrimination, with systematic performance comparisons against established benchmark methods including RF, light gradient boosting machine (LightGBM, LGB), and conventional deep neural networks (DNN). The second component employs Integrated Gradients (IG) interpretability analysis to quantify the influence of different environmental variables on model decisions, specifically identifying key meteorological drivers and determining their critical physical thresholds for STHP occurrence.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Technical roadmap of this study.</p>
</caption>
<graphic xlink:href="fclim-08-1776202-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Flowchart outlining a three-step process for analyzing physical variables and precipitation: Step one covers data collection and preprocessing from meteorological observations and ECMWF ERA5 reanalysis; step two details model construction, evaluation, and comparison using multiple deep neural network branches and indicators; step three involves analyzing feature importance and nonlinear relationships with integrated gradients and threshold analysis, including visual feature ranking and a scatterplot of variable thresholds.</alt-text>
</graphic>
</fig>
<sec id="sec9">
<label>3.1</label>
<title>Multi-stream deep neural network (MSDNN)</title>
<p>DNN is designed to extract hierarchical feature representations from raw inputs through successive nonlinear transformations. A standard layer-wise mapping can be summarized as:</p>
<disp-formula id="E1">
<mml:math id="M1">
<mml:mi mathvariant="normal">h</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>&#x03C3;</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>Wx</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mspace width="0.25em"/>
<mml:mspace width="0.25em"/>
</mml:math>
<label>(1)</label>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="E1">Equation 1</xref>, where x represents the input features, W and b denote the trainable weight matrix and bias vector, respectively, and <inline-formula>
<mml:math id="M2">
<mml:mi>&#x03C3;</mml:mi>
</mml:math>
</inline-formula> is the nonlinear activation function. While powerful, standard DNN often encounter performance plateaus when processing multi-source meteorological data. In such scenarios, directly concatenating variables with disparate physical meanings and statistical scales (e.g., moisture vs. dynamic factors) can dilute the expressive capacity of individual feature streams and hinder the model&#x2019;s ability to capture category-specific nuances.</p>
<p>To address these limitations, this study introduces a MSDNN framework (<xref ref-type="fig" rid="fig3">Figure 3</xref>). The core architectural philosophy is to decouple the initial feature extraction into five specialized sub-networks: SSI (severe convection and storm indices), HTV (height and thickness variables), HRV (humidity-related variables), SEI (stability and energy indices), and WVV (wind and vertical motion variables). Formally, the transformation for each sub-network <inline-formula>
<mml:math id="M3">
<mml:mi mathvariant="normal">i</mml:mi>
</mml:math>
</inline-formula> is expressed as:</p>
<disp-formula id="E2">
<mml:math id="M4">
<mml:msub>
<mml:mi mathvariant="normal">h</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">f</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>3</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>4</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>5</mml:mn>
</mml:math>
<label>(2)</label>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="E2">Equation 2</xref>, where <inline-formula>
<mml:math id="M5">
<mml:msub>
<mml:mi mathvariant="normal">f</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> denotes the nonlinear mapping function of the <inline-formula>
<mml:math id="M6">
<mml:mi mathvariant="normal">i</mml:mi>
</mml:math>
</inline-formula>-th sub-network, <inline-formula>
<mml:math id="M7">
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> represents its trainable parameters, and <inline-formula>
<mml:math id="M8">
<mml:msub>
<mml:mi mathvariant="normal">h</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> corresponds to the latent feature representation of that specific stream. These multi-stream features are subsequently integrated within a fusion layer, typically through concatenation or weighted combination:</p>
<disp-formula id="E3">
<mml:math id="M9">
<mml:msub>
<mml:mi mathvariant="normal">h</mml:mi>
<mml:mtext>fusion</mml:mtext>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mi mathvariant="normal">g</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">h</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">h</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mo>,</mml:mo>
<mml:mo>,</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">h</mml:mi>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mtext>fusion</mml:mtext>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
<label>(3)</label>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="E3">Equation 3</xref>, where <inline-formula>
<mml:math id="M10">
<mml:mi mathvariant="normal">g</mml:mi>
</mml:math>
</inline-formula> denotes the fusion function and <inline-formula>
<mml:math id="M11">
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mtext>fusion</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula> represents the parameters of the fusion stage. The resulting integrated representation is then fed into a fully connected layer, with the final identification result <inline-formula>
<mml:math id="M12">
<mml:mi mathvariant="normal">y</mml:mi>
</mml:math>
</inline-formula> generated through activation function mapping:</p>
<disp-formula id="E4">
<mml:math id="M13">
<mml:mi mathvariant="normal">y</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>&#x03C3;</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>Wh</mml:mi>
<mml:mtext>fusion</mml:mtext>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
<label>(4)</label>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="E4">Equation 4</xref>, where <inline-formula>
<mml:math id="M14">
<mml:mi>&#x03C3;</mml:mi>
</mml:math>
</inline-formula> denotes the nonlinear activation function <inline-formula>
<mml:math id="M15">
<mml:mi mathvariant="normal">W</mml:mi>
</mml:math>
</inline-formula> represents the learnable weight matrix that linearly projects the fused feature vector and <inline-formula>
<mml:math id="M16">
<mml:mi mathvariant="normal">b</mml:mi>
</mml:math>
</inline-formula> is the trainable bias vector that shifts the activation threshold.</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Architecture of the multi-stream deep neural network (MSDNN). The notation &#x2018;Dense (n&#x202F;&#x2192;&#x202F;m)&#x2019; represents a fully connected layer mapping n input neurons to m output neurons. Swish denotes the activation function.</p>
</caption>
<graphic xlink:href="fclim-08-1776202-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Neural network architecture diagram showing five inputs named SSI, HTV, HRV, SEI, and WVV, each passing through multiple dense layers with Swish activation and batch normalization, followed by concatenation, additional dense and dropout layers, and ending with a sigmoid-activated output for classification.</alt-text>
</graphic>
</fig>
<p>As illustrated in <xref ref-type="fig" rid="fig3">Figure 3</xref>, each sub-network channel is composed of stacked dense layers interspersed with batch normalization (BN) and Swish activation functions [<inline-formula>
<mml:math id="M17">
<mml:mtext>Swish</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:mtext>sigmoid</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">]</mml:mo>
</mml:math>
</inline-formula>. The notation Dense (<inline-formula>
<mml:math id="M18">
<mml:msub>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mtext mathvariant="italic">in</mml:mtext>
</mml:msub>
<mml:mo>&#x2192;</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mtext mathvariant="italic">out</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula>) signifies a fully connected layer projecting an input dimension of <inline-formula>
<mml:math id="M19">
<mml:msub>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mtext mathvariant="italic">in</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula> to an output dimension of <inline-formula>
<mml:math id="M20">
<mml:msub>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mtext mathvariant="italic">out</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula>. Notably, the WVV stream is assigned a deeper initial architecture (two layers: 25&#x202F;&#x2192;&#x202F;64&#x202F;&#x2192;&#x202F;128) compared to other streams. This specific design is motivated by the high dimensionality (25 features) and the complex, multi-scale turbulent nature of wind field and vorticity data, which requires a larger hypothesis space to capture the non-linear fluid dynamics essential for STHP identification. Following three stages of stream-specific abstraction, the latent representations are integrated into a 1,152-dimensional fused vector, which is processed through two deep transformation layers (1,152&#x202F;&#x2192;&#x202F;512&#x202F;&#x2192;&#x202F;512) to model complex physical interactions. To ensure numerical stability and generalization, we implemented a multi-tier regularization strategy: (1) BN (<xref ref-type="bibr" rid="ref15">Ioffe and Szegedy, 2015</xref>) is applied after each major transformation stage to stabilize training. (2) A Dropout layer (rate&#x202F;=&#x202F;0.5) is inserted before the final output (<xref ref-type="bibr" rid="ref2">Baldi and Sadowski, 2013</xref>), randomly deactivating 50% of neurons to prevent co-adaptation and enhance generalization. (3) The final layer projects the representation to a single unit (512&#x202F;&#x2192;&#x202F;1) with a Sigmoid activation function to generate the probability of STHP occurrence.</p>
<p>The MSDNN was trained using the binary cross-entropy loss function and the Adam optimizer (<xref ref-type="bibr" rid="ref19">Kingma and Ba, 2014</xref>). To facilitate convergence, an adaptive learning rate strategy (ranging from 10<sup>&#x2212;5</sup> to 10<sup>&#x2212;3</sup>) was employed over a maximum of 10,000 epochs with a batch size of 32. To evaluate its performance, two ensemble learning algorithms&#x2014;RF and LGB&#x2014;were employed as benchmarks. RF utilizes a Bagging framework to reduce variance through collective decision-tree voting, while LGB implements a gradient boosting framework optimized by gradient-based one-side sampling (GOSS) and exclusive feature bundling (EFB) to enhance efficiency and handle large-scale datasets. These models serve as relevant baselines for assessing the MSDNN&#x2019;s capacity to capture the complex nonlinear relationships inherent in STHP identification. Detailed hyperparameter specifications are provided in <xref ref-type="table" rid="tab2">Table 2</xref>.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>The hyper-parameters of models and their values.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Models</th>
<th align="left" valign="top">Hyperparameter</th>
<th align="left" valign="top">Description</th>
<th align="center" valign="top">Values</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" rowspan="6">MSDNN</td>
<td align="left" valign="middle">batch_size</td>
<td align="left" valign="middle">Batch size</td>
<td align="center" valign="middle">32</td>
</tr>
<tr>
<td align="left" valign="middle">Learning_rate</td>
<td align="left" valign="middle">Learning rate</td>
<td align="center" valign="middle">0.00001&#x202F;~&#x202F;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">dropout</td>
<td align="left" valign="middle">Dropout</td>
<td align="center" valign="middle">0.5</td>
</tr>
<tr>
<td align="left" valign="middle">Loss</td>
<td align="left" valign="middle">Loss function</td>
<td align="center" valign="middle">binary_crossentropy</td>
</tr>
<tr>
<td align="left" valign="middle">epoch</td>
<td align="left" valign="middle">Number of epoch</td>
<td align="center" valign="middle">10,000</td>
</tr>
<tr>
<td align="left" valign="middle">optimizer</td>
<td align="left" valign="middle">Optimizer</td>
<td align="center" valign="middle">Adam</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="6">DNN</td>
<td align="left" valign="middle">batch_size</td>
<td align="left" valign="middle">Batch size</td>
<td align="center" valign="middle">32</td>
</tr>
<tr>
<td align="left" valign="middle">Learning_rate</td>
<td align="left" valign="middle">Learning rate</td>
<td align="center" valign="middle">0.00001&#x202F;~&#x202F;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">dropout</td>
<td align="left" valign="middle">Dropout</td>
<td align="center" valign="middle">0.5</td>
</tr>
<tr>
<td align="left" valign="middle">Loss</td>
<td align="left" valign="middle">Loss function</td>
<td align="center" valign="middle">binary_crossentropy</td>
</tr>
<tr>
<td align="left" valign="middle">epoch</td>
<td align="left" valign="middle">Number of epoch</td>
<td align="center" valign="middle">10,000</td>
</tr>
<tr>
<td align="left" valign="middle">optimizer</td>
<td align="left" valign="middle">Optimizer</td>
<td align="center" valign="middle">Adam</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="6">RF</td>
<td align="left" valign="middle">Ntree</td>
<td align="left" valign="middle">Number of decision trees</td>
<td align="center" valign="middle">500</td>
</tr>
<tr>
<td align="left" valign="middle">Maxdeep</td>
<td align="left" valign="middle">Maximum deep of trees</td>
<td align="center" valign="middle">8</td>
</tr>
<tr>
<td align="left" valign="middle">Mtry</td>
<td align="left" valign="middle">Number of randomly selected features</td>
<td align="center" valign="middle">0.1</td>
</tr>
<tr>
<td align="left" valign="middle">Maxnodes</td>
<td align="left" valign="middle">Maximum number of nodes</td>
<td align="center" valign="middle">None</td>
</tr>
<tr>
<td align="left" valign="middle">min_samples_split</td>
<td align="left" valign="middle">Minimum samples split</td>
<td align="center" valign="middle">20</td>
</tr>
<tr>
<td align="left" valign="middle">Nodesize</td>
<td align="left" valign="middle">Minimum number of samples per leaf node</td>
<td align="center" valign="middle">1</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="9">LightGBM</td>
<td align="left" valign="middle">Ntree</td>
<td align="left" valign="middle">Number of decision trees</td>
<td align="center" valign="middle">500</td>
</tr>
<tr>
<td align="left" valign="middle">Maxdeep</td>
<td align="left" valign="middle">Maximum deep of trees</td>
<td align="center" valign="middle">10</td>
</tr>
<tr>
<td align="left" valign="middle">Num_leaves</td>
<td align="left" valign="middle">Number of leaf nodes</td>
<td align="center" valign="middle">30</td>
</tr>
<tr>
<td align="left" valign="middle">min_child_sample</td>
<td align="left" valign="middle">Minimum number of samples required in a leaf node</td>
<td align="center" valign="middle">2</td>
</tr>
<tr>
<td align="left" valign="middle">Learning_rate</td>
<td align="left" valign="middle">Learning rate</td>
<td align="center" valign="middle">0.03</td>
</tr>
<tr>
<td align="left" valign="middle">subsample</td>
<td align="left" valign="middle">Fraction of samples used for fitting each tree</td>
<td align="center" valign="middle">0.5</td>
</tr>
<tr>
<td align="left" valign="middle">colsample_bytree</td>
<td align="left" valign="middle">Fraction of features used for fitting each tree</td>
<td align="center" valign="middle">0.5</td>
</tr>
<tr>
<td align="left" valign="middle">Alpha_l1</td>
<td align="left" valign="middle">Regularization for the L1 coefficient</td>
<td align="center" valign="middle">0.1</td>
</tr>
<tr>
<td align="left" valign="middle">Lambda_l2</td>
<td align="left" valign="middle">Regularization for the L2 coefficient</td>
<td align="center" valign="middle">0.1</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec10">
<label>3.2</label>
<title>Integrated gradients (IG) interpretability method</title>
<p>To quantify the marginal contribution of individual environmental physical variables to STHP discrimination, we employed the IG method for feature attribution analysis in the MSDNN model. Introduced by <xref ref-type="bibr" rid="ref35">Sundararajan et al. (2017)</xref>, IG satisfies fundamental axiomatic properties including sensitivity and implementation invariance, while offering completeness in attribution. This approach overcomes limitations of gradient-based methods in saturated regions through path integration.</p>
<p>Assume that the output probability of a MSDNN for the positive &#x201C;STHP&#x201D; class is <inline-formula>
<mml:math id="M21">
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2208;</mml:mo>
<mml:mo stretchy="true">[</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">]</mml:mo>
</mml:math>
</inline-formula>, where <inline-formula>
<mml:math id="M22">
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>3</mml:mn>
<mml:mo>&#x2026;</mml:mo>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:math>
</inline-formula> denotes the sample input and <inline-formula>
<mml:math id="M23">
<mml:msubsup>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
</mml:math>
</inline-formula> represents the baseline value. IG is defined as the integral of the gradient of the output with respect to each feature along the straight-line path from the baseline to the sample:</p>
<disp-formula id="E5">
<mml:math id="M24">
<mml:msub>
<mml:mi>IG</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
<mml:msubsup>
<mml:mo>&#x222B;</mml:mo>
<mml:mrow>
<mml:mi>&#x03B1;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mn>1</mml:mn>
</mml:msubsup>
<mml:mfrac>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
<mml:mo>+</mml:mo>
<mml:mi>&#x03B1;</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:msubsup>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
</mml:mrow>
</mml:mfrac>
<mml:mi mathvariant="italic">d&#x03B1;</mml:mi>
</mml:math>
<label>(5)</label>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="E5">Equation 5</xref>, where <inline-formula>
<mml:math id="M25">
<mml:msub>
<mml:mi>IG</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> represents the attribution of the <inline-formula>
<mml:math id="M26">
<mml:mi mathvariant="normal">i</mml:mi>
</mml:math>
</inline-formula>-th feature to the sample<inline-formula>
<mml:math id="M27">
<mml:mspace width="0.25em"/>
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>,<inline-formula>
<mml:math id="M28">
<mml:mfrac>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mi>F</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:math>
</inline-formula> represents the gradient of the model output with respect to the input features. Using Riemann summation for approximation, m equidistant steps are sampled within the interval <inline-formula>
<mml:math id="M29">
<mml:mo stretchy="true">[</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">]</mml:mo>
</mml:math>
</inline-formula>, yielding <xref ref-type="disp-formula" rid="E6">Equation 6</xref>:</p>
<disp-formula id="E6">
<mml:math id="M30">
<mml:msub>
<mml:mi>IG</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2248;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mi mathvariant="normal">m</mml:mi>
</mml:mfrac>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi mathvariant="normal">k</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi mathvariant="normal">m</mml:mi>
</mml:munderover>
<mml:mfrac>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mi>F</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
<mml:mo>+</mml:mo>
<mml:mi mathvariant="normal">k</mml:mi>
<mml:mo>/</mml:mo>
<mml:mi mathvariant="normal">m</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:math>
<label>(6)</label>
</disp-formula>
<p>Owing to its completeness property, the sum of attributions across all features equals the total contribution to the model output <inline-formula>
<mml:math id="M31">
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> relative to the baseline. This allows the model&#x2019;s output probability to be decomposed into the baseline probability and the sum of individual feature attributions, yielding <xref ref-type="disp-formula" rid="E7">Equation 7</xref>:</p>
<disp-formula id="E7">
<mml:math id="M32">
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2248;</mml:mo>
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:munderover>
<mml:msub>
<mml:mi>IG</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
<label>(7)</label>
</disp-formula>
<p>In this study, the five-branch MSDNN processes 71 environmental variables for binary classification. IG computations were performed in the original input space following tensor preprocessing. For each sample, gradients were accumulated along integration paths from baselines to actual inputs across all five branches, generating feature-level attributions subsequently aggregated into sample-level spectra. To ensure numerical stability, stochastic components (e.g., Batch Normalization and Dropout) were disabled during inference. The integration step parameter m was set to 200, optimizing between computational efficiency and approximation accuracy.</p>
<p>The selection of baseline inputs critically influences IG attribution, as it establishes a reference state representing neutral or non-informative conditions. From this baseline, feature values are progressively introduced to quantify their contributions to model decision. To ensure physically meaningful inputs, we defined the baseline as the median vector computed across negative samples (non-STHP events, label&#x202F;=&#x202F;0) in the training set. Specifically, for each of the 71 physical variables, we calculated the median value from all negative samples to construct a 71-dimensional reference input. This choice is motivated by two key considerations: (1) Unlike zero vectors or random noise&#x2014;which often correspond to physically unrealistic atmospheric states (e.g., zero humidity or zero geopotential height)&#x2014;the median of non-STHP samples represents a climatologically stable and meteorologically plausible reference regime. (2) By anchoring the baseline to observed non-convective conditions, the IG integration path traverses realistic atmospheric transitions (e.g., from stable to unstable stratification), thereby yielding physically interpretable attributions that reflect how deviations from typical &#x201C;no-precipitation&#x201D; environments contribute to STHP occurrence. This baseline represents typical non-convective environmental conditions, ensuring the integration path remains within meteorologically stable regimes. Compared to model outputs <inline-formula>
<mml:math id="M33">
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msup>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> derived from this baseline typically exhibit low probabilities, this approach aligns with the physical narrative of transitioning from &#x201C;non-convective&#x201D; to &#x201C;potentially convective&#x201D; conditions.</p>
<p>We implemented the IG method using the Python captum library,<xref ref-type="fn" rid="fn0002"><sup>2</sup></xref> which handles gradient computation and path integration through the Integrated Gradients function. For global feature importance assessment, we calculated absolute attribution values for all test samples and averaged them across the dataset. Results were visualized using swarm plots and bar charts to display attribution distributions and importance scores, while partial dependence plots were employed to analyze how interactions between key physical variables influence STHP identification.</p>
</sec>
<sec id="sec11">
<label>3.3</label>
<title>Algorithm implementation and evaluation</title>
<p>All algorithms were evaluated on the same dataset randomly partitioned into training and test sets using an 8:2 ratio. The training set served for hyperparameter optimization and model development, while the test set was reserved exclusively for performance evaluation. To ensure reproducibility and minimize randomness in data partitioning, all experiments employed a fixed random seed (seed&#x202F;=&#x202F;42). All models were trained and evaluated on identical data splits, ensuring fair and consistent comparative analysis. This study formulates STHP identification as a binary classification task, where samples with STHP occurrence are labeled positive and non-STHP samples as negative. Model performance was assessed using a confusion matrix (<xref ref-type="table" rid="tab3">Table 3</xref>) and threat score (TS), supplemented by derived metrics including true positives (TP), false positives (FP), true negatives (TN), and false negatives (FN).</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Confusion matrix.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th>Actual/predicted</th>
<th align="left" valign="top">Predicted positive</th>
<th align="left" valign="top">Predicted negative</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Actual positive</td>
<td align="left" valign="top">True positive (TP)</td>
<td align="left" valign="top">False negative (FN)</td>
</tr>
<tr>
<td align="left" valign="top">Actual negative</td>
<td align="left" valign="top">False positive (FP)</td>
<td align="left" valign="top">True negative (TN)</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The TS and Matthews correlation coefficient (MCC) were calculated as primary evaluation metrics. The TS (<xref ref-type="disp-formula" rid="E8">Equation 8</xref>), widely adopted in the verification of meteorological event identification (<xref ref-type="bibr" rid="ref50">Zhao, 2022</xref>) and assesses the accuracy of event-based identification by accounting for TP, FP, and FN. The MCC (<xref ref-type="disp-formula" rid="E9">Equation 9</xref>) provides a balanced measure of classification quality across both classes, representing the correlation between identified and observed binary outcomes (<xref ref-type="bibr" rid="ref6">Chicco and Jurman, 2023</xref>; <xref ref-type="bibr" rid="ref33">Stoica and Babu, 2024</xref>). The computational formulas are as follows:</p>
<disp-formula id="E8">
<mml:math id="M34">
<mml:mi>TS</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mi>TP</mml:mi>
<mml:mrow>
<mml:mi>TP</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>FP</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>FN</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:math>
<label>(8)</label>
</disp-formula>
<disp-formula id="E9">
<mml:math id="M35">
<mml:mi>MCC</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>TP</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mi>TN</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>FP</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mi>FN</mml:mi>
</mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>TP</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>FP</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>TP</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>FN</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>TN</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>FP</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>TN</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>FN</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
</mml:msqrt>
</mml:mfrac>
</mml:math>
<label>(9)</label>
</disp-formula>
<p>The TS ranges from 0 to 1, where a value of 1 indicates perfect identification and 0 denotes complete identification failure. The MCC ranges from &#x2212;1 to 1, where 1 represents perfect identification, 0 equates to random guessing, and &#x2212;1 indicates total disagreement between identified and observed outcomes. Both metrics place particular emphasis on the accurate identification of STHP events, making them suitable for evaluating the rate of missed detections and false alarms of the models.</p>
</sec>
</sec>
<sec sec-type="results" id="sec12">
<label>4</label>
<title>Results</title>
<sec id="sec13">
<label>4.1</label>
<title>Performance comparison between MSDNN and benchmark models</title>
<p>This study evaluates the performance of the proposed MSDNN for STHP identification against three benchmark models&#x2014;LGB, RF, and DNN. Comprehensive performance metrics across both training and test datasets are systematically compared in <xref ref-type="table" rid="tab4">Table 4</xref>.</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>The results of different models on the training set and the test set.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Models</th>
<th align="center" valign="top" colspan="2">Training set</th>
<th align="center" valign="top" colspan="2">Test set</th>
</tr>
<tr>
<th align="center" valign="top">TS</th>
<th align="center" valign="top">MCC</th>
<th align="center" valign="top">TS</th>
<th align="center" valign="top">MCC</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">MSDNN</td>
<td align="char" valign="top" char=".">0.952</td>
<td align="char" valign="top" char=".">0.953</td>
<td align="char" valign="top" char=".">0.851</td>
<td align="char" valign="top" char=".">0.844</td>
</tr>
<tr>
<td align="left" valign="top">DNN</td>
<td align="char" valign="top" char=".">0.927</td>
<td align="char" valign="top" char=".">0.927</td>
<td align="char" valign="top" char=".">0.842</td>
<td align="char" valign="top" char=".">0.832</td>
</tr>
<tr>
<td align="left" valign="top">LGB</td>
<td align="char" valign="top" char=".">0.907</td>
<td align="char" valign="top" char=".">0.906</td>
<td align="char" valign="top" char=".">0.808</td>
<td align="char" valign="top" char=".">0.791</td>
</tr>
<tr>
<td align="left" valign="top">RF</td>
<td align="char" valign="top" char=".">0.755</td>
<td align="char" valign="top" char=".">0.723</td>
<td align="char" valign="top" char=".">0.711</td>
<td align="char" valign="top" char=".">0.663</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>On the training set, the MSDNN demonstrated exceptional capability, achieving the highest TS of 0.952 and MCC of 0.953, surpassing all comparative models. LGB (TS&#x202F;=&#x202F;0.907, MCC&#x202F;=&#x202F;0.906) and RF (TS&#x202F;=&#x202F;0.755, MCC&#x202F;=&#x202F;0.723) showed substantial performance gaps relative to the MSDNN. Confusion matrix analysis (<xref ref-type="fig" rid="fig4">Figure 4</xref>) further revealed that the MSDNN correctly identified 98.9% of positive samples (STHP events), exceeding the DNN (98.3%), LGB (97.5%), and RF (92.1%). For negative samples, the MSDNN attained a recognition rate of 96.5%, outperforming the DNN (94.5%), LightGBM (93.2%), and RF (80.0%). On the test set, although all models experienced performance degradation, the MSDNN maintained superior ability with a TS of 0.851 and MCC of 0.844. These results slightly exceeded those of the DNN (TS&#x202F;=&#x202F;0.842, MCC&#x202F;=&#x202F;0.832) and substantially outperformed LGB (TS&#x202F;=&#x202F;0.808, MCC&#x202F;=&#x202F;0.791) and RF (TS&#x202F;=&#x202F;0.711, MCC&#x202F;=&#x202F;0.663), indicating limited generalization capacity of the traditional ensemble methods in operational identification scenarios. Confusion matrix analysis (<xref ref-type="fig" rid="fig4">Figure 4</xref>) for the test set confirmed that the MSDNN correctly identified 95.3% of positive samples, marginally higher than the DNN (95.1%) and LGB (93.3%), and significantly exceeding RF (89.0%). For negative samples, the MSDNN achieved a recognition rate of 89.2%, again surpassing the DNN (88.2%), LGB (85.9%), and RF (77.1%).</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Confusion matrices of the MSDNN <bold>(a,e)</bold>, DNN <bold>(b,f)</bold>, LGB <bold>(c,g)</bold>, and RF <bold>(d,h)</bold> on the training <bold>(a&#x2013;d)</bold> and test <bold>(e&#x2013;h)</bold> datasets.</p>
</caption>
<graphic xlink:href="fclim-08-1776202-g004.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Eight heatmap confusion matrices compare model predictions for both training and test datasets using MSDNN, DNN, LGB, and RF algorithms. Each panel shows actual negative and positive cases against predicted values, with color intensity representing the number of samples, ranging from zero to over nine thousand or two thousand depending on dataset size. Panels (a) to (d) are for training datasets, while (e) to (h) correspond to test datasets. Each matrix details true positives, false positives, true negatives, and false negatives for each algorithm and dataset split.</alt-text>
</graphic>
</fig>
<p>The MSDNN consistently achieved optimal performance across both primary evaluation metrics (TS and MCC), demonstrating statistically significant advantages over traditional ensemble methods and a measurable improvement over the standard DNN architecture. Notably, the model exhibited enhanced stability and superior generalization capability in accurately identification both positive and negative cases, underscoring its practical potential for operational STHP identification.</p>
</sec>
<sec id="sec14">
<label>4.2</label>
<title>Interpretability of the MSDNN for STHP discrimination</title>
<sec id="sec15">
<label>4.2.1</label>
<title>Global importance analysis of environmental physical variables</title>
<p><xref ref-type="fig" rid="fig5">Figure 5</xref> presents the global importance of environmental physical variables. The five variables exhibiting the strongest contributions to MSDNN model were 700&#x202F;hPa relative humidity&#x3001;inflow parameter&#x3001;500&#x202F;hPa vertical speed&#x3001;700&#x202F;hPa specific humidity and maximum wind speed above 500&#x202F;hPa, each attaining mean absolute attribution scores approaching 0.1. Among these, 500&#x202F;hPa vertical speed and 700&#x202F;hPa specific humidity demonstrated significant negative correlations with model output: stronger upward motion enhanced positive contributions to STHP identification, whereas higher specific humidity unexpectedly increased negative influence. In contrast, 700&#x202F;hPa relative humidity, inflow parameter, and maximum wind speed above 500&#x202F;hPa consistently contributed positively to STHP discrimination. Categorical analysis of the top 20 features revealed that dynamic conditions dominated model decisions (45%), followed by thermal (25%), vertical structure (15%), moisture-related (10%), and composite indices (5%), indicating the primacy of dynamic processes in STHP formation within the MSDNN framework. To mitigate bias from unequal feature counts across categories, we further compared the top five variables per type (<xref ref-type="table" rid="tab5">Table 5</xref>). Dynamic, moisture, and thermal variables exhibited substantially higher mean attribution scores than comprehensive indices and vertical level parameters. Dynamic features achieved the highest overall importance, while moisture variables showed pronounced variability&#x2014;driven predominantly by the strong but opposing influences of 700&#x202F;hPa relative humidity and 700&#x202F;hPa specific humidity.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Global and category-specific importance of environmental physical variables based on Integrated gradients (IG). <bold>(a)</bold> Ranks the top 20 most influential variables across the entire feature set. <bold>(b&#x2013;f)</bold> Illustrate the internal importance rankings within each specialized category: <bold>(b)</bold> 11 humidity-related variables, <bold>(c)</bold> 17 stability and energy indices, <bold>(d)</bold> 25 wind and vertical motion variables, <bold>(e)</bold> 7 severe convection and storm indices, and <bold>(f)</bold> 10 height and thickness variables. The IG value quantifies the impact of each feature on the model output, where values above zero represent a positive contribution to STHP identification, and higher magnitudes indicate greater relative importance.</p>
</caption>
<graphic xlink:href="fclim-08-1776202-g005.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Six bar charts display the mean absolute IG for feature importance across different categories: (a) top twenty of seventy-one physical quantity features, (b) HRV, (c) SEI, (d) WVV, (e) SSI, and (f) HTV. X-axes list feature names, while y-axes indicate mean absolute IG values, visualizing the relative contribution and ranking of each feature within its group. All charts are labeled and have clear axes.</alt-text>
</graphic>
</fig>
<table-wrap position="float" id="tab5">
<label>Table 5</label>
<caption>
<p>Statistics of the IG attribution scores of the physical features for the five input categories.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Feature types</th>
<th align="center" valign="top">Mean</th>
<th align="center" valign="top">Max</th>
<th align="center" valign="top">Min</th>
<th align="center" valign="top">CV</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="bottom">HRV</td>
<td align="char" valign="bottom" char=".">0.089</td>
<td align="char" valign="bottom" char=".">0.191</td>
<td align="char" valign="bottom" char=".">0.045</td>
<td align="char" valign="bottom" char=".">0.638</td>
</tr>
<tr>
<td align="left" valign="bottom">WVV</td>
<td align="char" valign="bottom" char=".">0.108</td>
<td align="char" valign="bottom" char=".">0.148</td>
<td align="char" valign="bottom" char=".">0.072</td>
<td align="char" valign="bottom" char=".">0.300</td>
</tr>
<tr>
<td align="left" valign="bottom">SEI</td>
<td align="char" valign="bottom" char=".">0.086</td>
<td align="char" valign="bottom" char=".">0.131</td>
<td align="char" valign="bottom" char=".">0.062</td>
<td align="char" valign="bottom" char=".">0.282</td>
</tr>
<tr>
<td align="left" valign="bottom">SSI</td>
<td align="char" valign="bottom" char=".">0.048</td>
<td align="char" valign="bottom" char=".">0.075</td>
<td align="char" valign="bottom" char=".">0.037</td>
<td align="char" valign="bottom" char=".">0.294</td>
</tr>
<tr>
<td align="left" valign="bottom">HTV</td>
<td align="char" valign="bottom" char=".">0.060</td>
<td align="char" valign="bottom" char=".">0.092</td>
<td align="char" valign="bottom" char=".">0.046</td>
<td align="char" valign="bottom" char=".">0.283</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec16">
<label>4.2.2</label>
<title>Combined effects of environmental physical variables on the MSDNN</title>
<p>To elucidate the relative contributions and underlying mechanisms of various environmental physical variables in the MSDNN&#x2019;s discrimination of STHP, we performed an interpretability analysis of all 71 input features using the IG algorithm. <xref ref-type="fig" rid="fig6">Figure 6</xref> presents scatter plots depicting the relationship between IG attribution scores and corresponding physical values for the 20 most influential variables, ranked by contribution magnitude. In this representation, positive IG values indicate a feature&#x2019;s promoting effect on STHP occurrence, whereas negative values reflect an inhibitory influence, with the absolute magnitude quantifying the strength of each feature&#x2019;s contribution.</p>
<fig position="float" id="fig6">
<label>Figure 6</label>
<caption>
<p>Attribution value dependence plot for the top 20 environmental physical variables <bold>(a&#x2013;t)</bold> used in the discrimination of short-time heavy precipitation (STHP) weather. The y-axis represents the IG values of the features and the x-axis represents the actual values of the features.</p>
</caption>
<graphic xlink:href="fclim-08-1776202-g006.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Scatterplot matrix showing twenty individual charts labeled a to t, each graphing IG Value versus a different meteorological variable such as RH_700, inflow, vertical_speed_500, specific_humidity_700, and others. Data points are densely clustered, and each subplot highlights different relationships or distributions between IG Value and its corresponding feature. Each axis is clearly labeled with variable names and numerical increments.</alt-text>
</graphic>
</fig>
<p>Attribution patterns exhibit distinct distributions across variable categories, highlighting the MSDNN&#x2019;s capacity to extract discriminative signals from multi-category, multi-level atmospheric environmental factors. Dynamic and moisture-related variables&#x2014;including 700&#x202F;hPa relative humidity, inflow parameter, vertical velocities, southwesterly wind components at multiple levels&#x2014;collectively demonstrated the strongest positive contributions, underscoring the combined roles of low-level moisture transport and vertical motion in STHP development. As shown in <xref ref-type="fig" rid="fig6">Figure 6d</xref>, 700&#x202F;hPa specific humidity exhibits a transition in IG values, with a negative contribution emerging when specific humidity exceeds 9. This pattern suggests the model recognizes that excessively high low-level moisture under certain thermodynamic conditions may suppress convective intensity, reflecting a nuanced understanding of moisture-thermal coupling in convection initiation. Vertical level parameters display physically consistent threshold behaviors. Both the LCL Height and the height difference between LCL and CCL show reversed IG polarities below 500&#x202F;m (<xref ref-type="fig" rid="fig6">Figures 6f</xref>, <xref ref-type="fig" rid="fig6">6o</xref>). Optimal STHP identification occurs when LCL_H approaches 1,000&#x202F;m with minimal LCL-CCL difference (&#x003C;500&#x202F;m), indicating the model effectively identifies atmospheric configurations favoring deep convection development through condensation level constraints. CAPE_index shows a clear positive correlation with IG values (<xref ref-type="fig" rid="fig6">Figure 6i</xref>), confirming the expected role of CAPE in enhancing heavy precipitation probability. Meanwhile, wind field, including maximum wind speed above 500&#x202F;hPa, wind speed difference between 6&#x202F;km altitude and the ground, wind speed difference between 2&#x202F;km altitude and the ground, exhibit vertically structured contributions, revealing how the model leverages synergistic interactions between low-level shear and upper-level jet configurations to identify environments supporting sustained updrafts and prolonged convective duration.</p>
<p>The IG-derived attribution results demonstrate that the MSDNN effectively captures not only key parameters from traditional severe convection criteria&#x2014;such as CAPE, vertical velocity, and low-level humidity&#x2014;but also identifies complex nonlinear couplings among multi-scale atmospheric features. The model exhibits heightened sensitivity to fundamental convective processes, including thermal instability development, moisture transport mechanisms, and dynamic lifting forcing. These findings collectively validate the MSDNN&#x2019;s capability in fusing multi-source environmental information and extracting physically meaningful, discriminative patterns for STHP identification.</p>
</sec>
</sec>
</sec>
<sec sec-type="discussion" id="sec17">
<label>5</label>
<title>Discussion</title>
<sec id="sec18">
<label>5.1</label>
<title>Advantages of MSDNN model in short-term heavy precipitation weather identification</title>
<p>Accurate identification of STHP requires models capable of discerning complex correlations among interconnected physical variables. This study proposes a MSDNN that demonstrates substantially superior performance compared to traditional machine learning models and conventional DNN. The MSDNN&#x2019;s enhanced identification capability stems from its innovative architecture featuring five dedicated input branches for processing distinct meteorological variable categories. This design enables comprehensive feature extraction while preserving the unique physical properties of each variable type, with subsequent feature fusion creating highly discriminative representations. The &#x201C;divide-and-conquer&#x201D; approach effectively captures complex interdependencies and nonlinear interactions among diverse meteorological factors, significantly improving STHP identification.</p>
<p>Compared to traditional ensemble learning methods such as LGB and RF, the MSDNN demonstrates distinct advantages in handling STHP&#x2019;s complex patterns. While ensemble methods can provide stable identification performance in certain scenarios, they often struggle to achieve sufficient accuracy when confronted with multi-source data and strong nonlinear relationships (<xref ref-type="bibr" rid="ref46">Zhang et al., 2025</xref>). Existing research has established that DL architectures excel through hierarchical nonlinear transformations that automatically extract multi-level feature representations, providing inherent advantages in capturing complex meteorological processes (<xref ref-type="bibr" rid="ref25">Meenal et al., 2021</xref>; <xref ref-type="bibr" rid="ref1">Apayd&#x0131;n et al., 2022</xref>). In this study, although the benchmark DNN slightly underperformed relative to the MSDNN, it still surpassed both LGB and RF in identification capability, maintaining superior accuracy even under constrained computational resources. The MSDNN&#x2019;s effectiveness is further supported by evidence from agricultural remote sensing, where similar multi-stream architectures have demonstrated robust multi-source data processing capabilities. For instance, <xref ref-type="bibr" rid="ref17">Khan et al. (2025)</xref> achieved an <italic>R</italic><sup>2</sup> of 0.86 for corn yield prediction using a two-stream DNN, significantly outperforming traditional methods and single-stream DNNs. Similarly, <xref ref-type="bibr" rid="ref20">Li et al. (2025)</xref> developed a multi-source deep feature network for wheat chlorophyll estimation, attaining an <italic>R</italic><sup>2</sup> of 0.85 with a 6.4% improvement over conventional DNN. These findings collectively confirm that multi-stream architectures can effectively capture inherent characteristics and interactive relationships among variables with distinct physical meanings, strongly validating our study conclusions.</p>
</sec>
<sec id="sec19">
<label>5.2</label>
<title>Deciphering the driving mechanisms of physical variables in short-term heavy precipitation</title>
<p>This study applies the IG method to perform attribution analysis on the MSDNN model. The primary contribution lies not only in validating the discriminative logic of the model, but more importantly, in revealing complex nonlinear interactions and triggering mechanisms among environmental physical variables during STHP evolution. By combining model-derived feature attributions with classical convection theories, we elucidate the physical processes governing STHP occurrence.</p>
<p>The 700&#x202F;hPa relative humidity (RH_700) emerges as the dominant moisture discriminator, displaying a marked nonlinear threshold effect. IG analysis indicates that intermediate RH_700 values (40&#x2013;60%) strongly suppress STHP identification. In the Yangtze&#x2013;Huaihe region, low mid-level humidity typically signals dry intrusion with northerly upper-level winds. When coupled with warm, moist low-level flows, this generates strong vertical wind shear that organizes convection but accelerates cell propagation, shortens precipitation duration, and restricts accumulation for extreme events. Dry intrusion further promotes evaporative cooling and entrainment, inhibiting upscale convective growth. Conversely, RH_700 exceeding 80% sharply increases positive attribution: a deep moist layer supplies abundant vapor, reduces mid-level dissipation, preserves warm-core structures, and supports transition to efficient heavy precipitation. These results align with <xref ref-type="bibr" rid="ref16">Kang and Ebtehaj (2025)</xref>, who found moisture variables dominant in convective discrimination, and <xref ref-type="bibr" rid="ref45">Yousefnia et al. (2025)</xref>, who emphasized low-level RH for thunderstorm initiation. The specific humidity threshold of 9&#x202F;g/kg similarly marks a high-contribution regime, reflecting Clausius&#x2013;Clapeyron constraints requiring warm temperatures to sustain such moisture. The model&#x2019;s capture of this &#x201C;high temperature&#x2013;high humidity&#x201D; coupling matches observational thresholds (RH_700 of 76%; specific humidity of 8.36&#x202F;g/kg) from <xref ref-type="bibr" rid="ref31">Shen et al. (2016)</xref>.</p>
<p>WVV contribute 45% of total attribution, highlighting the pivotal role of large-scale synoptic forcing in regional STHP. 500&#x202F;hPa vertical speed is the key factor, with negative values yielding strong positive contributions. This reflects mesoscale control by favorable large-scale circulation. Quasi-geostrophic theory positions the 500&#x202F;hPa level near nondivergence, where ascent is weak under balance; only deep troughs and positive vorticity advection induce organized uplift. These findings corroborate <xref ref-type="bibr" rid="ref30">Retsch et al. (2022)</xref> on vertical velocity in deep convection and <xref ref-type="bibr" rid="ref9">Fan et al. (2024)</xref> SHAP-based sensitivities. Notably, the model integrates southwesterly winds across levels (950&#x2013;200&#x202F;hPa), capturing low-level jet convergence and upper-level divergence as a &#x201C;dynamic pump&#x201D; that compensates for modest CAPE and enables extreme precipitation under weakly unstable conditions. This contrasts with thermodynamically focused studies (e.g., <xref ref-type="bibr" rid="ref48">Zhang et al., 2019</xref>) and demonstrates MSDNN&#x2019;s capacity to autonomously extract three-dimensional dynamical structures.</p>
<p>Attributions related to thermodynamic conditions and vertical structure reveal a delicate balance between energy release and precipitation efficiency. CAPE contributions peak near 3,000&#x202F;J/kg before declining, suggesting microphysical limits: excessive CAPE may drive intense updrafts favoring ice-phase loading and reducing warm-rain efficiency. A high 700&#x202F;hPa pseudo-equivalent potential temperature (<inline-formula>
<mml:math id="M36">
<mml:msub>
<mml:mi mathvariant="normal">&#x03B8;</mml:mi>
<mml:mi mathvariant="italic">se</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> &#x2248; 340&#x202F;K) inhibits by flattening the vertical <inline-formula>
<mml:math id="M37">
<mml:msub>
<mml:mi mathvariant="normal">&#x03B8;</mml:mi>
<mml:mi mathvariant="italic">se</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> gradient and suppressing low-level instability, consistent with eastern China observations (<xref ref-type="bibr" rid="ref27">Qiu and He, 2013</xref>). Small vertical separation (&#x003C;500&#x202F;m) between the lifting condensation level (LCL) and convective condensation level (CCL) promotes STHP by enabling efficient warm-rain processes through high near-surface moisture and low trigger heights.</p>
<p>In summary, IG analysis not only confirms MSDNN&#x2019;s reliability in STHP identification but also quantitatively reconstructs a physically coherent convective scenario aligned with the &#x201C;ingredients-based&#x201D; framework (<xref ref-type="bibr" rid="ref7">Doswell et al., 1996</xref>). Deep moist layers with warm backgrounds mitigate entrainment (moisture constraint); large-scale troughs and dynamic pumping disrupt balance (dynamic constraint); and moderate energy with optimized stratification (thermodynamic constraint) collectively define the conditions for extreme precipitation.</p>
</sec>
<sec id="sec20">
<label>5.3</label>
<title>Strengths and limitations of this study</title>
<p>This study presents an innovative framework that integrates a MSDNN with IG interpretability analysis, establishing a novel methodology for STHP identification that effectively balances identification performance with physical interpretability. The principal strengths of this research are manifested in two key aspects. First, the MSDNN architecture is explicitly designed to align with established physical principles of severe convective weather. By categorizing 71 environmental physical variables into five specialized input streams&#x2014;moisture conditions, dynamic parameters, thermal instability, comprehensive indices, and vertical level features&#x2014;the model facilitates hierarchical extraction of features from heterogeneous meteorological elements. This design enables dedicated sub-networks to capture intrinsic patterns within specific physical processes, while a subsequent integration layer models cross-process nonlinear interactions. Validation result confirms that the MSDNN surpasses both conventional ensemble learning methods (LGB, RF) and single-stream DNN, demonstrating that this physics-informed partitioning strategy more effectively utilizes multi-source meteorological information and enhances discrimination capability for complex convective systems. Second, the successful application of the integrated gradients method provides an effective solution to the &#x201C;black-box&#x201D; problem of DL-based meteorological models. Beyond quantifying the marginal contributions of individual physical variables to model outputs, IG analysis reveals nonlinear threshold effects of key factors. These findings offer data-driven new perspectives for understanding the initiation mechanisms of STHP. Through feature attribution analysis, we establish a quantitative link between model identification and physical processes, enhancing the credibility of the model in operational applications.</p>
<p>However, several limitations warrant consideration. First, the station-based 1D feature representation, while enabling direct physical interpretation, does not encode spatial neighborhood dependencies critical for capturing mesoscale convective organization and frontal structures&#x2014;capabilities inherent to 2D convolutional architectures like U-Net. Second, the ERA5 reanalysis data employed in this study, while comprehensive, lacks the spatial resolution necessary to fully resolve fine-scale structures of mesoscale and microscale convective systems. This scale discrepancy consequently leads to elevated false alarm rates in identifying isolated severe convection events, particularly those initiated by subgrid-scale processes such as boundary layer convergence lines and localized frontal zones. Furthermore, the current feature representation system inadequately captures topographic forcing effects, despite the demonstrated significance of Anhui Province&#x2019;s complex terrain&#x2014;including the Dabie Mountains and southern mountainous regions&#x2014;in modulating precipitation distribution through mechanical lifting and moisture channeling mechanisms. The existing environmental physical variables prove insufficient in characterizing these topographically driven dynamic processes. Finally, the current framework utilizes reanalysis-based diagnostics to identify STHP precursors, which provides a retrospective understanding of critical atmospheric conditions but does not directly evaluate predictive skill at operational forecast lead times. Future research will address these limitations through three primary directions: (1) We will develop grid-based multi-branch architectures that combine spatial modeling techniques&#x2014;such as U-Net for local feature extraction and Transformer for long-range dependency capture&#x2014;with existing physics-based variable streams, thereby integrating spatial neighborhood correlations into the identification framework. (2) We will prioritize the integration and evaluation of high-resolution regional reanalysis products to better resolve convective-scale atmospheric structures. Concurrently, we plan to incorporate a dedicated topographic input branch within the MSDNN framework, integrating parameters such as elevation, slope gradient, aspect, and underlying surface characteristics. (3) To facilitate operational deployment, a transfer learning strategy (<xref ref-type="bibr" rid="ref12">Ham et al., 2019</xref>) will be employed. The MSDNN model pre-trained on ERA5 reanalysis data will serve as the initialization, with fine-tuning conducted using bias-corrected operational NWP fields. These enhancements are expected to strengthen the coupling between MSDNN and numerical weather prediction systems, advancing severe convective weather forecasting toward greater precision and enhanced physical interpretability.</p>
</sec>
</sec>
<sec sec-type="conclusions" id="sec21">
<label>6</label>
<title>Conclusion</title>
<p>Addressing the dual challenges of integrating heterogeneous environmental variables and ensuring model interpretability in short-term heavy precipitation (STHP) identification, this study developed a novel identification framework by combining a multi-stream deep neural network (MSDNN) with integrated gradients (IG) interpretability analysis. The results show that the MSDNN achieves effective integration of meteorological elements through its split-merge architecture, which processes 71 environmental physical variables partitioned into five specialized input streams according to their physical attributes. After dedicated feature extraction within substreams and subsequent feature fusion, the model attained a threat score (TS) of 0.851 and a Matthews correlation coefficient (MCC) of 0.844 on the test set, significantly outperforming both conventional ensemble learning methods and single-stream deep neural networks. The IG attribution analysis revealed distinct contribution patterns among environmental physical variables, with dynamic variables accounting for 45% of the top 20 influential features&#x2014;substantially exceeding the contributions of thermal variables (25%) and moisture-related variables (10%). Furthermore, the study quantitatively identified several critical nonlinear characteristics, including a sign reversal in the contribution of 700&#x202F;hPa relative humidity near 80% and high sensitivity of 500&#x202F;hPa vertical velocity to upward motion. These findings provide data-driven physical evidence for improving our understanding of convective triggering mechanisms. By integrating the powerful feature extraction capability of deep learning with physically grounded interpretability analysis, the proposed MSDNN-IG framework not only achieves accurate identification of STHP events but also offers quantitative insights into the underlying decision-making process.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec22">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="sec23">
<title>Author contributions</title>
<p>JL: Conceptualization, Formal analysis, Methodology, Software, Writing &#x2013; original draft. JA: Conceptualization, Funding acquisition, Supervision, Writing &#x2013; review &#x0026; editing. CY: Formal analysis, Investigation, Writing &#x2013; review &#x0026; editing. ZW: Software, Validation, Writing &#x2013; review &#x0026; editing. HL: Data curation, Resources, Writing &#x2013; review &#x0026; editing. XZ: Data curation, Visualization, Writing &#x2013; review &#x0026; editing. GL: Funding acquisition, Methodology, Resources, Writing &#x2013; review &#x0026; editing. RW: Software, Validation, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="COI-statement" id="sec24">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec25">
<title>Generative AI statement</title>
<p>The author(s) declared that Generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec26">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec27">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fclim.2026.1776202/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fclim.2026.1776202/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.pdf" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Apayd&#x0131;n</surname><given-names>M.</given-names></name> <name><surname>Yumu&#x015F;</surname><given-names>M.</given-names></name> <name><surname>De&#x011F;irmenci</surname><given-names>A.</given-names></name> <name><surname>Karal</surname><given-names>&#x00D6;.</given-names></name></person-group> (<year>2022</year>). <article-title>Evaluation of air temperature with machine learning regression methods using Seoul City meteorological data</article-title>. <source>Pamukkale Univ. J. Eng. Sci.</source> <volume>28</volume>, <fpage>737</fpage>&#x2013;<lpage>747</lpage>. doi: <pub-id pub-id-type="doi">10.5505/pajes.2022.66915</pub-id></mixed-citation></ref>
<ref id="ref2"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Baldi</surname><given-names>P.</given-names></name> <name><surname>Sadowski</surname><given-names>P. J.</given-names></name></person-group> (<year>2013</year>). <article-title>Understanding dropout</article-title>. Available online at: <ext-link xlink:href="https://papers.nips.cc/paper_files/paper/2013/file/71f6278d140af599e06ad9bf1ba03cb0-Paper.pdf" ext-link-type="uri">https://papers.nips.cc/paper_files/paper/2013/file/71f6278d140af599e06ad9bf1ba03cb0-Paper.pdf</ext-link> (Accessed February 2, 2026).</mixed-citation></ref>
<ref id="ref3"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bauer</surname><given-names>P.</given-names></name> <name><surname>Thorpe</surname><given-names>A.</given-names></name> <name><surname>Brunet</surname><given-names>G.</given-names></name></person-group> (<year>2015</year>). <article-title>The quiet revolution of numerical weather prediction</article-title>. <source>Nature</source> <volume>525</volume>, <fpage>47</fpage>&#x2013;<lpage>55</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nature14956</pub-id>, <pub-id pub-id-type="pmid">26333465</pub-id></mixed-citation></ref>
<ref id="ref4"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bhowmik</surname><given-names>S. K. R.</given-names></name> <name><surname>Roy</surname><given-names>S. S.</given-names></name> <name><surname>Kundu</surname><given-names>P. K.</given-names></name></person-group> (<year>2008</year>). <article-title>Analysis of large-scale conditions associated with convection over the Indian monsoon region</article-title>. <source>Int. J. Climatol.</source> <volume>28</volume>, <fpage>797</fpage>&#x2013;<lpage>821</lpage>. doi: <pub-id pub-id-type="doi">10.1002/joc.1567</pub-id></mixed-citation></ref>
<ref id="ref5"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chiappa</surname><given-names>J.</given-names></name> <name><surname>Parsons</surname><given-names>D. B.</given-names></name> <name><surname>Furtado</surname><given-names>J. C.</given-names></name> <name><surname>Shapiro</surname><given-names>A.</given-names></name></person-group> (<year>2024</year>). <article-title>Short-duration extreme rainfall events in the central and eastern United States during the summer: 2003&#x2013;2023 trends and variability</article-title>. <source>Geophys. Res. Lett.</source> <volume>51</volume>:<fpage>e2024GL110424</fpage>. doi: <pub-id pub-id-type="doi">10.1029/2024GL110424</pub-id></mixed-citation></ref>
<ref id="ref6"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chicco</surname><given-names>D.</given-names></name> <name><surname>Jurman</surname><given-names>G.</given-names></name></person-group> (<year>2023</year>). <article-title>The Matthews correlation coefficient (MCC) should replace the ROC AUC as the standard metric for assessing binary classification</article-title>. <source>BioData Min.</source> <volume>16</volume>:<fpage>4</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13040-023-00322-4</pub-id>, <pub-id pub-id-type="pmid">36800973</pub-id></mixed-citation></ref>
<ref id="ref7"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Doswell</surname><given-names>C. A.</given-names></name> <name><surname>Brooks</surname><given-names>H. E.</given-names></name> <name><surname>Maddox</surname><given-names>R. A.</given-names></name></person-group> (<year>1996</year>). <article-title>Flash flood forecasting: an ingredients-based methodology</article-title>. <source>Weather Forecast.</source> <volume>11</volume>, <fpage>560</fpage>&#x2013;<lpage>581</lpage>. doi: <pub-id pub-id-type="doi">10.1175/1520-0434(1996)011&#x003C;0560:FFFAIB&#x003E;2.0.CO;2</pub-id></mixed-citation></ref>
<ref id="ref8"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Du</surname><given-names>M.</given-names></name> <name><surname>Liu</surname><given-names>N.</given-names></name> <name><surname>Hu</surname><given-names>X.</given-names></name></person-group> (<year>2019</year>). <article-title>Techniques for interpretable machine learning</article-title>. <source>Commun. ACM</source> <volume>63</volume>, <fpage>68</fpage>&#x2013;<lpage>77</lpage>. doi: <pub-id pub-id-type="doi">10.1145/3359786</pub-id></mixed-citation></ref>
<ref id="ref9"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fan</surname><given-names>D.</given-names></name> <name><surname>Greybush</surname><given-names>S. J.</given-names></name> <name><surname>Clothiaux</surname><given-names>E. E.</given-names></name> <name><surname>Gagne</surname><given-names>D. J.</given-names></name></person-group> (<year>2024</year>). <article-title>Physically explainable deep learning for convective initiation nowcasting using GOES-16 satellite observations</article-title>. <source>Artif. Intell. Earth Syst.</source> <volume>3</volume>:<fpage>e230098</fpage>. doi: <pub-id pub-id-type="doi">10.1175/AIES-D-23-0098.1</pub-id></mixed-citation></ref>
<ref id="ref10"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Feldmann</surname><given-names>M.</given-names></name> <name><surname>Beucler</surname><given-names>T.</given-names></name> <name><surname>Gomez</surname><given-names>M.</given-names></name> <name><surname>Martius</surname><given-names>O.</given-names></name></person-group> (<year>2024</year>). <article-title>Lightning-fast convective outlooks: predicting severe convective environments with global AI-based weather models</article-title>. <source>Geophys. Res. Lett.</source> <volume>51</volume>:<fpage>e2024GL110960</fpage>. doi: <pub-id pub-id-type="doi">10.1029/2024GL110960</pub-id>, <pub-id pub-id-type="pmid">39582582</pub-id></mixed-citation></ref>
<ref id="ref11"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fowler</surname><given-names>H. J.</given-names></name> <name><surname>Lenderink</surname><given-names>G.</given-names></name> <name><surname>Prein</surname><given-names>A. F.</given-names></name> <name><surname>Westra</surname><given-names>S.</given-names></name> <name><surname>Allan</surname><given-names>R. P.</given-names></name> <name><surname>Ban</surname><given-names>N.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Anthropogenic intensification of short-duration rainfall extremes</article-title>. <source>Nat. Rev. Earth. Env.</source> <volume>2</volume>, <fpage>107</fpage>&#x2013;<lpage>122</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s43017-020-00128-6</pub-id></mixed-citation></ref>
<ref id="ref12"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ham</surname><given-names>Y. G.</given-names></name> <name><surname>Kim</surname><given-names>J. H.</given-names></name> <name><surname>Luo</surname><given-names>J. J.</given-names></name></person-group> (<year>2019</year>). <article-title>Deep learning for multi-year ENSO forecasts</article-title>. <source>Nature</source> <volume>573</volume>, <fpage>568</fpage>&#x2013;<lpage>572</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41586-019-1559-7</pub-id>, <pub-id pub-id-type="pmid">31534218</pub-id></mixed-citation></ref>
<ref id="ref13"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hao</surname><given-names>Y.</given-names></name> <name><surname>Yao</surname><given-names>Y.</given-names></name> <name><surname>Zheng</surname><given-names>Y.</given-names></name> <name><surname>Lu</surname><given-names>J.</given-names></name></person-group> (<year>2012</year>). <article-title>Multi scale analysis and nowcasting of short time heavy rainfall</article-title>. <source>Meteorol.</source> <volume>38</volume>, <fpage>903</fpage>&#x2013;<lpage>912</lpage>. doi: <pub-id pub-id-type="doi">10.7519/j.issn.1000-0526.2012.08.002</pub-id></mixed-citation></ref>
<ref id="ref14"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hess</surname><given-names>P.</given-names></name> <name><surname>Boers</surname><given-names>N.</given-names></name></person-group> (<year>2022</year>). <article-title>Deep learning for improving numerical weather prediction of heavy rainfall</article-title>. <source>J. Adv. Model. Earth Syst.</source> <volume>14</volume>:<fpage>e2021MS002765</fpage>. doi: <pub-id pub-id-type="doi">10.1029/2021MS002765</pub-id></mixed-citation></ref>
<ref id="ref15"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Ioffe</surname><given-names>S.</given-names></name> <name><surname>Szegedy</surname><given-names>C.</given-names></name></person-group> (<year>2015</year>). <source>Batch normalization: Accelerating deep network training by reducing internal covariate shift</source>. <italic>arXiv</italic>. Available online at: <ext-link xlink:href="https://doi.org/10.48550/arXiv.1502.03167" ext-link-type="uri">https://doi.org/10.48550/arXiv.1502.03167</ext-link></mixed-citation></ref>
<ref id="ref16"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kang</surname><given-names>H.</given-names></name> <name><surname>Ebtehaj</surname><given-names>A.</given-names></name></person-group> (<year>2025</year>). <article-title>Machine learning for explanation of subgrid convective precipitation: a case study over CONUS using a convection-allowing model and SHAP analysis</article-title>. <source>Artif. Intell. Earth Syst.</source> <volume>4</volume>:<fpage>e240062</fpage>. doi: <pub-id pub-id-type="doi">10.1175/AIES-D-24-0062.1</pub-id></mixed-citation></ref>
<ref id="ref17"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Khan</surname><given-names>S. N.</given-names></name> <name><surname>Iqbal</surname><given-names>J.</given-names></name> <name><surname>Khan</surname><given-names>M. R.</given-names></name> <name><surname>Malik</surname><given-names>N. A.</given-names></name> <name><surname>Khan</surname><given-names>F. A.</given-names></name> <name><surname>Khan</surname><given-names>K.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Using remotely sensed vegetation indices and multi-stream deep learning improves county-level corn yield predictions</article-title>. <source>Eur. J. Agron.</source> <volume>164</volume>:<fpage>127496</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.eja.2024.127496</pub-id></mixed-citation></ref>
<ref id="ref18"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname><given-names>J.</given-names></name> <name><surname>Shu</surname><given-names>E.</given-names></name> <name><surname>Lai</surname><given-names>K.</given-names></name> <name><surname>Amodeo</surname><given-names>M.</given-names></name> <name><surname>Porter</surname><given-names>J.</given-names></name> <name><surname>Kearns</surname><given-names>E.</given-names></name></person-group> (<year>2022</year>). <article-title>Assessment of the standard precipitation frequency estimates in the United States</article-title>. <source>J. Hydrol.-Reg. Stud.</source> <volume>44</volume>:<fpage>101276</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ejrh.2022.101276</pub-id></mixed-citation></ref>
<ref id="ref19"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Kingma</surname><given-names>D. P.</given-names></name> <name><surname>Ba</surname><given-names>J.</given-names></name></person-group> <article-title>Adam: a method for stochastic optimization</article-title>. <italic>arXiv</italic> (<year>2014</year>). Available online at: <ext-link xlink:href="https://doi.org/10.48550/arXiv.1412.6980" ext-link-type="uri">https://doi.org/10.48550/arXiv.1412.6980</ext-link></mixed-citation></ref>
<ref id="ref20"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>J.</given-names></name> <name><surname>Sheng</surname><given-names>Y.</given-names></name> <name><surname>Wang</surname><given-names>W.</given-names></name> <name><surname>Liu</surname><given-names>J.</given-names></name> <name><surname>Li</surname><given-names>X.</given-names></name></person-group> (<year>2025</year>). <article-title>Estimating wheat chlorophyll content using a multi-source deep feature neural network</article-title>. <source>Agriculture</source> <volume>15</volume>:<fpage>1624</fpage>. doi: <pub-id pub-id-type="doi">10.3390/agriculture15151624</pub-id></mixed-citation></ref>
<ref id="ref21"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>W.</given-names></name> <name><surname>Li</surname><given-names>M.</given-names></name> <name><surname>Ma</surname><given-names>H.</given-names></name> <name><surname>Huang</surname><given-names>X.</given-names></name> <name><surname>Zhang</surname><given-names>Z.</given-names></name></person-group> (<year>2024a</year>). <article-title>Severe convection prediction method based on xgboost classified algorithm and numerical model ingredients</article-title>. <source>Meteorol.</source> <volume>50</volume>, <fpage>1343</fpage>&#x2013;<lpage>1358</lpage>. doi: <pub-id pub-id-type="doi">10.7519/j.issn.1000-0526.2024.081902</pub-id></mixed-citation></ref>
<ref id="ref22"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>Z.</given-names></name> <name><surname>Mu</surname><given-names>Z.</given-names></name> <name><surname>Gao</surname><given-names>R.</given-names></name></person-group> (<year>2024b</year>). <article-title>Applicability of ERA5 reanalysis precipitation data in runoff modeling in China&#x2019;s Ili River basin</article-title>. <source>J. Hydrol. Eng.</source> <volume>29</volume>:<fpage>04024036</fpage>. doi: <pub-id pub-id-type="doi">10.1061/JHYEFF.HEENG-6161</pub-id></mixed-citation></ref>
<ref id="ref23"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Llasat</surname><given-names>M. C.</given-names></name> <name><surname>Del Moral</surname><given-names>A.</given-names></name> <name><surname>Cort&#x00E8;s</surname><given-names>M.</given-names></name> <name><surname>Rigo</surname><given-names>T.</given-names></name></person-group> (<year>2021</year>). <article-title>Convective precipitation trends in the Spanish Mediterranean region</article-title>. <source>Atmos. Res.</source> <volume>257</volume>:<fpage>105581</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.atmosres.2021.105581</pub-id></mixed-citation></ref>
<ref id="ref25"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Meenal</surname><given-names>R.</given-names></name> <name><surname>Michael</surname><given-names>P. A.</given-names></name> <name><surname>Pamela</surname><given-names>D.</given-names></name> <name><surname>Rajasekaran</surname><given-names>E.</given-names></name></person-group> (<year>2021</year>). <article-title>Weather prediction using random forest machine learning model</article-title>. <source>Indones. J. Electr. Eng. Comput. Sci.</source> <volume>22</volume>, <fpage>1208</fpage>&#x2013;<lpage>1215</lpage>. doi: <pub-id pub-id-type="doi">10.11591/ijeecs.v22.i2.pp1208-1215</pub-id></mixed-citation></ref>
<ref id="ref26"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nie</surname><given-names>Y.</given-names></name> <name><surname>Sun</surname><given-names>J.</given-names></name> <name><surname>Ma</surname><given-names>J.</given-names></name></person-group> (<year>2023</year>). <article-title>Seasonal prediction of summer extreme precipitation frequencies over Southwest China based on machine learning</article-title>. <source>Atmos. Res.</source> <volume>294</volume>:<fpage>106947</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.atmosres.2023.106947</pub-id></mixed-citation></ref>
<ref id="ref27"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Qiu</surname><given-names>J.</given-names></name> <name><surname>He</surname><given-names>L.</given-names></name></person-group> (<year>2013</year>). <article-title>Comparative analysis on weather characteristics and convective parameters of torrential rain and hail in Yangtze River Delta</article-title>. <source>Meteorology</source> <volume>39</volume>, <fpage>577</fpage>&#x2013;<lpage>584</lpage>. doi: <pub-id pub-id-type="doi">10.7519/j.issn.1000-0526.2013.05.005</pub-id></mixed-citation></ref>
<ref id="ref28"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ravuri</surname><given-names>S.</given-names></name> <name><surname>Lenc</surname><given-names>K.</given-names></name> <name><surname>Willson</surname><given-names>M.</given-names></name> <name><surname>Kangin</surname><given-names>D.</given-names></name> <name><surname>Lam</surname><given-names>R.</given-names></name> <name><surname>Mirowski</surname><given-names>P.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Skilful precipitation nowcasting using deep generative models of radar</article-title>. <source>Nature</source> <volume>597</volume>, <fpage>672</fpage>&#x2013;<lpage>677</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41586-021-03854-z</pub-id>, <pub-id pub-id-type="pmid">34588668</pub-id></mixed-citation></ref>
<ref id="ref29"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Reichstein</surname><given-names>M.</given-names></name> <name><surname>Camps-Valls</surname><given-names>G.</given-names></name> <name><surname>Stevens</surname><given-names>B.</given-names></name> <name><surname>Jung</surname><given-names>M.</given-names></name> <name><surname>Denzler</surname><given-names>J.</given-names></name> <name><surname>Carvalhais</surname><given-names>N.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Deep learning and process understanding for data-driven earth system science</article-title>. <source>Nature</source> <volume>566</volume>, <fpage>195</fpage>&#x2013;<lpage>204</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41586-019-0912-1</pub-id>, <pub-id pub-id-type="pmid">30760912</pub-id></mixed-citation></ref>
<ref id="ref30"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Retsch</surname><given-names>M. H.</given-names></name> <name><surname>Jakob</surname><given-names>C.</given-names></name> <name><surname>Singh</surname><given-names>M. S.</given-names></name></person-group> (<year>2022</year>). <article-title>Identifying relations between deep convection and the large-scale atmosphere using explainable artificial intelligence</article-title>. <source>J. Geophys. Res.-Atmos.</source> <volume>127</volume>:<fpage>e2021JD035388</fpage>. doi: <pub-id pub-id-type="doi">10.1029/2021JD035388</pub-id></mixed-citation></ref>
<ref id="ref31"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shen</surname><given-names>C.</given-names></name> <name><surname>Sun</surname><given-names>Y.</given-names></name> <name><surname>Wei</surname><given-names>X.</given-names></name> <name><surname>Yin</surname><given-names>D.</given-names></name></person-group> (<year>2016</year>). <article-title>Research of flash heavy rain forecast model in Jiangsu based on physical parameters</article-title>. <source>Meteorology</source> <volume>42</volume>, <fpage>557</fpage>&#x2013;<lpage>566</lpage>. doi: <pub-id pub-id-type="doi">10.7519/j.issn.1000-0526.2016.05.005</pub-id></mixed-citation></ref>
<ref id="ref32"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Soci</surname><given-names>C.</given-names></name> <name><surname>Hersbach</surname><given-names>H.</given-names></name> <name><surname>Simmons</surname><given-names>A.</given-names></name> <name><surname>Poli</surname><given-names>P.</given-names></name> <name><surname>Bell</surname><given-names>B.</given-names></name> <name><surname>Berrisford</surname><given-names>B.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>The ERA5 global reanalysis from 1940 to 2022</article-title>. <source>Q. J. R. Meteorol. Soc.</source> <volume>150</volume>, <fpage>4014</fpage>&#x2013;<lpage>4048</lpage>. doi: <pub-id pub-id-type="doi">10.1002/qj.4803</pub-id></mixed-citation></ref>
<ref id="ref33"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stoica</surname><given-names>P.</given-names></name> <name><surname>Babu</surname><given-names>P.</given-names></name></person-group> (<year>2024</year>). <article-title>Pearson-Matthews correlation coefficients for binary and multinary classification signal process</article-title>. <source>Signal Process.</source> <volume>222</volume>:<fpage>109511</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.sigpro.2024.109511</pub-id></mixed-citation></ref>
<ref id="ref34"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname><given-names>J.</given-names></name> <name><surname>Xue</surname><given-names>M.</given-names></name> <name><surname>Wilson</surname><given-names>J. W.</given-names></name> <name><surname>Zawadzki</surname><given-names>I.</given-names></name> <name><surname>Ballard</surname><given-names>S. P.</given-names></name> <name><surname>Onvlee-Hooimeyer</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Use of NWP for nowcasting convective precipitation: recent progress and challenges</article-title>. <source>Bull. Am. Meteorol. Soc.</source> <volume>95</volume>, <fpage>409</fpage>&#x2013;<lpage>426</lpage>. doi: <pub-id pub-id-type="doi">10.1175/BAMS-D-11-00263.1</pub-id></mixed-citation></ref>
<ref id="ref35"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Sundararajan</surname><given-names>M.</given-names></name> <name><surname>Taly</surname><given-names>A.</given-names></name> <name><surname>Yan</surname><given-names>Q.</given-names></name></person-group> <article-title>Axiomatic attribution for deep networks</article-title>. <source>arXiv</source> (<year>2017</year>). Available online at: <ext-link xlink:href="https://doi.org/10.48550/arXiv.1703.01365" ext-link-type="uri">https://doi.org/10.48550/arXiv.1703.01365</ext-link></mixed-citation></ref>
<ref id="ref36"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tian</surname><given-names>F.</given-names></name> <name><surname>Zheng</surname><given-names>Y.</given-names></name> <name><surname>Zhang</surname><given-names>T.</given-names></name> <name><surname>Zhang</surname><given-names>X.</given-names></name> <name><surname>Mao</surname><given-names>D.</given-names></name> <name><surname>Sun</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Statistical characteristics of environmental parameters for warm season short-duration heavy rainfall over central and eastern China</article-title>. <source>J. Meteorol. Res.</source> <volume>29</volume>, <fpage>370</fpage>&#x2013;<lpage>384</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s13351-014-4119-y</pub-id></mixed-citation></ref>
<ref id="ref37"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tong</surname><given-names>J.</given-names></name> <name><surname>Wei</surname><given-names>L.</given-names></name> <name><surname>Ye</surname><given-names>J.</given-names></name> <name><surname>Zhou</surname><given-names>K.</given-names></name> <name><surname>Yuan</surname><given-names>S.</given-names></name></person-group> (<year>2017</year>). <article-title>Spatial-temporal distribution characteristics of short-time strong precipitation in the flood season under different terrains over Anhui province</article-title>. <source>J. Meteorol. Environ.</source> <volume>33</volume>, <fpage>42</fpage>&#x2013;<lpage>48</lpage>. doi: <pub-id pub-id-type="doi">10.3969/j.issn.1673-503X.2017.06.006</pub-id></mixed-citation></ref>
<ref id="ref38"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>T.</given-names></name> <name><surname>Zhou</surname><given-names>K.</given-names></name> <name><surname>Zheng</surname><given-names>Y.</given-names></name></person-group> (<year>2020</year>). <article-title>Statistic analysis of thunderstorm characteristics in central and eastern China</article-title>. <source>Meteorology</source> <volume>46</volume>, <fpage>189</fpage>&#x2013;<lpage>199</lpage>. doi: <pub-id pub-id-type="doi">10.7519/j.issn.1000-0526.2020.02.005</pub-id></mixed-citation></ref>
<ref id="ref39"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>X.</given-names></name> <name><surname>Cui</surname><given-names>C.</given-names></name> <name><surname>Liu</surname><given-names>K.</given-names></name> <name><surname>Wang</surname><given-names>X.</given-names></name></person-group> (<year>2024</year>). <article-title>Spatio-Temperal distribution and diurnal variation of extreme hourly precipitation in China during the main rainy season</article-title>. <source>Meteorology</source> <volume>50</volume>, <fpage>393</fpage>&#x2013;<lpage>406</lpage>. doi: <pub-id pub-id-type="doi">10.7519/j.issn.1000-0526.2023.123001</pub-id></mixed-citation></ref>
<ref id="ref40"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname><given-names>Z.</given-names></name> <name><surname>Luo</surname><given-names>Y.</given-names></name> <name><surname>Liu</surname><given-names>X.</given-names></name> <name><surname>Cheng</surname><given-names>D.</given-names></name></person-group> (<year>2022</year>). <article-title>Statistical characteristics of the hourly heavy rainfall events over Anhui Province during the 2011-2018 warm seasons and the associated synoptic circulation patterns</article-title>. <source>Meteorology</source> <volume>48</volume>, <fpage>963</fpage>&#x2013;<lpage>978</lpage>. doi: <pub-id pub-id-type="doi">10.7519/j.issn.1000-0526.2022.041001</pub-id></mixed-citation></ref>
<ref id="ref41"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname><given-names>T.</given-names></name> <name><surname>Pang</surname><given-names>H.</given-names></name> <name><surname>Zhan</surname><given-names>Z.</given-names></name> <name><surname>Guo</surname><given-names>H.</given-names></name> <name><surname>Wu</surname><given-names>S.</given-names></name> <name><surname>Zhang</surname><given-names>W.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Characteristics of water vapor isotopes and moisture sources for short-duration heavy rainfall events in Nanjing, eastern China</article-title>. <source>J. Hydrol.</source> <volume>622</volume>:<fpage>129731</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jhydrol.2023.129731</pub-id></mixed-citation></ref>
<ref id="ref42"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yan</surname><given-names>H.</given-names></name> <name><surname>Gao</surname><given-names>Y.</given-names></name> <name><surname>Wilby</surname><given-names>R.</given-names></name> <name><surname>Yu</surname><given-names>D.</given-names></name> <name><surname>Wright</surname><given-names>N.</given-names></name> <name><surname>Yin</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Urbanization further intensifies short-duration rainfall extremes in a warmer climate</article-title>. <source>Geophys. Res. Lett.</source> <volume>51</volume>:<fpage>e2024GL108565</fpage>. doi: <pub-id pub-id-type="doi">10.1029/2024GL108565</pub-id></mixed-citation></ref>
<ref id="ref43"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname><given-names>R.</given-names></name> <name><surname>Hu</surname><given-names>J.</given-names></name> <name><surname>Li</surname><given-names>Z.</given-names></name> <name><surname>Mu</surname><given-names>J.</given-names></name> <name><surname>Yu</surname><given-names>T.</given-names></name> <name><surname>Xia</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Interpretable machine learning for weather and climate prediction: a review</article-title>. <source>Atmos. Environ.</source> <volume>338</volume>:<fpage>120797</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.atmosenv.2024.120797</pub-id></mixed-citation></ref>
<ref id="ref44"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yano</surname><given-names>J.</given-names></name> <name><surname>Ziemia&#x0144;ski</surname><given-names>M. Z.</given-names></name> <name><surname>Cullen</surname><given-names>M.</given-names></name> <name><surname>Termonia</surname><given-names>P.</given-names></name> <name><surname>Onvlee</surname><given-names>J.</given-names></name> <name><surname>Bengtsson</surname><given-names>L.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Scientific challenges of convective-scale numerical weather prediction</article-title>. <source>B. Am. Meteorol. Soc.</source> <volume>99</volume>, <fpage>699</fpage>&#x2013;<lpage>710</lpage>. doi: <pub-id pub-id-type="doi">10.1175/BAMS-D-17-0125.1</pub-id></mixed-citation></ref>
<ref id="ref45"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yousefnia</surname><given-names>K. V.</given-names></name> <name><surname>Metzl</surname><given-names>C.</given-names></name> <name><surname>B&#x00F6;lle</surname><given-names>T.</given-names></name></person-group> (<year>2025</year>). <article-title>Inferring thunderstorm occurrence from vertical profiles of convection-permitting simulations: physical insights from a physical deep learning model</article-title>. <source>Artif. Intell. Earth Syst.</source> <volume>4</volume>:<fpage>240096</fpage>. doi: <pub-id pub-id-type="doi">10.1175/AIES-D-24-0096.1</pub-id></mixed-citation></ref>
<ref id="ref46"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>H.</given-names></name> <name><surname>Liu</surname><given-names>Y.</given-names></name> <name><surname>Zhang</surname><given-names>C.</given-names></name> <name><surname>Li</surname><given-names>N.</given-names></name></person-group> (<year>2025</year>). <article-title>Machine learning methods for weather forecasting: a survey</article-title>. <source>Atmosphere</source> <volume>16</volume>:<fpage>82</fpage>. doi: <pub-id pub-id-type="doi">10.3390/atmos16010082</pub-id></mixed-citation></ref>
<ref id="ref47"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>J.</given-names></name> <name><surname>Yin</surname><given-names>M.</given-names></name> <name><surname>Wang</surname><given-names>P.</given-names></name> <name><surname>Gao</surname><given-names>Z.</given-names></name></person-group> (<year>2024</year>). <article-title>A method based on deep learning for severe convective weather forecast: CNN-BiLSTM-AM (version 1.0)</article-title>. <source>Atmos.</source> <volume>15</volume>:<fpage>1229</fpage>. doi: <pub-id pub-id-type="doi">10.3390/atmos15101229</pub-id></mixed-citation></ref>
<ref id="ref48"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>W.</given-names></name> <name><surname>Han</surname><given-names>L.</given-names></name> <name><surname>Sun</surname><given-names>J.</given-names></name> <name><surname>Guo</surname><given-names>H.</given-names></name> <name><surname>Dai</surname><given-names>J.</given-names></name></person-group> (<year>2019</year>). <source>Application of multi-channel 3D-cube successive convolution network for convective storm nowcasting</source>. <italic>arXiv</italic>. Available online at: <ext-link xlink:href="https://doi.org/10.1109/BigData47090.2019.9005568" ext-link-type="uri">https://doi.org/10.1109/BigData47090.2019.9005568</ext-link></mixed-citation></ref>
<ref id="ref49"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>W.</given-names></name> <name><surname>Kang</surname><given-names>L.</given-names></name> <name><surname>Yang</surname><given-names>K.</given-names></name> <name><surname>Yin</surname><given-names>H.</given-names></name></person-group> (<year>2021</year>). <article-title>Comparative analysis on characteristics of physical quantity of flash-rain under different intensities in Sichuan Basin</article-title>. <source>Meteorol.</source> <volume>47</volume>, <fpage>439</fpage>&#x2013;<lpage>449</lpage>. doi: <pub-id pub-id-type="doi">10.7519/j.issn.1000-0526.2021.04.005</pub-id></mixed-citation></ref>
<ref id="ref50"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname><given-names>M.</given-names></name></person-group> (<year>2022</year>). <article-title>A study of AR-, TS-, and MCS-associated precipitation and extreme precipitation in present and warmer climates</article-title>. <source>J. Clim.</source> <volume>35</volume>, <fpage>479</fpage>&#x2013;<lpage>497</lpage>. doi: <pub-id pub-id-type="doi">10.1175/JCLI-D-21-0145.1</pub-id></mixed-citation></ref>
<ref id="ref51"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname><given-names>Q.</given-names></name> <name><surname>Zheng</surname><given-names>Y.</given-names></name> <name><surname>Jing</surname><given-names>Y.</given-names></name> <name><surname>Feng</surname><given-names>D.</given-names></name> <name><surname>Liu</surname><given-names>J.</given-names></name></person-group> (<year>2025</year>). <article-title>Research Progress on short-duration heavy precipitation in China</article-title>. <source>Adv. Earth Sci.</source> <volume>40</volume>, <fpage>21</fpage>&#x2013;<lpage>38</lpage>. doi: <pub-id pub-id-type="doi">10.11867/j.issn.1001-8166.2025.002</pub-id></mixed-citation></ref>
<ref id="ref52"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname><given-names>Y.</given-names></name> <name><surname>Zhou</surname><given-names>K.</given-names></name> <name><surname>Sheng</surname><given-names>J.</given-names></name> <name><surname>Lin</surname><given-names>Y.</given-names></name> <name><surname>Tian</surname><given-names>F.</given-names></name> <name><surname>Tang</surname><given-names>W.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Advances in techniques of monitoring, forecasting and warning of severe convective weather</article-title>. <source>J. Appl. Meteor. Sci.</source> <volume>26</volume>, <fpage>641</fpage>&#x2013;<lpage>657</lpage>. doi: <pub-id pub-id-type="doi">10.11898/1001-7313.20150601</pub-id></mixed-citation></ref>
<ref id="ref53"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname><given-names>K.</given-names></name> <name><surname>Zheng</surname><given-names>Y.</given-names></name> <name><surname>Li</surname><given-names>B.</given-names></name> <name><surname>Dong</surname><given-names>W.</given-names></name> <name><surname>Zhang</surname><given-names>X.</given-names></name></person-group> (<year>2019</year>). <article-title>Forecasting different types of convective weather: a deep learning approach</article-title>. <source>J. Meteorol. Res.</source> <volume>33</volume>, <fpage>797</fpage>&#x2013;<lpage>809</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s13351-019-8162-6</pub-id></mixed-citation></ref>
<ref id="ref54"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname><given-names>X.</given-names></name> <name><surname>Tian</surname><given-names>F.</given-names></name> <name><surname>Zheng</surname><given-names>Y.</given-names></name> <name><surname>Sun</surname><given-names>J.</given-names></name> <name><surname>Wang</surname><given-names>C.</given-names></name></person-group> (<year>2023</year>). <article-title>Contribution of short-duration heavy rainfall to rainstorm in China</article-title>. <source>Meteorology</source> <volume>49</volume>, <fpage>267</fpage>&#x2013;<lpage>278</lpage>. doi: <pub-id pub-id-type="doi">10.7519/j.issn.1000-0526.2022.071201</pub-id></mixed-citation></ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0003">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1071009/overview">Xi Cao</ext-link>, Chinese Academy of Sciences (CAS), China</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0004">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2133246/overview">Junhu Zhao</ext-link>, National Climate Center, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3344106/overview">Qun Tian</ext-link>, Guangzhou Institute of Tropical and Marine Meteorology (GITMM), China</p>
</fn>
</fn-group>
<fn-group>
<fn id="fn0001">
<label>1</label>
<p><ext-link xlink:href="https://www.ecmwf.int/" ext-link-type="uri">https://www.ecmwf.int/</ext-link></p>
</fn>
<fn id="fn0002">
<label>2</label>
<p><ext-link xlink:href="https://github.com/pytorch/captum" ext-link-type="uri">https://github.com/pytorch/captum</ext-link></p>
</fn>
</fn-group>
</back>
</article>