<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" dtd-version="1.3" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Water</journal-id>
<journal-title-group>
<journal-title>Frontiers in Water</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Water</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2624-9375</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/frwa.2026.1753598</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>A hybrid CNN-LSTM approach for multi-step discharge forecasting with satellite data</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Wongchaisuwat</surname> <given-names>Papis</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3381553"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Yomwilai</surname> <given-names>Konlawat</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3381689"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Thaisiam</surname> <given-names>Wandee</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3291972"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Department of Industrial Engineering, Kasetsart University</institution>, <city>Bangkok</city>, <country country="th">Thailand</country></aff>
<aff id="aff2"><label>2</label><institution>Department of Water Resources Engineering, Kasetsart University</institution>, <city>Bangkok</city>, <country country="th">Thailand</country></aff>
<author-notes>
<corresp id="c001"><label>&#x0002A;</label>Correspondence: Wandee Thaisiam, <email xlink:href="mailto:wandee.t@ku.th">wandee.t@ku.th</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-19">
<day>19</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>8</volume>
<elocation-id>1753598</elocation-id>
<history>
<date date-type="received">
<day>25</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>28</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>28</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2026 Wongchaisuwat, Yomwilai and Thaisiam.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Wongchaisuwat, Yomwilai and Thaisiam</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-19">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Accurate river discharge forecasting is critical for flood mitigation and effective water resource management, particularly in data-scarce regions. Capturing both spatial rainfall variability and temporal discharge dynamics remains a challenge.</p>
</sec>
<sec>
<title>Methods</title>
<p>An innovative hybrid forecasting model was developed to predict hourly river discharges up to 24 h in advance. The proposed model combined the spatial analysis capabilities of convolutional neural networks with the temporal sequence modeling strengths of long short-term memory networks. It was designed to extract spatio-temporal patterns from satellite precipitation data while incorporating historical discharge trends to improve forecasting accuracy. The model was developed and internally validated on a 3 day lag dataset before being tested on an external test set with a relatively shorter 30min lag to simulate real-time conditions.</p>
</sec>
<sec>
<title>Results</title>
<p>The hybrid CNN-LSTM model demonstrated strong predictive performance across multiple evaluation metrics, including the correlation coefficient, Nash-Sutcliffe efficiency, root mean square error, and mean absolute error. Notably, our proposed model maintained a performance level well within acceptable error limits, even using the 24 h prediction horizon. The results confirmed the model&#x00027;s ability to generalize across datasets with differing temporal resolutions.</p>
</sec>
<sec>
<title>Discussion</title>
<p>The proposed framework provides a scalable and robust solution for improving short-term discharge predictions, particularly in upstream and unmeasured catchments where ground observations are limited. This approach has strong potential to support real-time water resource management and flood preparedness in data-scarce regions.</p>
</sec></abstract>
<kwd-group>
<kwd>convolutional neural networks</kwd>
<kwd>flood forecasting</kwd>
<kwd>hourly discharge data</kwd>
<kwd>long short-term memory</kwd>
<kwd>precipitation satellite data</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This research was supported by the Kasetsart University Research and Development Institute (KURDI), Bangkok, Thailand under the &#x0201C;FF(KU)36.69&#x0201D; project (to WT).</funding-statement>
</funding-group>
<counts>
<fig-count count="14"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="27"/>
<page-count count="17"/>
<word-count count="8475"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Water and Artificial Intelligence</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<label>1</label>
<title>Introduction</title>
<p>The impacts of climate change have intensified extreme weather patterns globally, resulting in heavier rainfall, stronger cyclones, more intense heatwaves, and prolonged droughts. In 2023, Asia was the most disaster-affected region in the world due to extreme weather conditions. Cyclones and floods were the leading causes of fatalities and economic losses, with 79 meteorological disasters reported across the region. Over 80% of these events were attributed to floods and storms, resulting in more than 2,000 deaths and affecting over 9 million people (<xref ref-type="bibr" rid="B23">WMO, 2024</xref>). Early warning systems play a critical role in mitigating the devastating impacts of such hazards. These systems provide timely, relevant, interoperable, accessible, and accurate information to support preparedness and response efforts. Notably, disaster-related damage can be reduced by up to 30% if warnings are issued at least 24 h in advance (<xref ref-type="bibr" rid="B22">WMO, 2022</xref>) Flood forecasting is essential for early warning systems to develop appropriate measures to control flood risks, mitigate hazards, evacuate vulnerable populations from flood-prone areas, set insurance premiums, and optimize environmental and water resource management.</p>
<p>Over the past decade, deep learning (DL) techniques have emerged as a powerful tool for tackling complex hydrological challenges, particularly in flood forecasting. These techniques leverage their ability to handle sequential input data and capture the non-linear dependencies inherent in hydrological processes (<xref ref-type="bibr" rid="B8">Kumar et al., 2023</xref>; <xref ref-type="bibr" rid="B14">Shen et al., 2021</xref>; <xref ref-type="bibr" rid="B15">Sit et al., 2020</xref>). This development reflects a general trend toward the integration of data-driven methods into traditional hydrological domains. Recent advancements have introduced a range of DL architectures specifically tailored for flood forecasting. Recurrent neural networks (RNNs) and their derivatives, including gated recurrent units (GRUs) and long short-term memory networks (LSTMs), have shown promise in modeling temporal dependencies in flood-related data (<xref ref-type="bibr" rid="B21">Waqas and Humphries, 2024</xref>). In a notable study by <xref ref-type="bibr" rid="B6">Kratzert et al. (2018)</xref>, LSTMs have been used to simulate rainfall-runoff processes and showed superior performance compared to classical hydrological models in several catchments. Hydrological parameters have been incorporated into the learning process to improve the accuracy of DL models. These integrations enable a more comprehensive understanding of complex hydrological systems (<xref ref-type="bibr" rid="B1">Chang et al., 2023</xref>; <xref ref-type="bibr" rid="B13">Senent-Aparicio et al., 2019</xref>). <xref ref-type="bibr" rid="B19">Tongal and Booij (2018)</xref> proposed a framework for streamflow simulation and prediction, demonstrating improved predictive performance by decomposing streamflow into individual components. <xref ref-type="bibr" rid="B17">Thaisiam et al. (2022)</xref> introduced the concept of concentration time (TC) to enhance temporal correlations using backward lags. Integrating TC-related features with RNNs and their variants essentially demonstrated superior performance in multi-step hourly flood prediction. Several studies have investigated seasonal overflow of water, a phenomenon frequently observed during wet seasons and flood events (<xref ref-type="bibr" rid="B9">Lee et al., 2020</xref>; <xref ref-type="bibr" rid="B18">Thaisiam et al., 2024</xref>; <xref ref-type="bibr" rid="B26">Zanchetta et al., 2022</xref>). <xref ref-type="bibr" rid="B27">Zhang and Yan (2023)</xref> proposed LSTM-based network components to address long-term and short-term dependencies separately, while <xref ref-type="bibr" rid="B2">Chenmin et al. (2024)</xref> investigated feature selection techniques for a hybrid model using convolutional neural networks and bidirectional LSTMs with an attention mechanism for flood prediction. Overall, DL techniques have demonstrated exceptional efficiency in flood forecasting, particularly in study areas with long-term and continuous monitoring data.</p>
<p>Convolutional Neural Networks (CNNs) are valuable tools for analyzing satellite images because they are particularly adept at handling spatial data. For example, their ability to extract and analyze spatial features enables a deep understanding of patterns in satellite data, such as precipitation intensity and distribution. By learning localized and large-scale spatial dependencies, CNNs enable a more detailed representation of hydrometeorological processes compared to traditional approaches. The recent trend in flood forecasting research involves combining CNNs with other DL techniques to address varied challenges of predicting floods. These hybrid approaches aim to leverage the strengths of different methodologies, such as spatial data modeling via CNNs and temporal sequence prediction via recurrent models (<xref ref-type="bibr" rid="B24">Wu et al., 2020</xref>). For example, <xref ref-type="bibr" rid="B3">Feng et al. (2022)</xref> utilized hybrid models combining spatio-temporal graph convolutional networks and LSTMs to forecast flood levels, highlighting the potential of integrating spatial and temporal modeling. These approaches effectively bridged the gap between static and dynamic flood prediction factors.</p>
<p>In recent years, CNN&#x02013;LSTM architectures have been applied to rainfall&#x02013;runoff modeling by integrating meteorological forcing with hydrological observations from upstream catchments. For example, <xref ref-type="bibr" rid="B11">Li X. et al. (2022)</xref> introduced a CNN-LSTM based rainfall-runoff model that utilized observed precipitation represented as two-dimensional spatial inputs to predict downstream flow, while <xref ref-type="bibr" rid="B10">Li P. et al. (2022)</xref> incorporated radar maps together with upstream runoff observations. Later, a hybrid model based on CNN-LSTM and GRU with the improved sparrow search algorithm was proposed for runoff prediction using meteorological, hydrological, and runoff observations (<xref ref-type="bibr" rid="B25">Yao et al., 2023</xref>). <xref ref-type="bibr" rid="B20">Wang et al. (2023)</xref> proposed a CNN-LSTM model in which CNNs extracted physical and meteorological features from weather research and forecasting model outputs, and the resulting time-series features were used by LSTMs to simulate streamflow dynamics. Additionally, <xref ref-type="bibr" rid="B12">Malik et al. (2024)</xref> utilized a time-distributed CNN-LSTM model to improve the accuracy of flood predictions, particularly in forecasting flood occurrence times and peak intensities using station-based precipitation and streamflow data. <xref ref-type="bibr" rid="B5">Hu et al. (2024)</xref> used a CNN-LSTM model that integrated multiple grid-based meteorological data with gauged precipitation and runoff sequence inputs. Collectively, these studies demonstrate the effectiveness of CNN&#x02013;LSTM hybrid models for streamflow simulation and discharge prediction when rich observational data are available. However, despite their demonstrated performance, most existing CNN-LSTM based runoff forecasting studies rely on various ground-based observations from upstream areas, such as rain gauge data, upstream discharge stations, or hydrometeorological information, which limits their applicability in regions with sparse monitoring networks. In contrast, our proposed framework integrates satellite-based precipitation imagery with discharge observations from only the target prediction station, thereby reducing the dependence on upstream ground-based data. While satellite-based precipitation products provide extensive spatial coverage and consistent temporal resolution, their integration into deep learning&#x02013;based runoff forecasting frameworks remains relatively underexplored. Few studies have explicitly exploited the spatial structure of satellite-derived rainfall fields as primary model inputs, and uncertainties inherent in satellite observations are not fully addressed. Consequently, developing reliable streamflow prediction models for flood events in data-scarce catchments&#x02014;particularly with limited upstream ground-based information&#x02014; remains a challenge, and the practical potential of CNN&#x02013;LSTM architectures for discharge forecasting under such conditions has not been fully demonstrated.</p>
<p>In response, the main objective of this study was to develop a robust model for predicting hourly river discharge up to 24 h in advance using only satellite-based precipitation and target discharge records. The proposed model integrated the spatial analysis capabilities of CNNs with the temporal sequence modeling strengths of LSTMs. This hybrid architecture was designed to extract meaningful spatio-temporal patterns from satellite precipitation data while incorporating historical discharge trends to enhance forecast accuracy. The proposed model utilized spatial precipitation data from the Global Satellite Mapping of Precipitation (GSMaP), which are produced and distributed by the Earth Observation Research Center (EORC) of the Japan Aerospace Exploration Agency (JAXA), as comprehensively reviewed by <xref ref-type="bibr" rid="B7">Kubota et al. (2020)</xref>. The GSMaP dataset offers high-resolution, real-time precipitation measurements with broader spatial coverage than conventional ground-based sensors. The satellite data were complemented by historical discharge data from a downstream observation station, allowing the model to account for localized hydrological dynamics. The hybrid model demonstrated the ability to generalize across different datasets by combining CNNs for spatial feature extraction with LSTMs for temporal sequence analysis. Internal validation using GSMaP-MVK data assessed the reliability of the model within the training domain, while external tests with GSMaP-NOW data evaluated its performance under real-time conditions. The correlation coefficient (R), Nash-Sutcliffe efficiency (NSE), root mean square error (RMSE) and mean absolute error (MAE) were used to rigorously evaluate the predictive capabilities of the model.</p>
<p>Our main contribution highlighted the potential of hybrid deep learning approaches to enhance hydrological forecasting, particularly in data-scarce regions. We established a robust foundation for the development of advanced deep learning architectures by integrating satellite-based precipitation measurements with station-based discharge data. This integration not only enhanced the accuracy of the discharge predictions but also offered a scalable solution for improving water resource management, especially in catchments with limited upstream ground-based observations. Our proposed framework was rigorously evaluated across two distinct study areas to validate its robustness and generalizability. Furthermore, we implemented a training and validation strategy designed to account for differences in satellite precipitation latency between offline model development and near-real-time forecasting. The model was trained and internally validated on a dataset characterized by a relatively longer time lag, then, it was applied to a different dataset with a shorter time lag. This approach was specifically designed to optimize the model&#x00027;s readiness for real-time deployment, demonstrating its applicability in dynamic hydrological environments.</p>
</sec>
<sec sec-type="materials and methods" id="s2">
<label>2</label>
<title>Materials and methods</title>
<sec>
<label>2.1</label>
<title>Study area</title>
<p><xref ref-type="fig" rid="F1">Figure 1</xref> depicts the two study areas in Thailand: the Upper Yom River Basin and the Upper Chi River Basin. The Upper Yom River Basin is located in northern Thailand and is oriented in a north-south direction. The main river (Yom) originates from Doi Khun Yuam in the Phi Pan Nam mountain range, situated in the Pong and Chiang Muan districts of Phayao province, Thailand. The Yom river flows through a steep valley with a riverbed slope of approximately 1:120 and an elevation range of 180 to 360 m above mean sea level. Narrow plains are present along certain sections of the riverbank before the river flows into Phrae province, Thailand. Flooding in this basin occurs annually during the rainy season due to the absence of large water storage facilities and the steep terrain. These factors contribute to rapid runoff, which causes river overbank flows in downstream areas.</p>
<fig position="float" id="F1">
<label>Figure 1</label>
<caption><p>Study areas equipped with stream gauges for <bold>(a)</bold> The upper Yom River Basin, <bold>(b)</bold> The upper Chi River Basin.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0001.tif">
<alt-text content-type="machine-generated">Topographic map showing two river basins in Thailand with their district centers and stream gauges marked, province boundaries outlined, and elevation represented by color shading; inset map highlights their location within Thailand.</alt-text>
</graphic>
</fig>
<p>The topography of the Upper Chi River Basin consists of high mountain ranges. The Phu Phan Mountain Range lies to the east and north, while the Dong Phaya Yen Mountain Range, located to the west, serves as the source of the Chi River. The Chi River has a riverbed gradient of 1:630 in its upstream area. Additionally, the Chi River is fed by tributaries, including the Phrom River, Sapung River, Chiang Tha River, and Khan Chu River, respectively. The combination of the basin&#x00027;s topography and its hydrological system results in heavy rainfall in the upstream areas, causing simultaneous water flow from the main river and its tributaries toward Mueang district, Chaiyaphum province, Thailand. This often leads to flash floods in downstream areas. Key characteristics of study areas are summarized in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Characteristics of study areas.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Characteristics</bold></th>
<th valign="top" align="center"><bold>Upper Yom River basin</bold></th>
<th valign="top" align="center"><bold>Upper Chi River basin</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Observation station</td>
<td valign="top" align="center">Y.1C</td>
<td valign="top" align="center">E.21</td>
</tr>
<tr>
<td valign="top" align="left">Annual runoff (million cubic meters)</td>
<td valign="top" align="center">1,982</td>
<td valign="top" align="center">1,420</td>
</tr>
<tr>
<td valign="top" align="left">Data period</td>
<td valign="top" align="center">1998&#x02013;2024 (27 Years)</td>
<td valign="top" align="center">2005&#x02013;2024 (20 Years)</td>
</tr>
<tr>
<td valign="top" align="left">Watershed (square kilometers)</td>
<td valign="top" align="center">7,660</td>
<td valign="top" align="center">9,755</td>
</tr>
<tr>
<td valign="top" align="left">River length to station (kilometers)</td>
<td valign="top" align="center">180</td>
<td valign="top" align="center">273</td>
</tr>
<tr>
<td valign="top" align="left">Average river slope (kilometers/kilometers)</td>
<td valign="top" align="center">1:120</td>
<td valign="top" align="center">1:630</td>
</tr>
<tr>
<td valign="top" align="left">Time of concentration, Tc (hour)</td>
<td valign="top" align="center">50</td>
<td valign="top" align="center">48</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
<sec>
<label>2.2</label>
<title>Methodology</title>
<p>This study aimed to develop a robust model for predicting hourly discharge up to 24 h in advance, applicable to poorly gauged areas where traditional upstream observed data are unavailable. Satellite-based precipitation data served as the primary input for the model, complemented by historical station-based data of the target variable. A hybrid deep learning architecture was constructed to effectively capture the spatiotemporal relationships within the data, combining the strengths of CNNs and LSTMs. Preprocessed satellite data, along with historical discharge data, were used to train and fine-tune the model. A rigorous internal validation process, leveraging data from the same source, was conducted to evaluate the model&#x00027;s performance within the training domain. Subsequently, the model&#x00027;s generalizability was assessed by validating it on an external test set sourced from a different satellite source. A flow chart in <xref ref-type="fig" rid="F2">Figure 2</xref> illustrates the entire process, consisting of data acquisition, preprocessing, model training, and evaluation.</p>
<fig position="float" id="F2">
<label>Figure 2</label>
<caption><p>Process flowchart of <bold>(a)</bold> data pre-processing, <bold>(b)</bold> model development, <bold>(c)</bold> model evaluation, and <bold>(d)</bold> external testing.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0002.tif">
<alt-text content-type="machine-generated">Flowchart depicting a machine learning workflow for hydrological modeling, including data pre-processing of precipitation images and water levels, model development using CNN and LSTM layers, model fitting, evaluation with performance indices, external testing, and conclusion.</alt-text>
</graphic>
</fig>
<sec>
<label>2.2.1</label>
<title>Data pre-processing</title>
<p>Our primary objective was to develop a multi-step discharge prediction model for the downstream water level station. To achieve this, we initially preprocessed hourly water level data to compute more informative discharge values based on an annual rating curve. A traditional outlier detection method was applied to eliminate extreme anomalies from the dataset. Specifically, summary statistics including an interquartile range and time-series plots were examined to identify anomalous values. Extreme values that were consistent with known high-flow or intense rainfall events were retained, as such extremes represented meaningful hydrological behavior and were critical for evaluating model performance under flood conditions. The resulting discharge data at the downstream station served a dual role in the model, acting as both the prediction target and input features representing historical flow conditions. Due to the limited availability of upstream observed hydrological data, we incorporated satellite-based data to monitor hydrological patterns. Specifically, we utilized data from GSMaP, a network of geostationary weather satellites managed by JAXA. It provides real-time weather information, including precipitation, cloud cover, and atmospheric conditions, across the Asia-Pacific region. These data are generated from dual-frequency precipitation radar measurements collected by multiple satellites.in</p>
<p>For our model, we relied on hourly GSMaP precipitation data with a spatial resolution of 0.1 degrees (approximately 11.1 km), striking a balance between spatial coverage and fine-grained data granularity. The primary dataset used for model training was GSMaP-MVK, which incorporates a 3 day time lag. This dataset was selected for its reliability and the extensive availability of historical data, making it well-suited for developing a robust and accurate predictive model. To assess the model&#x00027;s real-time performance, we integrated GSMaP-NOW, a dataset offering precipitation data with a considerably reduced time lag of 30 min. This near-real-time data source enabled us to validate the model&#x00027;s capability in operational settings, facilitating its ability to deliver timely and actionable predictions for discharge scenarios.</p>
<p>After collecting and preprocessing the data, the GSMaP-MVK dataset was divided into three subsets for training, validation, and testing. The training set was used to fit the model, while the validation set facilitated fine-tuning of the model and mitigating the risk of overfitting. Then, the final model was evaluated on a holdout test set. The study focused on two key river basins: the Upper Yom River and the Upper Chi River. Validation utilized data from a 3 year period (2016&#x02013;2018), while the testing phase utilized data spanning 2019 to 2021. The training set covered 18 years of data (1998&#x02013;2015) for the Upper Yom River basin and 11 years (2005&#x02013;2015) for the Upper Chi River basin. The model&#x00027;s performance was further assessed based on recent data, using an external test set comprising GSMaP-MVK and GSMaP-NOW data from 2022 to 2024. An overview of the discharge data for both study areas, highlighting the temporal patterns and variability in water discharge observed during the study period, is provided in <xref ref-type="fig" rid="F3">Figure 3</xref>.</p>
<fig position="float" id="F3">
<label>Figure 3</label>
<caption><p>Data components for training, validation, testing and external testing for <bold>(a)</bold> Y.1C station in Upper Yom River Basin and <bold>(b)</bold> E.21 station in Upper Chi River Basin based on GSMaP-MVK and GSMaP-NOW data.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0003.tif">
<alt-text content-type="machine-generated">Two line graphs compare river discharge in cubic meters per second for stations Y.1C and E.21. Both graphs are split into shaded periods indicating training, validation, testing, and extended testing phases. Above the charts, a timeline marks the availability of GSMaP-MVK since 1998 and GSMaP-NOW since December 2021. The first graph (Y.1C) spans 18 years of training data, and the second graph (E.21) covers 11 years. Color-coded sections and labels highlight sequence and purpose of data periods.</alt-text>
</graphic>
</fig>
<p>To preprocess the satellite image data, we focused on extracting relevant grid data corresponding to the study areas, specifically targeting regions within the river basin boundaries. Regions outside these boundaries were excluded to ensure that the model processed only information pertinent to the river basins of interest. The zero-padding technique was applied to maintain a consistent input size of 16 by 16 pixels. Furthermore, instead of reshaping the entire image, which could distort spatial relationships within the data, zero-padding was used to fill empty grid cells with zero values. This approach preserved the integrity of spatial features while standardizing the image dimensions. According to <xref ref-type="bibr" rid="B4">Hashemi (2019)</xref>, the zero-padding technique had no negative impact on the model accuracy but essentially reduced the training time. The padding ensures uniform input dimensions without compromising the representation of hydrological features. A fixed input size of 16 by 16 pixels was applied across two study areas to ensure compatibility with the CNN architecture. <xref ref-type="fig" rid="F4">Figure 4</xref> illustrates an example of the satellite image processing workflow, highlighting both the boundary reshaping and the zero-padding technique applied to the Upper Chi River Basin. As shown in <xref ref-type="fig" rid="F4">Figure 4</xref>, white grid cells with actual rainfall values were retained to preserve the spatial structure of satellite precipitation fields. These zero values represent actual dry conditions reported by the satellite product rather than missing or zero-padding grids.</p>
<fig position="float" id="F4">
<label>Figure 4</label>
<caption><p>Imagery processing using boundary reshaping and zero padding for E.21 data.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0004.tif">
<alt-text content-type="machine-generated">Three-panel diagram illustrating rainfall data processing over a geographical area labeled E.21. The left panel shows raw rainfall intensity with a color scale, the center panel outlines area cropping with a red border, and the right panel displays the result fitted into a 16-by-16 pixel grid with gray zero padding.</alt-text>
</graphic>
</fig>
</sec>
<sec>
<label>2.2.2</label>
<title>Model development</title>
<p>Previous studies have applied CNN&#x02013;LSTM models for flood forecasting by learning from image-based representations of meteorological and hydrological conditions in upstream areas. The input images are typically generated from multiple data sources, including ground-based observations, model-derived products, radar rainfall imagery, and various supplementary data analyses, in order to construct images that effectively capture the factors influencing discharge at the forecasting station. Consequently, the preparation of such input images constitutes a labor-intensive and relatively complex process, which may constrain the practical applicability of these approaches for real-time forecasting. To overcome limitations associated with sparse ground-based observations in upstream areas and the complexity of input data preprocessing in data-scarce regions, we employed a hybrid deep learning model to capture spatiotemporal relationships within the satellite imagery and historical trends of the target variable. Inspired by <xref ref-type="bibr" rid="B16">Song (2022)</xref> and <xref ref-type="bibr" rid="B11">Li X. et al. (2022)</xref>, a time-distributed CNN was used to extract spatial features from satellite-based precipitation images. The resulting CNN-derived feature vectors were then concatenated with historical discharge inputs and passed to the LSTM component to learn temporal dependencies, using the TC concept as a look-back parameter.</p>
<p>In contrast to previous studies, our proposed framework exhibited key differences. <xref ref-type="bibr" rid="B16">Song (2022)</xref> employed a CNN-only architecture for runoff simulation, without incorporating recurrent layers to model temporal dynamics. <xref ref-type="bibr" rid="B11">Li X. et al. (2022)</xref> relied on CNN-LSTM architectures for rainfall-runoff modeling based on observation-derived rainfall inputs but did not integrate river flow as an explicit model input. From an architectural perspective, while prior studies primarily utilized custom-designed convolutional stacks tailored to specific datasets, we instead adopted a convolutional layer design based on the Visual Geometry Group-16 (VGG-16) architecture, which has demonstrated strong performance in image-related tasks compared to relatively simpler networks. Our simplified version of the VGG-16 model consisted of two consecutive 2D convolutional layers with 64 filters each. We applied a time-distributed wrapper around the convolutional layers to handle temporal sequences. This allowed the same convolutional operations to be applied to each temporal slice of the input data. In particular, we utilized a TC period as a look-back window (<xref ref-type="bibr" rid="B17">Thaisiam et al., 2022</xref>), enabling the model to recognize temporal patterns over longer periods. Max-pooling layers were added after the convolutional layers to reduce data dimensionality while retaining spatial information. A series of convolutional layers and max-pooling layers was additionally stacked, with the final output being flattened into a dense layer comprising 512 units.</p>
<p>The CNN-based architecture was designed to learn spatial relationships from satellite imagery while reducing the high-dimensional data into a 1D vector of size 512. To incorporate the historical discharge information, this 1D vector was concatenated with the downstream discharge data, resulting in a combined feature vector of 513 units, aligned with the same TC-period temporal window. Two LSTM layers, each with 16 units, were used to model the temporal relationships within the historical discharge data. LSTMs were chosen for their effectiveness in capturing long-term dependencies in sequential data. In addition, two fully connected layers were added to transform the LSTM outputs into a suitable representation for forecasting. The final layer consisted of 24 output units, corresponding to the desired forecasting horizons. <xref ref-type="fig" rid="F5">Figure 5</xref> illustrates the proposed network architecture.</p>
<fig position="float" id="F5">
<label>Figure 5</label>
<caption><p>Proposed network architecture.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0005.tif">
<alt-text content-type="machine-generated">Diagram of a deep learning architecture combining spatial and temporal inputs. Spatial features enter a simplified VGG-16 convolutional neural network with convolutional and max pooling layers. Temporal features are concatenated and passed to a flatten layer, followed by LSTM layers with sixteen units each, and finally fully connected layers producing a twenty-four dimensional output.</alt-text>
</graphic>
</fig>
<p>Several standard numerical metrics were utilized to evaluate the performance of our model. The correlation coefficient (R) was used to assess the strength of the linear relationship between the predicted values and the actual target variable. To further quantify the model&#x00027;s error, we calculated both the RMSE and the MAE. RMSE provides a measure of the standard deviation of the residuals, reflecting the average magnitude of the errors, while MAE indicates the average absolute deviation from the true values. Additionally, we computed the NSE coefficient to evaluate the model&#x00027;s effectiveness illogical context. The NSE represents the ratio of the residual variance to the variance of the observed data, offering insight into how well the model performs compared to a baseline prediction. The detailed configuration of the proposed CNN-LSTM framework is summarized in <xref ref-type="table" rid="T2">Table 2</xref>. The table reports the network architecture, key hyperparameters, and training settings adopted in this study, including input dimensions, convolutional and recurrent layer specifications, optimization strategy, and loss function.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Model configurations.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Model parameters</bold></th>
<th valign="top" align="left"><bold>Details</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Input shape 1 (images)</td>
<td valign="top" align="left">(TC, 16, 16, 1) [Time steps, Width, Height, Channel]</td>
</tr>
<tr>
<td valign="top" align="left">Input shape 2 (discharge)</td>
<td valign="top" align="left">(TC, 1) [Time steps, Feature]</td>
</tr>
<tr>
<td valign="top" align="left">CNN layers (TimeDistributed)</td>
<td valign="top" align="left">Conv2D (64, 128, 256, 512 filters) &#x0002B; MaxPooling2D</td>
</tr>
<tr>
<td valign="top" align="left">LSTM layers</td>
<td valign="top" align="left">2 Stacked layers (16 units each, activation: &#x0201C;relu&#x0201D;)</td>
</tr>
<tr>
<td valign="top" align="left">Dense layers</td>
<td valign="top" align="left">2 Layers (4,096 units each, Activation: &#x0201C;relu&#x0201D;) and an output layer (24 units)</td>
</tr>
<tr>
<td valign="top" align="left">Loss function</td>
<td valign="top" align="left">Mean squared error (MSE)</td>
</tr>
<tr>
<td valign="top" align="left">Optimizer</td>
<td valign="top" align="left">RMSprop</td>
</tr>
<tr>
<td valign="top" align="left">Hyperparameters</td>
<td valign="top" align="left">Lookback (History): TC, Future Target: 24, Step: 1</td>
</tr>
<tr>
<td valign="top" align="left">Training hyperparameters</td>
<td valign="top" align="left">Batch Size: 64, Epochs: 50, Steps per epoch: 50</td>
</tr>
<tr>
<td valign="top" align="left">Evaluation metrics</td>
<td valign="top" align="left">Mean absolute error (MAE), Root mean squared error (RMSE)</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
</sec>
</sec>
<sec id="s3">
<label>3</label>
<title>Results and discussion</title>
<sec>
<label>3.1</label>
<title>Testing dataset results</title>
<p>The multi-step hybrid model integrating CNNs and LSTMs was developed to predict discharge data 24 h in advance. We initially evaluated the performance of the proposed model using the GSMaP-MVK dataset for both the Upper Yom and Upper Chi River Basins. To comprehensively assess the model&#x00027;s accuracy and reliability, we calculated R, NSE, MAE, and RMSE at different forecasting horizons (specifically, 1-step, 6-step, 12-step and 24-step intervals), allowing us to observe how prediction errors progressed over time. <xref ref-type="table" rid="T3">Table 3</xref> provides a summary of all these metrics based on the internal test set of GSMaP-MVK for both river basins. The inclusion of multiple forecasting horizons evaluated both short-term prediction accuracy and the model&#x00027;s capability to maintain performance over longer periods.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Performance indices obtained from prediction results of testing dataset.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left" rowspan="2"><bold>Performance indices</bold></th>
<th valign="top" align="center" colspan="4">Upper Yom river basin</th>
<th valign="top" align="center" colspan="4">Upper Chi river basin</th>
</tr>
<tr>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>1H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>6H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>12H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>24H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>1H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>6H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>12H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>24H</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="9"><bold>GSMaP-MVK</bold></td>
</tr>
<tr>
<td valign="top" align="left">R</td>
<td valign="top" align="center">0.9926</td>
<td valign="top" align="center">0.9799</td>
<td valign="top" align="center">0.9526</td>
<td valign="top" align="center">0.8786</td>
<td valign="top" align="center">0.9970</td>
<td valign="top" align="center">0.9965</td>
<td valign="top" align="center">0.9954</td>
<td valign="top" align="center">0.9921</td>
</tr>
<tr>
<td valign="top" align="left">NSE</td>
<td valign="top" align="center">0.9765</td>
<td valign="top" align="center">0.9508</td>
<td valign="top" align="center">0.8983</td>
<td valign="top" align="center">0.7633</td>
<td valign="top" align="center">0.9743</td>
<td valign="top" align="center">0.9737</td>
<td valign="top" align="center">0.9726</td>
<td valign="top" align="center">0.9662</td>
</tr>
<tr>
<td valign="top" align="left">MAE (m<sup>3</sup>/s)</td>
<td valign="top" align="center">12.861</td>
<td valign="top" align="center">15.134</td>
<td valign="top" align="center">17.996</td>
<td valign="top" align="center">23.173</td>
<td valign="top" align="center">9.9051</td>
<td valign="top" align="center">9.8711</td>
<td valign="top" align="center">9.9351</td>
<td valign="top" align="center">10.065</td>
</tr>
<tr>
<td valign="top" align="left">RMSE (m<sup>3</sup>/s)</td>
<td valign="top" align="center">17.323</td>
<td valign="top" align="center">25.045</td>
<td valign="top" align="center">36.019</td>
<td valign="top" align="center">54.961</td>
<td valign="top" align="center">15.540</td>
<td valign="top" align="center">15.737</td>
<td valign="top" align="center">16.069</td>
<td valign="top" align="center">17.843</td>
</tr></tbody>
</table>
</table-wrap>
<p>According to <xref ref-type="table" rid="T3">Table 3</xref>, the proposed model exhibited an overall desirable performance. Specifically, it maintained a performance level well within acceptable error limits even for the 24-h prediction horizon. Overall, the model&#x00027;s predictive performance generally declined as the prediction horizon increased, particularly when evaluated using R, RMSE, and R. However, slight non-monotonic behavior is observed for MAE in certain cases, reflecting differences in metric sensitivity to extreme discharge errors. The non-monotonic behavior is attributable to its equal weighting of errors, whereas RMSE and NSE are more sensitive to large errors associated with peak flows, and R primarily reflects temporal pattern alignment rather than error magnitude. Across the two study areas, the results for the Upper Chi River Basin consistently outperformed those for the Upper Yom River Basin, achieving R and NSE values exceeding 0.95 for the 24-h forecasting horizon. This disparity could be attributed partially to the differences in the discharge patterns between the two basins. In the Upper Chi River Basin, the topography and river basin system promote a more synchronized flow of water from the main river and its tributaries toward the outlet. This results in relatively more stable discharge patterns with well-defined peaks occurring at specific intervals during the wet season of 2020 and 2021. In contrast, the Upper Yom River Basin, characterized by the feather-like pattern of its watercourses and steep upstream topography, displays highly variable discharge patterns, including abrupt peaks and irregular fluctuations, which make accurate prediction more challenging. These trends are visually represented in <xref ref-type="fig" rid="F6">Figures 6</xref>, <xref ref-type="fig" rid="F7">7</xref> for particular flood events, whereas <xref ref-type="supplementary-material" rid="SM1">Supplementary Figures 1</xref>, <xref ref-type="supplementary-material" rid="SM1">2</xref> in the Supplementary Material show the results for all test periods in the Upper Yom and Upper Chi River Basins, respectively.</p>
<fig position="float" id="F6">
<label>Figure 6</label>
<caption><p>Testing dataset results for the Upper Yom River Basin evaluated using GSMaP-MVK at T&#x0002B;1H, T&#x0002B;6H, T&#x0002B;12H, and T&#x0002B;24H. <bold>(a)</bold> Predicted discharge during flood periods; <bold>(b)</bold> scatter plot of predicted vs. observed discharge for the testing dataset.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0006.tif">
<alt-text content-type="machine-generated">Panel a displays two line charts comparing observed and predicted river discharge and precipitation over time, with multiple prediction intervals. Panel b contains four scatter plots showing predicted versus observed flow for time horizons of one, six, twelve, and twenty-four hours, each with corresponding correlation coefficients.</alt-text>
</graphic>
</fig>
<fig position="float" id="F7">
<label>Figure 7</label>
<caption><p>Testing dataset results for the Upper Chi River Basin evaluated using GSMaP-MVK at T&#x0002B;1H, T&#x0002B;6H, T&#x0002B;12H, and T&#x0002B;24H. <bold>(a)</bold> Predicted discharge during flood periods; <bold>(b)</bold> scatter plot of predicted vs. observed discharge for the testing dataset.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0007.tif">
<alt-text content-type="machine-generated">Panel a shows two line graphs comparing observed and predicted river discharge and precipitation over time, with multiple forecast lead times. Panel b features four scatter plots of predicted versus observed flow for different lead times, each displaying a high correlation coefficient.</alt-text>
</graphic>
</fig>
<p><xref ref-type="fig" rid="F6">Figures 6</xref>, <xref ref-type="fig" rid="F7">7</xref> provide a comparative analysis of the actual and predicted discharge data during the flood events in the internal testing period, alongside the average rainfall obtained from GSMaP-MVK. This visual representation facilitates an examination of the relationship between precipitation within the basin and observed discharge at the downstream station. Theoretically, these two variables could be expected to show a strong correlation, though there may be a noticeable lag between rainfall events and their impact on river discharge. In addition, scatter plots were generated to compare actual and predicted discharge values across various experimental forecasting horizons for both river basins (<xref ref-type="fig" rid="F6">Figures 6</xref>, <xref ref-type="fig" rid="F7">7</xref>). These plots enable a detailed analysis of model error trends, with points above the diagonal line indicating overpredictions and points below representing underpredictions. Furthermore, the degree of scattering around the diagonal line reflects the accuracy and consistency of the predictions.</p>
<p>In addition, box and whisker plots were constructed to analyze the distribution of actual discharge values with respect to the prediction, as well as the errors between the two, as depicted in <xref ref-type="fig" rid="F8">Figures 8</xref>, <xref ref-type="fig" rid="F9">9</xref>. These visualizations summarize key statistical characteristics of the data, including the interquartile range (represented by the box), the median (indicated by a horizontal line within the box), and the spread of the data (depicted by the whiskers and any identified outliers). By integrating these plots, the analysis not only identifies systematic biases in the model but also highlights the variability and extremities in the dataset, offering a comprehensive assessment of the model&#x00027;s predictive performance across different scenarios.</p>
<fig position="float" id="F8">
<label>Figure 8</label>
<caption><p>Box plots of testing dataset results for the Upper Yom River Basin in dry season (December 1 to April 30) and wet season (May1 to November 30) in <bold>(a)</bold> the distribution of the observed and predicted discharges over the forecast horizons and <bold>(b)</bold> the difference between the predicted and actual discharge.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0008.tif">
<alt-text content-type="machine-generated">Two box plot charts compare observed and predicted river discharge (m3/s) and associated error for dry and wet periods. Chart (a) shows discharge values for observed and forecasts at multiple lead times. Chart (b) presents forecast errors for the same periods, illustrating increasing discharge variability and errors with longer lead times.</alt-text>
</graphic>
</fig>
<fig position="float" id="F9">
<label>Figure 9</label>
<caption><p>Box plots of testing dataset results for the Upper Chi River Basin in dry season (December 1 to April 30) and wet season (May1 to November 30) in <bold>(a)</bold> the distribution of the observed and predicted discharges over the forecast horizons and <bold>(b)</bold> the difference between the predicted and actual discharge.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0009.tif">
<alt-text content-type="machine-generated">Two box plot charts compare observed and predicted river discharge (m&#x000B3;/s) and associated error for dry and wet periods. Chart (a) shows discharge values for observed and forecasts at multiple lead times. Chart (b) presents forecast errors for the same periods. Both charts indicate greater variability during wet conditions. Legends and box plot element keys are included for interpretation.</alt-text>
</graphic>
</fig>
<p>In the Upper Yom River Basin, the considerable average rainfall during 2020 was clearly correlated with a pronounced peak in the discharge data at a subsequent time lag, as illustrated in <xref ref-type="fig" rid="F6">Figure 6</xref>. This lag reflects the time required for the rainfall to flow through the basin and affects the downstream discharge station. During the early rainy season (May to June), due to high infiltration rates, rainfall in the catchment area contributes minimally to runoff at the outlet. In a major flood event in the Upper Yom River Basin during July 2020 (<xref ref-type="fig" rid="F6">Figure 6a</xref>), associated with Tropical Storm Higos, which caused severe flooding in northern Thailand. The predictions demonstrated good agreement with the observed flood hydrograph, particularly at short lead times of 1&#x02013;12 h. At these horizons, the model closely reproduced the flood hydrograph, accurately capturing both the timing and magnitude of the peak flow. However, as the prediction horizon extended to 24 h, model performance deteriorated, evidenced by increased errors and a delayed peak discharge relative to the observations. In addition, the scatter plot in <xref ref-type="fig" rid="F6">Figure 6b</xref> revealed a clustering of data points around the diagonal line, with some deviations, especially for longer forecasting horizons. The errors remained relatively small for lower discharge values but increased substantially for higher discharges. Both underprediction and overprediction were observed, with overprediction being slightly more prevalent for all forecasting horizons. This trend was further emphasized in <xref ref-type="fig" rid="F8">Figure 8b</xref>, depicting the difference between the predicted and actual discharge. The mean and median differences were positive for all modeled periods (both wet and dry), suggesting overprediction. Error variations, as evidenced by box size, gradually increased with longer forecasting horizons. Furthermore, the box sizes for the wet season were relatively larger than for the dry season, implying greater variability in the former, with some evidence of underprediction. <xref ref-type="fig" rid="F8">Figure 8a</xref> visually represents the distribution of the observed and predicted discharges across forecasting horizons, categorized into dry and wet seasons. In the dry season, the box plots were compact and centered near zero, with short whiskers, indicating minimal errors and well-performed model predictions. Conversely, during the wet season, the box plots expanded, reflecting greater variability in discharge values. The longer whiskers suggested a wider range of errors, accompanied by outliers that underscored the challenges for the model in capturing extreme events or abrupt flow changes. Notably, the box plots for the predicted values closely aligned with those of the observed values, indicating the model&#x00027;s robust performance, even under the dynamic conditions of the wet season.</p>
<p>The Upper Chi River Basin, which experienced comparatively lower precipitation levels, as shown in <xref ref-type="fig" rid="F7">Figure 7</xref>, had a weaker correlation between rainfall and discharge, attributable to the basin&#x00027;s characteristics, including its extensive river system and large catchment areas. Runoff from the upstream areas of the main river and its tributaries would reach the outlet almost simultaneously. As a result, even when rainfall in the tributary catchments was modest, the runoff at the outlet remained relatively high, particularly during the late rainy season. The scatter plots demonstrated an even closer clustering of data points along the diagonal line, particularly for lower discharge values. Deviations from the diagonal generally indicate model underprediction across all forecasting horizons. In <xref ref-type="fig" rid="F9">Figure 9b</xref> supported this observation, showing consistently negative values for the difference between predicted and actual discharge. The relatively similar spread of the box plots across forecasting horizons suggests that the overall distribution of prediction errors does not exhibit a pronounced change with increasing lead time. This may be attributed to the discharge pattern, characterized by a few peaks occurring within a short timeframe. Since most of the training data consisted of relatively low and stable discharge values, the model had a tendency to underpredict higher discharge events. The distributions of observed and predicted discharge, shown in <xref ref-type="fig" rid="F9">Figure 9a</xref>, had similar patterns to those observed in the Upper Yom River Basin.</p>
<p>To further assess the performance of the proposed model across temporal scales and seasonal conditions, <xref ref-type="fig" rid="F10">Figure 10</xref> presents the average monthly RMSE of discharge predictions at lead times of T &#x0002B; 1H, T &#x0002B; 6H, T &#x0002B; 12H, and T &#x0002B; 24H during the testing period (2019&#x02013;2022). Panels (a) and (b) show results for the Upper Yom and Upper Chi River basins, respectively. During the dry season, when discharge levels are low, prediction errors are comparable across all lead times in both basins. In contrast, errors increase during the wet season, particularly in months characterized by a wide range of discharge variability. In the Upper Yom River basin, discharge in July ranges from 0 to 1,252 m<sup>3</sup>/s and exhibits pronounced hourly fluctuations, which coincides with elevated prediction errors at longer lead times. A similar pattern is observed in the Upper Chi River Basin in September. The higher errors are associated with pronounced hourly discharge variability, which poses challenges for the model in accurately capturing rapid flow dynamics compared with periods of more stable discharge conditions.</p>
<fig position="float" id="F10">
<label>Figure 10</label>
<caption><p>The average monthly RMSE of discharge forecasts at lead time T &#x0002B; 1H, T &#x0002B; 6H, T &#x0002B; 12H, and T &#x0002B; 24H during the testing period (2019&#x02013;2022) <bold>(a)</bold> results for Upper Yom River Basin <bold>(b)</bold> results for Upper Chi River Basin.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0010.tif">
<alt-text content-type="machine-generated">Panel (a) and panel (b) present line graphs comparing root mean square error (RMSE) of predicted discharge at different forecast horizons (T+1H, T+6H, T+12H, T+24H) by month, overlaid with blue and orange bar charts showing hourly discharge ranges for wet and dry seasons, respectively, at two stations for the period 2019 to 2022.</alt-text>
</graphic>
</fig>
</sec>
<sec>
<label>3.2</label>
<title>External testing dataset results</title>
<p>After training and fine-tuning our models&#x00027; hyperparameters on the GSMaP-MVK validation set, we collected additional datasets as external test sets. An external test set is a crucial component in validating the performance of deep learning models as it helps in preventing overfitting, assessing generalization, aiding model selection, preventing data leakage, and providing a realistic prediction of real-world performance. By using an external test set, we could ensure that our model was robust, reliable, and ready for deployment.</p>
<p>In this work, we considered recent 2-year data obtained from the downstream station-based discharge data and the satellite-based precipitation data as our external test datasets. Specifically, we collected GSMaP-MVK and GSMaP-NOW data from 2022 to 2024. We prioritized GSMaP-NOW because it offers more up-to-date data with only a 30-min time lag compared to the 3-day lag in GSMaP-MVK. If our model (trained on GSMaP-MVK) demonstrated satisfactory performance on GSMaP-NOW, it would suggest high potential for implementation in a real-time early warning system. The ability to accurately predict discharge based on near-real-time precipitation data is essential for timely flood alerts. It should be noted that although the use of GSMaP-NOW enables relatively near real-time precipitation data within the proposed framework, operational hydrological forecasting systems may still face data latency issues. In practice, both discharge and precipitation data can be affected by reporting delays, data gaps, and quality control procedures, which may result in the unavailability of observations for the most recent hours. This operational limitation is not explicitly addressed in the current study. Future work should evaluate the proposed framework under fully operational conditions and explore strategies to mitigate potential data latency issues. <xref ref-type="table" rid="T4">Table 4</xref> summarizes the performance of the model on the external test datasets calculated from GSMaP-MVK and GSMaP-NOW for both study areas.</p>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Performance indices obtained from prediction results of external test dataset.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left" rowspan="2"><bold>Performance indices</bold></th>
<th valign="top" align="center" colspan="4">Upper Yom river basin</th>
<th valign="top" align="center" colspan="4">Upper Chi river basin</th>
</tr>
<tr>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>1H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>6H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>12H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>24H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>1H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>6H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>12H</bold></th>
<th valign="top" align="center"><bold>T</bold> &#x0002B; <bold>24H</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="9"><bold>GSMaP-MVK</bold></td>
</tr>
<tr>
<td valign="top" align="left">R</td>
<td valign="top" align="center">0.9919</td>
<td valign="top" align="center">0.9791</td>
<td valign="top" align="center">0.9514</td>
<td valign="top" align="center">0.8736</td>
<td valign="top" align="center">0.9989</td>
<td valign="top" align="center">0.9986</td>
<td valign="top" align="center">0.9980</td>
<td valign="top" align="center">0.9957</td>
</tr>
<tr>
<td valign="top" align="left">NSE</td>
<td valign="top" align="center">0.9826</td>
<td valign="top" align="center">0.9558</td>
<td valign="top" align="center">0.8981</td>
<td valign="top" align="center">0.7459</td>
<td valign="top" align="center">0.9769</td>
<td valign="top" align="center">0.9761</td>
<td valign="top" align="center">0.9757</td>
<td valign="top" align="center">0.9700</td>
</tr>
<tr>
<td valign="top" align="left">MAE (m<sup>3</sup>/s)</td>
<td valign="top" align="center">6.531</td>
<td valign="top" align="center">9.720</td>
<td valign="top" align="center">13.881</td>
<td valign="top" align="center">20.834</td>
<td valign="top" align="center">11.369</td>
<td valign="top" align="center">11.360</td>
<td valign="top" align="center">11.289</td>
<td valign="top" align="center">11.688</td>
</tr>
<tr>
<td valign="top" align="left">RMSE (m<sup>3</sup>/s)</td>
<td valign="top" align="center">13.024</td>
<td valign="top" align="center">20.009</td>
<td valign="top" align="center">29.921</td>
<td valign="top" align="center">46.915</td>
<td valign="top" align="center">15.233</td>
<td valign="top" align="center">15.490</td>
<td valign="top" align="center">15.609</td>
<td valign="top" align="center">17.365</td>
</tr>
<tr>
<td valign="top" align="left" colspan="9"><bold>GSMaP-NOW</bold></td>
</tr>
<tr>
<td valign="top" align="left">R</td>
<td valign="top" align="center">0.9925</td>
<td valign="top" align="center">0.9784</td>
<td valign="top" align="center">0.9476</td>
<td valign="top" align="center">0.8615</td>
<td valign="top" align="center">0.9988</td>
<td valign="top" align="center">0.9985</td>
<td valign="top" align="center">0.9980</td>
<td valign="top" align="center">0.9956</td>
</tr>
<tr>
<td valign="top" align="left">NSE</td>
<td valign="top" align="center">0.9817</td>
<td valign="top" align="center">0.9510</td>
<td valign="top" align="center">0.8861</td>
<td valign="top" align="center">0.7170</td>
<td valign="top" align="center">0.9767</td>
<td valign="top" align="center">0.9760</td>
<td valign="top" align="center">0.9753</td>
<td valign="top" align="center">0.9697</td>
</tr>
<tr>
<td valign="top" align="left">MAE(m<sup>3</sup>/s)</td>
<td valign="top" align="center">6.561</td>
<td valign="top" align="center">10.068</td>
<td valign="top" align="center">14.552</td>
<td valign="top" align="center">21.786</td>
<td valign="top" align="center">11.363</td>
<td valign="top" align="center">11.298</td>
<td valign="top" align="center">11.383</td>
<td valign="top" align="center">11.676</td>
</tr>
<tr>
<td valign="top" align="left">RMSE(m<sup>3</sup>/s)</td>
<td valign="top" align="center">13.332</td>
<td valign="top" align="center">21.014</td>
<td valign="top" align="center">31.607</td>
<td valign="top" align="center">49.493</td>
<td valign="top" align="center">15.303</td>
<td valign="top" align="center">15.522</td>
<td valign="top" align="center">15.764</td>
<td valign="top" align="center">17.436</td>
</tr></tbody>
</table>
</table-wrap>
<p>Based on the comparison of the evaluation metrics using GSMaP-MVK on the internal test set (<xref ref-type="table" rid="T3">Table 3</xref>) and the external test set (<xref ref-type="table" rid="T4">Table 4</xref>), the model performed consistently, with only slight variations between the two datasets. These minor differences suggested no evidence of overfitting, with the variation perhaps due to the different discharge patterns observed during the testing time periods. We further compared the model&#x00027;s performance based on the GSMaP-MVK and GSMaP-NOW datasets, with the performance differences between them being minimal, indicating that the model trained on one dataset was transferable to another dataset. The ability to apply a model trained on GSMaP-MVK to GSMaP-NOW is particularly advantageous for real-world applications. Notably, GSMaP-NOW data has a shorter lag time, making it more suitable for timely decision making and operational use.</p>
<p><xref ref-type="fig" rid="F11">Figures 11</xref>, <xref ref-type="fig" rid="F12">12</xref> present a comparative analysis of actual and predicted discharge during flood periods in the external test dataset for the Upper Yom River Basin, coupled with the average rainfall depth obtained from GSMaP-MVK and GSMaP-NOW, respectively. The model accurately reproduced both peak flood discharges and the timing of flood events across all forecasting lead times. Predicted discharge results for the entire external testing period using GSMaP-MVK and GSMaP-NOW are shown in <xref ref-type="supplementary-material" rid="SM1">Supplementary Figures 3</xref>, <xref ref-type="supplementary-material" rid="SM1">4</xref>, respectively. The model&#x00027;s performances were essentially consistent across datasets, despite slight differences in the rainfall patterns. The consistency of the model performance suggested that our proposed framework was robust and capable of handling input variability. The model effectively captured the major trends, delivering preferable final predictions even in the presence of outliers.</p>
<fig position="float" id="F11">
<label>Figure 11</label>
<caption><p>External test dataset for the Upper Yom River Basin evaluated using GSMaP-MVK at T &#x0002B; 1H, T &#x0002B; 6H, T &#x0002B; 12H, and T &#x0002B; 24H. <bold>(a)</bold> Predicted discharge during flood periods; <bold>(b)</bold> scatter plot of predicted vs. observed discharge for the external test dataset.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0011.tif">
<alt-text content-type="machine-generated">Panel (a) contains two line graphs comparing observed and predicted river discharge over time with corresponding precipitation, while panel (b) shows four scatter plots comparing observed and predicted flow at different forecast lead times, each labeled with correlation coefficients.</alt-text>
</graphic>
</fig>
<fig position="float" id="F12">
<label>Figure 12</label>
<caption><p>External test dataset for the Upper Yom River Basin evaluated using GSMaP-NOW at T &#x0002B; 1H, T &#x0002B; 6H, T &#x0002B; 12H, and T &#x0002B; 24H. <bold>(a)</bold> Predicted discharge during flood periods; <bold>(b)</bold> scatter plot of predicted vs. observed discharge for the external test dataset.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0012.tif">
<alt-text content-type="machine-generated">Figure contains two main panels labeled (a) and (b). Panel (a) displays two line graphs comparing observed and predicted river discharge against precipitation from August to October, differentiated by temporal prediction intervals. Panel (b) shows four scatterplots, each relating predicted and observed flow for forecast horizons of one, six, twelve, and twenty-four hours, with corresponding correlation coefficients decreasing as forecast interval increases.</alt-text>
</graphic>
</fig>
<p><xref ref-type="fig" rid="F13">Figures 13</xref>, <xref ref-type="fig" rid="F14">14</xref> provide a similar comparative analysis for the Upper Chi River Basin, while <xref ref-type="supplementary-material" rid="SM1">Supplementary Figures 5</xref>, <xref ref-type="supplementary-material" rid="SM1">6</xref> show results for the entire external test period using GSMaP-MVK and GSMaP-NOW, respectively. These results reinforce the model&#x00027;s generalizability and its ability to maintain stable performance across different river basins and input data sources. The plots demonstrate that model performance remains largely consistent, despite minor variations in rainfall patterns. Overall, the precipitation trends for both data sources were comparable, with a notable peak observed in GSMaP-NOW during the wet season of 2023 (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 6</xref>). This observation was corroborated by the mass curves, which indicated that the accumulated precipitation for both datasets was similar, with a slight increase in GSMaP-NOW, particularly during this peak period. Based on these results, our proposed model demonstrated robustness and the ability to adapt to subtle variations in the input data. This adaptability is crucial for real-world applications, particularly when the model is deployed as a flooding early warning system. In dynamic and often unpredictable environments, such as those involving fluctuating rainfall patterns and varying hydrological conditions, the model&#x00027;s flexibility ensures reliable performance, making it a strong candidate for operational use in flood prediction and management.</p>
<fig position="float" id="F13">
<label>Figure 13</label>
<caption><p>External test dataset for the Upper Chi River Basin evaluated using GSMaP-MVK at T &#x0002B; 1H, T &#x0002B; 6H, T &#x0002B; 12H, and T &#x0002B; 24H. <bold>(a)</bold> Predicted discharge during flood periods; <bold>(b)</bold> scatter plot of predicted vs. observed discharge for the external test dataset.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0013.tif">
<alt-text content-type="machine-generated">Figure with two panels labeled a and b. Panel a contains two time series charts displaying observed and predicted river discharge against precipitation from September to November, with a sharp peak in October and multiple lines for prediction intervals. Panel b contains four scatter plots comparing predicted and observed river flow at forecast horizons of one, six, twelve, and twenty-four hours, demonstrating strong linear correlation and high R values above 0.99.</alt-text>
</graphic>
</fig>
<fig position="float" id="F14">
<label>Figure 14</label>
<caption><p>External test dataset for the Upper Chi River Basin evaluated using GSMaP-NOW at T &#x0002B; 1H, T &#x0002B; 6H, T &#x0002B; 12H, and T &#x0002B; 24H. <bold>(a)</bold> Predicted discharge during flood periods; <bold>(b)</bold> scatter plot of predicted vs. observed discharge for the external test dataset.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1753598-g0014.tif">
<alt-text content-type="machine-generated">Panel (a) contains two time series plots showing river discharge in cubic meters per second overlaid with precipitation data for two different periods, with multiple predicted and observed discharge lines and a red precipitation bar chart. Panel (b) features four scatter plots comparing predicted versus observed flow for lead times of one, six, twelve, and twenty-four hours, each with a line indicating perfect agreement and R values above 0.99.</alt-text>
</graphic>
</fig>
<p>The use of satellite-based data has proven to be promising for predicting hydrological conditions in data-scarce areas, such as the regions in our study. Our model delivered reasonably good performance, even for extended forecasting horizons under realistic data constraints, while acknowledging that completely ungauged forecasting remains an important topic for future research. In addition, further refinements are necessary to optimize the model&#x00027;s effectiveness for long-term predictions, especially in early warning systems. Several strategies could be considered to enhance the model&#x00027;s performance for extended forecasts. Fine-tuning model parameters or integrating more advanced algorithms may enhance accuracy, especially in predicting extreme events. Additionally, incorporating variables, such as rainfall intensity, antecedent soil moisture conditions, or land use changes, could significantly improve the model&#x00027;s predictive capabilities. For real-world deployment, further testing with a larger and more diverse dataset, especially one that includes a broader range of extreme events, would offer a more comprehensive evaluation of the model&#x00027;s robustness and reliability. Moreover, extending the proposed framework to basins in different geographical regions may introduce additional challenges related to basin-scale variability, which remain to be explored in future work. To address these challenges, adaptive input representations&#x02014;such as basin-normalized spatial windows, multi-resolution pooling strategies, or attention-based spatial weighting mechanisms&#x02014;could be incorporated to better capture scale-dependent precipitation patterns. Such developments may enhance model transferability across basins of varying sizes and physiographic characteristics, thereby improving its suitability for operational early warning applications where accurate prediction of extreme hydrological events is critical for timely and effective decision-making.</p>
<p>In this study, all input data, including GSMaP precipitation products and discharge observations, are obtained from publicly available sources and responsible organizations. These datasets do not contain personal, proprietary, or sensitive information. Data processing and modeling procedures are documented to ensure transparency and reproducibility. However, the application of the proposed model for flood forecasting requires careful consideration of data limitations and potential bias, as historical precipitation and discharge datasets may reflect legacy effects of past water management practices and uneven spatial and temporal monitoring coverage. These issues are particularly relevant in flood early warning applications, where model outputs may directly support risk communication and emergency response. Therefore, the results should be interpreted as decision-support information rather than definitive predictions, with explicit recognition of uncertainty and the continued role of expert judgment in responsible flood risk management.</p>
</sec>
</sec>
<sec sec-type="conclusion" id="s4">
<label>4</label>
<title>Conclusion</title>
<p>The proposed network architecture effectively integrated both spatial and temporal information, leveraging the strengths of CNNs for spatial feature extraction and LSTMs for temporal dependency modeling. This approach demonstrated potential for satellite data analysis and time series forecasting in hydrological contexts. Internal and external validation using the GSMaP-MVK and GSMaP-NOW datasets confirmed the model&#x00027;s reliability and generalization across different data scenarios, especially for real-time conditions. The integration of advanced deep learning techniques and satellite data offers a scalable and practical solution for enhancing discharge predictions in data-limited regions. Our proposed framework should not only improve hydrological forecast accuracy but should also support proactive water resource management, particularly in catchments where upstream ground-based measurements are sparse or incomplete. Potential future research directions include expanding the model by incorporating additional environmental variables, exploring more sophisticated neural network architectures, and testing the approach across diverse hydrological systems to validate and extend its broader applicability.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec sec-type="author-contributions" id="s6">
<title>Author contributions</title>
<p>PW: Supervision, Software, Data curation, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing, Conceptualization, Methodology, Validation. KY: Writing &#x02013; original draft, Visualization, Formal analysis, Methodology. WT: Funding acquisition, Investigation, Supervision, Data curation, Writing &#x02013; original draft, Project administration, Conceptualization, Methodology.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s8">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/frwa.2026.1753598/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/frwa.2026.1753598/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image_1.jpeg" id="SM1" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_2.jpeg" id="SM2" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_3.jpeg" id="SM3" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_4.jpeg" id="SM4" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_5.jpeg" id="SM5" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_6.jpeg" id="SM6" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chang</surname> <given-names>F.-J.</given-names></name> <name><surname>Chang</surname> <given-names>L.-C.</given-names></name> <name><surname>Chen</surname> <given-names>J.-F.</given-names></name></person-group> (<year>2023</year>). <article-title>Artificial intelligence techniques in hydrology and water resources management</article-title>. <source>Water</source> <volume>15</volume>:<fpage>1846</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w15101846</pub-id></mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chenmin</surname> <given-names>N.</given-names></name> <name><surname>Marsani</surname> <given-names>M. F.</given-names></name> <name><surname>Pei Shan</surname> <given-names>F.</given-names></name></person-group> (<year>2024</year>). <article-title>Flood prediction based on feature selection and a hybrid deep learning network</article-title>. <source>J. Water Clim. Change</source> <volume>15</volume>, <fpage>1245</fpage>&#x02013;<lpage>1261</lpage>. doi: <pub-id pub-id-type="doi">10.2166/wcc.2024.559</pub-id></mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Feng</surname> <given-names>J.</given-names></name> <name><surname>Sha</surname> <given-names>H.</given-names></name> <name><surname>Ding</surname> <given-names>Y.</given-names></name> <name><surname>Yan</surname> <given-names>L.</given-names></name> <name><surname>Yu</surname> <given-names>Z.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Graph convolution based spatial-temporal attention LSTM model for flood forecasting,&#x0201D;</article-title> in <source>Paper Presented at the 2022 International Joint Conference on Neural Networks (IJCNN)</source> (<publisher-loc>Padua</publisher-loc>: <publisher-name>IEEE</publisher-name>). doi: <pub-id pub-id-type="doi">10.1109/IJCNN55064.2022.9892371</pub-id></mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hashemi</surname> <given-names>M.</given-names></name></person-group> (<year>2019</year>). <article-title>Enlarging smaller images before inputting into convolutional neural network: zero-padding vs. interpolation</article-title>. <source>J. Big Data</source> <volume>6</volume>, <fpage>1</fpage>&#x02013;<lpage>13</lpage>. doi: <pub-id pub-id-type="doi">10.1186/s40537-019-0263-7</pub-id></mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>F.</given-names></name> <name><surname>Yang</surname> <given-names>Q.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name> <name><surname>Luo</surname> <given-names>Z.</given-names></name> <name><surname>Shao</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>G.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Incorporating multiple grid-based data in CNN-LSTM hybrid model for daily runoff prediction in the source region of the Yellow River Basin</article-title>. <source>J. Hydrol. Reg. Stud.</source> <volume>51</volume>:<fpage>101652</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ejrh.2023.101652</pub-id></mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kratzert</surname> <given-names>F.</given-names></name> <name><surname>Klotz</surname> <given-names>D.</given-names></name> <name><surname>Brenner</surname> <given-names>C.</given-names></name> <name><surname>Schulz</surname> <given-names>K.</given-names></name> <name><surname>Herrnegger</surname> <given-names>M.</given-names></name></person-group> (<year>2018</year>). <article-title>Rainfall-runoff modelling using long short-term memory (LSTM) networks</article-title>. <source>Hydrol. Earth Syst. Sci.</source> <volume>22</volume>, <fpage>6005</fpage>&#x02013;<lpage>6022</lpage>. doi: <pub-id pub-id-type="doi">10.5194/hess-22-6005-2018</pub-id></mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Kubota</surname> <given-names>T.</given-names></name> <name><surname>Aonashi</surname> <given-names>K.</given-names></name> <name><surname>Ushio</surname> <given-names>T.</given-names></name> <name><surname>Shige</surname> <given-names>S.</given-names></name> <name><surname>Takayabu</surname> <given-names>Y. N.</given-names></name> <name><surname>Kachi</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>&#x0201C;Global satellite mapping of precipitation (GSMaP) products in the GPM era,&#x0201D;</article-title> in <source>Satellite Precipitation Measurement</source> (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>355</fpage>&#x02013;<lpage>373</lpage>. doi: <pub-id pub-id-type="doi">10.1007/978-3-030-24568-9_20</pub-id></mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kumar</surname> <given-names>V.</given-names></name> <name><surname>Azamathulla</surname> <given-names>H. M.</given-names></name> <name><surname>Sharma</surname> <given-names>K. V.</given-names></name> <name><surname>Mehta</surname> <given-names>D. J.</given-names></name> <name><surname>Maharaj</surname> <given-names>K. T.</given-names></name></person-group> (<year>2023</year>). <article-title>The state of the art in deep learning applications, challenges, and future prospects: a comprehensive review of flood forecasting and management</article-title>. <source>Sustainability</source> <volume>15</volume>:<fpage>10543</fpage>. doi: <pub-id pub-id-type="doi">10.3390/su151310543</pub-id></mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>J.</given-names></name> <name><surname>Lee</surname> <given-names>J. E.</given-names></name> <name><surname>Kim</surname> <given-names>N. W.</given-names></name></person-group> (<year>2020</year>). <article-title>Estimation of hourly flood hydrograph from daily flows using artificial neural network and flow disaggregation technique</article-title>. <source>Water</source> <volume>13</volume>:<fpage>30</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w13010030</pub-id></mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>P.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Krebs</surname> <given-names>P.</given-names></name></person-group> (<year>2022</year>). <article-title>Prediction of flow based on a CNN-LSTM combined deep learning approach</article-title>. <source>Water</source> <volume>14</volume>:<fpage>993</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w14060993</pub-id></mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Xu</surname> <given-names>W.</given-names></name> <name><surname>Ren</surname> <given-names>M.</given-names></name> <name><surname>Jiang</surname> <given-names>Y.</given-names></name> <name><surname>Fu</surname> <given-names>G.</given-names></name></person-group> (<year>2022</year>). <article-title>Hybrid CNN-LSTM models for river flow prediction</article-title>. <source>Water Supply</source> <volume>22</volume>, <fpage>4902</fpage>&#x02013;<lpage>4919</lpage>. doi: <pub-id pub-id-type="doi">10.2166/ws.2022.170</pub-id></mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Malik</surname> <given-names>H.</given-names></name> <name><surname>Feng</surname> <given-names>J.</given-names></name> <name><surname>Shao</surname> <given-names>P.</given-names></name> <name><surname>Abduljabbar</surname> <given-names>Z. A.</given-names></name></person-group> (<year>2024</year>). <article-title>Improving flood forecasting using time-distributed CNN-LSTM model: a time-distributed spatiotemporal method</article-title>. <source>Earth Sci. Inf.</source> <volume>17</volume>, <fpage>1</fpage>&#x02013;<lpage>20</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s12145-024-01354-y</pub-id></mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Senent-Aparicio</surname> <given-names>J.</given-names></name> <name><surname>Jimeno-S&#x000E1;ez</surname> <given-names>P.</given-names></name> <name><surname>Bueno-Crespo</surname> <given-names>A.</given-names></name> <name><surname>P&#x000E9;rez-S&#x000E1;nchez</surname> <given-names>J.</given-names></name> <name><surname>Pulido-Vel&#x000E1;zquez</surname> <given-names>D.</given-names></name></person-group> (<year>2019</year>). <article-title>Coupling machine-learning techniques with SWAT model for instantaneous peak flow prediction</article-title>. <source>Biosyst. Eng.</source> <volume>177</volume>, <fpage>67</fpage>&#x02013;<lpage>77</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biosystemseng.2018.04.022</pub-id></mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shen</surname> <given-names>C.</given-names></name> <name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Laloy</surname> <given-names>E.</given-names></name></person-group> (<year>2021</year>). <article-title>Broadening the use of machine learning in hydrology</article-title>. <source>Front Water</source> <volume>3</volume>:<fpage>681023</fpage>. doi: <pub-id pub-id-type="doi">10.3389/frwa.2021.681023</pub-id></mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sit</surname> <given-names>M.</given-names></name> <name><surname>Demiray</surname> <given-names>B. Z.</given-names></name> <name><surname>Xiang</surname> <given-names>Z.</given-names></name> <name><surname>Ewing</surname> <given-names>G. J.</given-names></name> <name><surname>Sermet</surname> <given-names>Y.</given-names></name> <name><surname>Demir</surname> <given-names>I.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>A comprehensive review of deep learning applications in hydrology and water resources</article-title>. <source>Water Sci. Technol.</source> <volume>82</volume>, <fpage>2635</fpage>&#x02013;<lpage>2670</lpage>. doi: <pub-id pub-id-type="doi">10.2166/wst.2020.369</pub-id><pub-id pub-id-type="pmid">33341760</pub-id></mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Song</surname> <given-names>C. M.</given-names></name></person-group> (<year>2022</year>). <article-title>Data construction methodology for convolution neural network based daily runoff prediction and assessment of its applicability</article-title>. <source>J. Hydrol.</source> <volume>605</volume>:<fpage>127324</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jhydrol.2021.127324</pub-id></mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Thaisiam</surname> <given-names>W.</given-names></name> <name><surname>Saelo</surname> <given-names>W.</given-names></name> <name><surname>Wongchaisuwat</surname> <given-names>P.</given-names></name></person-group> (<year>2022</year>). <article-title>Enhancing a multi-step discharge prediction with deep learning and a response time parameter</article-title>. <source>Water</source> <volume>14</volume>:<fpage>2898</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w14182898</pub-id></mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Thaisiam</surname> <given-names>W.</given-names></name> <name><surname>Yomwilai</surname> <given-names>K.</given-names></name> <name><surname>Wongchaisuwat</surname> <given-names>P.</given-names></name></person-group> (<year>2024</year>). <article-title>Utilizing sequential modeling in collaborative method for flood forecasting</article-title>. <source>J. Hydrol.</source> <volume>636</volume>:<fpage>131290</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jhydrol.2024.131290</pub-id></mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tongal</surname> <given-names>H.</given-names></name> <name><surname>Booij</surname> <given-names>M. J.</given-names></name></person-group> (<year>2018</year>). <article-title>Simulation and forecasting of streamflows using machine learning models coupled with base flow separation</article-title>. <source>J. Hydrol.</source> <volume>564</volume>, <fpage>266</fpage>&#x02013;<lpage>282</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jhydrol.2018.07.004</pub-id></mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Xu</surname> <given-names>L.</given-names></name> <name><surname>Yu</surname> <given-names>F.</given-names></name> <name><surname>Zhang</surname> <given-names>S.</given-names></name></person-group> (<year>2023</year>). <article-title>Streamflow simulation with high-resolution WRF input variables based on the CNN-LSTM hybrid model and gamma test</article-title>. <source>Water</source> <volume>15</volume>:<fpage>1422</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w15071422</pub-id></mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Waqas</surname> <given-names>M.</given-names></name> <name><surname>Humphries</surname> <given-names>U. W.</given-names></name></person-group> (<year>2024</year>). <article-title>A critical review of RNN and LSTM variants in hydrological time series predictions</article-title>. <source>MethodsX</source> <volume>13</volume>:<fpage>102946</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.mex.2024.102946</pub-id><pub-id pub-id-type="pmid">39324077</pub-id></mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="book"><collab>WMO</collab> (<year>2022</year>). <source>Early Warning System</source>. <publisher-loc>Geneva</publisher-loc>: <publisher-name>WMO</publisher-name>.</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="book"><collab>WMO</collab> (<year>2024</year>). <article-title>&#x0201C;State of the climate in Asia 2023 (WMO-No.1350),&#x0201D;</article-title> in <source>Paper Presented at the 80th Session of the Commission (ESCAP)</source> (<publisher-loc>Bangkok</publisher-loc>).</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>W.</given-names></name> <name><surname>Emerton</surname> <given-names>R.</given-names></name> <name><surname>Duan</surname> <given-names>Q.</given-names></name> <name><surname>Wood</surname> <given-names>A. W.</given-names></name> <name><surname>Wetterhall</surname> <given-names>F.</given-names></name> <name><surname>Robertson</surname> <given-names>D. E.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Ensemble flood forecasting: current status and future opportunities</article-title>. <source>Water</source> <volume>7</volume>:<fpage>e1432</fpage>. doi: <pub-id pub-id-type="doi">10.1002/wat2.1432</pub-id></mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yao</surname> <given-names>Z.</given-names></name> <name><surname>Wang</surname> <given-names>Z.</given-names></name> <name><surname>Wang</surname> <given-names>D.</given-names></name> <name><surname>Wu</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name></person-group> (<year>2023</year>). <article-title>An ensemble CNN-LSTM and GRU adaptive weighting model based improved sparrow search algorithm for predicting runoff using historical meteorological and runoff data as input</article-title>. <source>J. Hydrol.</source> <volume>625</volume>:<fpage>129977</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jhydrol.2023.129977</pub-id></mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zanchetta</surname> <given-names>A. D.</given-names></name> <name><surname>Coulibaly</surname> <given-names>P.</given-names></name> <name><surname>Fortin</surname> <given-names>V.</given-names></name></person-group> (<year>2022</year>). <article-title>Forecasting high-flow discharges in a flashy catchment using multiple precipitation estimates as predictors in machine learning models</article-title>. <source>Hydrology</source> <volume>9</volume>:<fpage>216</fpage>. doi: <pub-id pub-id-type="doi">10.3390/hydrology9120216</pub-id></mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Yan</surname> <given-names>H.</given-names></name></person-group> (<year>2023</year>). <article-title>A long short-term components neural network model with data augmentation for daily runoff forecasting</article-title>. <source>J. Hydrol.</source> <volume>617</volume>:<fpage>128853</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jhydrol.2022.128853</pub-id></mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/790005/overview">Alyssa Dausman</ext-link>, The Water Institute of the Gulf, United States</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2170429/overview">Yuan Yang</ext-link>, University of California, San Diego, United States</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3303557/overview">Yizhou Qian</ext-link>, Tsinghua University, China</p>
</fn>
</fn-group>
</back>
</article>