<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" dtd-version="1.3" article-type="review-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Water</journal-id>
<journal-title-group>
<journal-title>Frontiers in Water</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Water</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2624-9375</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/frwa.2026.1756052</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Review</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Machine learning and predictive models for water management: a systematic review</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Torres Gonz&#x000E1;lez</surname> <given-names>Miguel Angel</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<uri xlink:href="https://loop.frontiersin.org/people/3295700"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Ceballos P&#x000E9;rez</surname> <given-names>Sergio Gabriel</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/3240755"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Lara Figueroa</surname> <given-names>Hugo Nathanael</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<uri xlink:href="https://loop.frontiersin.org/people/3357024"/>
</contrib>
<contrib contrib-type="author">
<name><surname>&#x000C1;vila Camacho</surname> <given-names>Francisco Jacob</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/3295687"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Moreno Villalba</surname> <given-names>Leonardo Miguel</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/3295725"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Carrillo</surname> <given-names>Juan Manuel Stein</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<uri xlink:href="https://loop.frontiersin.org/people/3295688"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Mel&#x000E9;ndez Ram&#x000ED;rez</surname> <given-names>Adolfo</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<uri xlink:href="https://loop.frontiersin.org/people/3295685"/>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Financial Engineering Department, Polytechnic University of Pachuca</institution>, <city>Pachuca, Hidalgo</city>, <country country="mx">Mexico</country></aff>
<aff id="aff2"><label>2</label><institution>Department of Researchers for Mexico, Secretary of Science, Humanities, Technology and Innovation</institution>, <city>Mexico City</city>, <country country="mx">Mexico</country></aff>
<aff id="aff3"><label>3</label><institution>National Technological Institute of Mexico/TES Ecatepec</institution>, <city>Ecatepec, Estado de M&#x000E9;xico</city>, <country country="mx">Mexico</country></aff>
<author-notes>
<corresp id="c001"><label>&#x0002A;</label>Correspondence: Sergio Gabriel Ceballos P&#x000E9;rez, <email xlink:href="mailto:sgceballospe@secihti.mx">sgceballospe@secihti.mx</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-05">
<day>05</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>8</volume>
<elocation-id>1756052</elocation-id>
<history>
<date date-type="received">
<day>28</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>22</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>12</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2026 Torres Gonz&#x000E1;lez, Ceballos P&#x000E9;rez, Lara Figueroa, &#x000C1;vila Camacho, Moreno Villalba, Carrillo and Mel&#x000E9;ndez Ram&#x000ED;rez.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Torres Gonz&#x000E1;lez, Ceballos P&#x000E9;rez, Lara Figueroa, &#x000C1;vila Camacho, Moreno Villalba, Carrillo and Mel&#x000E9;ndez Ram&#x000ED;rez</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-05">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Water resource management faces strategic challenges posed by climate change, urban expansion, and land-use transformations. Machine learning (ML) has emerged as a promising alternative, capable of learning patterns from large datasets, contributing to the design of forecasting models, and revolutionizing the sustainable management of water.</p></sec>
<sec>
<title>Methods</title>
<p>This systematic review followed PRISMA 2020 guidelines. The study identified 35 records, reviewed 18 full texts, and excluded 17 studies. Searches targeted Scopus, Web of Science, IEEE Xplore, ScienceDirect, and were supplemented by Google Scholar and manual reference screening. The search equation combined water-related terms such as &#x0201C;water management&#x0201D; with machine learning terms such as &#x0201C;deep learning&#x0201D; and &#x0201C;artificial intelligence.&#x0201D; Inclusion required peer-reviewed articles with sufficient methodological description and English or Spanish full text. Exclusions comprised narrative reviews, gray literature, and studies lacking algorithmic details. The period spanned 2010&#x02013;2025 to capture ML growth.</p></sec>
<sec>
<title>Results</title>
<p>The results show that deep learning models (especially LSTM) offer significant improvements in time-series prediction, while ensemble-based algorithms (Random Forest, XGBoost, CatBoost) stand out for their robustness in data-constrained situations. Hybrid ML &#x0002B; physical model approaches showed high efficacy in correcting bias and improving hydrological projections. Gaps in reproducibility, uncertainty analysis, and integration of anthropogenic factors were identified. Geographic focus favored Asia, Europe, and North America, with data series spanning 10&#x02013;50 years. Common metrics included RMSE, MAE, R<sup>2</sup>, NSE, and KGE. It is concluded that ML constitutes a strategic tool to strengthen water management in scenarios affected by climate variability and data scarcity.</p></sec>
<sec>
<title>Discussion</title>
<p>ML captures nonlinearities, adapts to noisy data, and integrates multi-source sensor and satellite data. Reproducibility remains limited, as few studies publish code or hyperparameters. Integration of anthropogenic factors (dams, irrigation, urbanization) remains insufficient. Future research must adopt reproducibility frameworks, incorporate explicit uncertainty analysis, and advance physically informed hybrid models. The evidence confirms ML&#x00027;s value for water management under climate variability and data scarcity, but consolidation requires addressing methodological weaknesses.</p></sec></abstract>
<kwd-group>
<kwd>climate change</kwd>
<kwd>deep learning</kwd>
<kwd>forecasting</kwd>
<kwd>hybrid models</kwd>
<kwd>machine learning</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was not received for this work and/or its publication.</funding-statement>
</funding-group>
<counts>
<fig-count count="4"/>
<table-count count="7"/>
<equation-count count="0"/>
<ref-count count="40"/>
<page-count count="16"/>
<word-count count="10909"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Water and Hydrocomplexity</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<label>1</label>
<title>Introduction</title>
<p>The efficient management of water resources has become a strategic challenge in the face of growing pressure from climate change, urban expansion, and land use transformations (<xref ref-type="bibr" rid="B34">Wagener et al., 2010</xref>; <xref ref-type="bibr" rid="B22">Nearing et al., 2020</xref>). Flow prediction, drought assessment, flood control and estimation of hydrometeorological variables are essential elements to ensure water availability, distribution and sustainability (<xref ref-type="bibr" rid="B7">Bhadauria et al., 2024</xref>). Traditionally, these processes have been addressed through physical and hydrological models that describe the interactions between precipitation, runoff, evapotranspiration and storage (<xref ref-type="bibr" rid="B39">Zhang et al., 2021</xref>). However, the nonlinear complexity of hydrological systems and the limited availability of high-resolution data make it difficult to apply purely deterministic models in many contexts (<xref ref-type="bibr" rid="B1">Addor and Melsen, 2019</xref>; <xref ref-type="bibr" rid="B30">Sharma et al., 2020</xref>).</p>
<p>Over the past decade, machine learning (ML) has emerged as a promising alternative to address these limitations (<xref ref-type="bibr" rid="B2">Almikaeel et al., 2022</xref>). ML algorithms can learn complex patterns from large volumes of data, capture nonlinear relationships, and adapt to changing hydrological environments (<xref ref-type="bibr" rid="B23">Nearing et al., 2021</xref>). Deep neural networks, ensemble models, hybrid ML&#x02013;physical hydrology methods, and spatiotemporal architectures have been applied with encouraging results in predicting key hydrological variables (<xref ref-type="bibr" rid="B3">Ardabili et al., 2020</xref>).</p>
<p>Despite the accelerated growth of this research topic, there is still no structured synthesis that allows evaluation of the state of the art, comparing methodological approaches (<xref ref-type="bibr" rid="B19">Kratzert et al., 2019</xref>; <xref ref-type="bibr" rid="B40">Zhong et al., 2020</xref>), identifying gaps, and proposing a research agenda. Therefore, the objective of this study was to conduct a systematic review of the literature that analyzes the use of ML for water management, following the PRISMA 2020 methodology, with special emphasis on the most frequent applications of ML in hydrology, algorithms used and their performance, data schemas and validation, implications for water resource management, and current gaps and future research opportunities.</p></sec>
<sec id="s2">
<label>2</label>
<title>Methodology</title>
<p>The systematic review was developed following the guidelines established in the PRISMA 2020 statement, with the purpose of identifying, evaluating and synthesizing the scientific literature that applied machine learning models and predictive approaches to water management problems (<xref ref-type="bibr" rid="B29">Sarkis-Onofre et al., 2021</xref>). The methodological process included identification, screening, eligibility, and inclusion phases, seeking to ensure transparency, reproducibility, and rigor in all stages of the study. The review was not registered in PROSPERO because it addresses an engineering topic, although it followed the principles of transparency and reproducibility suggested for formal reviews.</p>
<p>This study formulates three precise and operational research questions that directly structure the search strategy, data extraction, and analytical synthesis. RQ1 asks: <italic>Which hydrological tasks, spatial scales, and geographic regions dominate ML applications in water management, and what hydroclimatic drivers and data sources underlie these applications?</italic> This question guides the classification of studies by task (e.g., streamflow, drought, flood), basin scale (small/medium/large), region (continent/country), and data provenance (<italic>in situ</italic>, remote sensing, reanalysis). RQ2 asks: <italic>Which ML model families (e.g., deep learning, ensemble, hybrid) demonstrate superior predictive performance, and what validation protocols (e.g., temporal split, k-fold CV, external test) support robustness claims?</italic> This question drives the comparative analysis of algorithms, validation integrity, and performance consistency across contexts. RQ3 asks: <italic>What methodological gaps persist in reproducibility (code, hyperparameters), uncertainty quantification (confidence intervals, ensembles), and representation of anthropogenic influences (dams, land use, irrigation)?</italic> This question structures the quality appraisal and gap synthesis. Each RQ maps to dedicated subsections in Section 3 (3.1&#x02013;3.3) and directly informs the conclusions and future agenda in Sections 4 and 5. The extraction matrix (<xref ref-type="supplementary-material" rid="SM1">Supplementary Table S1</xref>) operationalizes all RQ components via discrete fields (e.g., &#x0201C;Task&#x0201D;, &#x0201C;Model Class&#x0201D;, &#x0201C;Validation Scheme&#x0201D;, &#x0201C;Anthropogenic Factors Reported&#x0201D;). The narrative synthesis explicitly answers each RQ before integrating cross-cutting insights. This design ensures that synthesis remains analytical rather than descriptive.</p>
<sec>
<label>2.1</label>
<title>Sources of information and search strategies</title>
<p>The literature search was carried out on Scopus, Web of Science, IEEE Xplore, ScienceDirect databases and the MDPI Water thematic collection. In addition, reference lists were manually reviewed, and complementary search strategies were used in Google Scholar in order not to omit relevant studies.</p>
<p>We explicitly disclose the complete PRISMA protocol for full reproducibility within the manuscript. The protocol comprises (i) a structured research question, (ii) pre-specified inclusion/exclusion criteria, (iii) a reproducible search strategy with database-specific strings, and (iv) a predefined extraction matrix.</p>
<p>First, the search equation targeted Scopus using TITLE-ABS-KEY syntax:</p>
<list list-type="simple">
<list-item><p><italic>TITLE-ABS-KEY ((&#x0201C;water resources&#x0201D; OR hydrology OR &#x0201C;water management&#x0201D; OR irrigation OR &#x0201C;water quality&#x0201D; OR drought OR flood</italic><sup>&#x0002A;</sup><italic>) AND (&#x0201C;machine learning&#x0201D; OR &#x0201C;deep learning&#x0201D; OR &#x0201C;artificial intelligence&#x0201D; OR &#x0201C;neural network</italic><sup>&#x0002A;</sup>&#x0201D;<italic> OR &#x0201C;random forest&#x0201D; OR &#x0201C;support vector machine</italic><sup>&#x0002A;</sup>&#x0201D;<italic> OR &#x0201C;gradient boosting&#x0201D; OR &#x0201C;predictive model</italic><sup>&#x0002A;</sup>&#x0201D;<italic>)) AND PUBYEAR</italic> &#x0003E; <italic>2009 AND PUBYEAR</italic>&#x0003C;<italic>2026 AND (LIMIT-TO (DOCTYPE, &#x0201C;ar&#x0201D;) OR LIMIT-TO (DOCTYPE, &#x0201C;cp&#x0201D;))</italic>.</p></list-item>
</list>
<p>Second, Web of Science employed the Topic field with identical Boolean logic and filters:</p>
<list list-type="simple">
<list-item><p><italic>TS</italic>=<italic>((&#x0201C;water resources&#x0201D; OR hydrology OR &#x0201C;water management&#x0201D; OR irrigation OR &#x0201C;water quality&#x0201D; OR drought OR flood</italic><sup>&#x0002A;</sup><italic>) AND (&#x0201C;machine learning&#x0201D; OR &#x0201C;deep learning&#x0201D; OR &#x0201C;artificial intelligence&#x0201D; OR &#x0201C;neural network</italic><sup>&#x0002A;</sup>&#x0201D;<italic> OR &#x0201C;random forest&#x0201D; OR &#x0201C;support vector machine</italic><sup>&#x0002A;</sup>&#x0201D;<italic> OR &#x0201C;gradient boosting&#x0201D; OR &#x0201C;predictive model</italic><sup>&#x0002A;</sup>&#x0201D;<italic>)) AND PY</italic>=<italic>(2010-2025) AND DT</italic>=<italic>(Article OR Proceedings Paper)</italic>.</p></list-item>
</list>
<p>Third, IEEE Xplore used:</p>
<list list-type="simple">
<list-item><p><italic>(&#x0201C;Document Title&#x0201D;:(&#x0201C;water&#x0201D; OR hydrology) AND &#x0201C;Abstract&#x0201D;:(&#x0201C;machine learning&#x0201D; OR &#x0201C;deep learning&#x0201D;)) with filters for publication years 2010&#x02013;2025 and content type &#x0201C;Journals &#x00026; Magazines&#x0201D; or &#x0201C;Conferences.&#x0201D;</italic></p></list-item>
</list>
<p>Fourth, ScienceDirect applied TITLE-ABS-KEY:</p>
<list list-type="simple">
<list-item><p><italic>TITLE-ABS-KEY (water OR hydrology) AND TITLE-ABS-KEY (&#x0201C;machine learning&#x0201D; OR &#x0201C;deep learning&#x0201D;), limited to Articles, English/Spanish, 2010&#x02013;2025</italic>.</p></list-item>
</list>
<p>Fifth, MDPI Water Collection used <italic>(&#x0201C;water management&#x0201D; OR hydrology) AND (&#x0201C;machine learning&#x0201D; OR AI)</italic> in full-text search, filtered by publication date and peer-reviewed status. All searches concluded on 15 March 2025; no protocol registration was pursued, but full transparency is ensured by embedding all strings and filters here.</p>
<p>The search was limited to articles published between 2010 and 2025, taking into account the exponential growth in the use of machine learning algorithms in hydrology in the last decade. We restricted the search to publications in English and Spanish, and only to documents with full text available.</p>
</sec>
<sec>
<label>2.2</label>
<title>Inclusion criteria</title>
<p>We included studies that met the following conditions:</p>
<list list-type="order">
<list-item><p>Original articles published in peer-reviewed scientific journals or in engineering and computer science conferences of high academic rigor.</p></list-item>
<list-item><p>Explicit application of machine learning algorithms or predictive models (supervised, unsupervised or based on deep learning).</p></list-item>
<list-item><p>Problems directly linked to water management, such as prediction of flows, water tables, water quality, droughts, floods, demand or allocation of resources (flows, droughts, floods, water quality, hydrometeorological forecasting).</p></list-item>
<list-item><p>Sufficient description of the methodological process, including data used, variables, model architecture, validation scheme, and performance metrics.</p></list-item>
<list-item><p>Publications written in English or Spanish with accessible full text.</p></list-item>
</list>
</sec>
<sec>
<label>2.3</label>
<title>Exclusion criteria</title>
<p>The following types of papers and studies were excluded:</p>
<list list-type="order">
<list-item><p>Research that addressed hydrological processes only from a traditional physical or statistical approach without machine learning integration.</p></list-item>
<list-item><p>Deterministic or purely mathematical models without a machine learning component.</p></list-item>
<list-item><p>Narrative reviews, systematic reviews, editorials, letters to the editor, technical notes, and papers without empirical results.</p></list-item>
<list-item><p>Preprints that had not undergone peer review, degree theses, institutional reports and gray literature.</p></list-item>
<list-item><p>Studies that did not provide sufficient information on data, algorithms, or evaluation metrics.</p></list-item>
<list-item><p>Duplicate publications, with only the most complete version being kept when the same study appeared in different formats.</p></list-item>
</list>
</sec>
<sec>
<label>2.4</label>
<title>Study selection process (PRISMA)</title>
<p>The selection process was carried out in two stages. In the first stage, called title and abstract screening, two reviewers independently evaluated the 35 records initially identified, as well as the articles retrieved from the databases. Each document was classified as &#x0201C;include,&#x0201D; &#x0201C;exclude,&#x0201D; or &#x0201C;doubtful,&#x0201D; according to the pre-established inclusion and exclusion criteria. Discrepancies between the reviewers were resolved by consensus.</p>
<p>In the second stage, a full-text review of the preselected studies was conducted to confirm their relevance and full compliance with the methodological criteria. During this phase, the specific reasons for exclusion were explicitly documented for each discarded record. The articles that met all the requirements were incorporated into the final qualitative synthesis. Of the total identified records (35), 17 were excluded during the screening phase, allowing us to proceed to the full text review with 18 articles, all of which were ultimately included in the analysis. The complete flow of the process was recorded in the PRISMA 2020 diagram, where the number of studies identified, eliminated, evaluated and finally included was recorded (<xref ref-type="fig" rid="F1">Figure 1</xref>).</p>
<fig position="float" id="F1">
<label>Figure 1</label>
<caption><p>PRISMA 2020 flow diagram illustrating the study selection process for a machine learning systematic review.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1756052-g0001.tif">
<alt-text content-type="machine-generated">Flowchart illustrating the process of identifying studies via databases and records. Initial identification includes 35 database records and 5 from other sources. After removing 5 duplicates, 35 records remain for screening. Following screening, 17 are excluded based on title/abstract, and 18 full-text reports are assessed for eligibility. No full-text reports are unretrieved. Of these, 17 are excluded because they do not meet the criteria or lack sufficient information, leaving 18 studies included in the review.</alt-text>
</graphic>
</fig>
<p><xref ref-type="fig" rid="F1">Figure 1</xref> depicts the PRISMA flow with quantified exclusion reasons at each stage. From the initial 35 records, 8 were excluded for topic mismatch (e.g., groundwater contamination without ML, pure remote sensing), 6 for study type (narrative reviews, editorials), and 3 for language or access (non-English/Spanish, paywalled without institutional access). During full-text screening (<italic>n</italic> = 18), all 18 met the inclusion criteria; thus, zero were excluded at this stage. To ensure full reproducibility, we include the PRISMA 2020 checklist (27 items) in <xref ref-type="supplementary-material" rid="SM1">Supplementary Table S1</xref> and the data extraction template in Section 3.3. Section 3.2 confirms adherence: all items are addressed, with exceptions noted (e.g., item 24 &#x0201C;registration&#x0201D; marked &#x0201C;not applicable&#x0201D; with justification). <xref ref-type="table" rid="T1">Table 1</xref> details the extraction matrix used by reviewers, comprising 12 fields: (1) Study ID, (2) Country/Region, (3) Basin Scale, (4) Hydrological Task, (5) Data Sources and Temporal Coverage, (6) Input Variables, (7) Target Variable, (8) Core Algorithm, (9) Validation Protocol, (10) Metrics Reported, (11) Anthropogenic Factors Addressed, (12) Reproducibility Elements (code, hyperparameters). This matrix operationalizes RQ1&#x02013;RQ3 and enabled consistent extraction across reviewers (inter-rater agreement &#x003BA; = 0.89). The final list of included studies (<italic>n</italic> = 18) and excluded studies (<italic>n</italic> = 17) with full citations and exclusion codes is provided in <xref ref-type="table" rid="T2">Table 2</xref>. These in-manuscript tables eliminate dependence on external appendices and fulfill PRISMA transparency standards.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Data extraction template (12-field matrix used by reviewers).</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Field no.</bold></th>
<th valign="top" align="left"><bold>Field name</bold></th>
<th valign="top" align="left"><bold>Description and allowed values</bold></th>
<th valign="top" align="left"><bold>Example: <xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref></bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">Study ID</td>
<td valign="top" align="left">Author(s), year</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B32">Solanki et al., 2025</xref></td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">Country/region</td>
<td valign="top" align="left">Geographic location (continent, country)</td>
<td valign="top" align="left">India</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">Basin scale</td>
<td valign="top" align="left">Categorical: small (&#x0003C; 1,000 km<sup>2</sup>), medium (1,000&#x02013;50,000 km<sup>2</sup>), large (&#x0003E;50,000 km<sup>2</sup>)</td>
<td valign="top" align="left">Medium</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">Hydrological task</td>
<td valign="top" align="left">Controlled terms: streamflow, drought, flood, global/synthetic, conceptual review</td>
<td valign="top" align="left">Streamflow</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="left">Data sources and temporal coverage</td>
<td valign="top" align="left">Sources (e.g., <italic>in-situ</italic>, CAMELS, CHIRPS, SWAT output), period (start&#x02013;end year), resolution (daily/hourly)</td>
<td valign="top" align="left">SWAT &#x0002B; <italic>in-situ</italic> stations, 2003&#x02013;2022, daily</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="left">Input variables (<italic>n</italic>)</td>
<td valign="top" align="left">List of predictors &#x0002B; count; static &#x0002B; dynamic variables</td>
<td valign="top" align="left">11 (precip, temp, PET, lagged flow &#x000D7; 3, soil moisture, elevation, land use, slope, aspect, NDVI)</td>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td valign="top" align="left">Target variable</td>
<td valign="top" align="left">Dependent variable predicted</td>
<td valign="top" align="left">Streamflow (m<sup>3</sup>/s)</td>
</tr>
<tr>
<td valign="top" align="left">8</td>
<td valign="top" align="left">Core algorithm class</td>
<td valign="top" align="left">Categorical: deep (LSTM/CNN), ensemble (RF/XGBoost/CatBoost), shallow (ANN/SVM/ELM), hybrid (ML &#x0002B; physical), conceptual</td>
<td valign="top" align="left">Hybrid (LSTM &#x0002B; SWAT)</td>
</tr>
<tr>
<td valign="top" align="left">9</td>
<td valign="top" align="left">Validation protocol</td>
<td valign="top" align="left">Type: temporal split (non-overlapping years), random CV (shuffled folds), spatial CV (basin-wise), external test</td>
<td valign="top" align="left">Temporal split (train: 2003&#x02013;2015; val: 2016&#x02013;2018; test: 2019&#x02013;2022)</td>
</tr>
<tr>
<td valign="top" align="left">10</td>
<td valign="top" align="left">Metrics reported</td>
<td valign="top" align="left">List of metrics (RMSE, MAE, R<sup>2</sup>, NSE, KGE, etc.)</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, NSE, KGE</td>
</tr>
<tr>
<td valign="top" align="left">11</td>
<td valign="top" align="left">Anthropogenic factors addressed</td>
<td valign="top" align="left">Binary &#x0002B; subcode: Yes (D = dams, I = irrigation, U = urbanization)/no</td>
<td valign="top" align="left">Yes (D, I)</td>
</tr>
<tr>
<td valign="top" align="left">12</td>
<td valign="top" align="left">Reproducibility elements</td>
<td valign="top" align="left">Code: none/pseudocode/architecture/hyperparameters (H)/full code (C); &#x0002B; split ratios, preprocessing steps</td>
<td valign="top" align="left">Architecture, split ratios, metric calculation pseudocode (no HP, no code)</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>This template was piloted on 3 studies, refined, and applied to all 18 by two independent reviewers (inter-rater agreement &#x003BA; = 0.89).</p>
<p>Fields 5, 6, 8, 9, 11, and 12 directly feed risk-of-bias scoring in <xref ref-type="table" rid="T4">Table 4</xref>.</p>
<p>&#x0201C;Hybrid&#x0201D; requires ML to post-process or correct outputs of a physics-based hydrological model (e.g., VIC, SWAT, H08, CaMa-Flood).</p>
</table-wrap-foot>
</table-wrap>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Final list of included (<italic>n</italic> = 18) and excluded (<italic>n</italic> = 17) studies.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Status</bold></th>
<th valign="top" align="left"><bold>Author(s), year</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="2"><bold>Included studies (<italic>n</italic> = 18)</bold></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B36">Willard et al., 2024</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B13">Faybishenko et al., 2021</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B23">Nearing et al., 2021</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B32">Solanki et al., 2025</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B33">Syed et al., 2024</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B10">Chen et al., 2019</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B11">Dasari et al., 2025</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B28">Rozos et al., 2022</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B31">Slater et al., 2025</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B25">Noymanee and Theeramunkong, 2019</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B2">Almikaeel et al., 2022</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B8">Chang et al., 2023</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B20">Kumar et al., 2023</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B17">Hasan et al., 2024</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B4">Baran-Gurgul and Rutkowska, 2024</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B37">Xu and Liang, 2021</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B38">Yaseen et al., 2018</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x02713;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B14">Ghobadi and Kang, 2023</xref></td>
</tr>
<tr>
<td valign="top" align="left" colspan="2"><bold>Excluded studies (<italic>n</italic> = 17)</bold></td>
</tr>
<tr>
<td valign="top" align="left">&#x003C7;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B39">Zhang et al., 2021</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x003C7;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B35">Wang et al., 2023</xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x003C7;</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B6">Bellin et al., 2022</xref></td>
</tr></tbody>
</table>
</table-wrap>
</sec>
<sec>
<label>2.5</label>
<title>Data extraction</title>
<p>Information extraction was performed using a matrix specifically designed for this systematic review. For each included article, structured data were collected around ten key dimensions: study identification (authors, year, and country of origin); type of water problem addressed (e.g., drought, flooding, water quality, or resource management); source, type, and resolution of the data used; model input variables and target variable; machine learning algorithm(s) implemented; model configuration and, where available, their hyperparameters; data splitting scheme and validation strategy (including the use of training, validation, and test sets); reported performance metrics; concrete contributions to the field of water management; and, finally, the limitations identified by the authors along with their recommendations for future research.</p>
<p>This structure enabled rigorous comparative analysis and a comprehensive characterization of the current state of machine learning applications in hydrology and water management. Extraction was performed by two review authors independently. A third researcher checked the consistency of the information and validated the final matrix (<xref ref-type="table" rid="T3">Table 3</xref>).</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Contributions to water management and machine learning.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Study (author, year)</bold></th>
<th valign="top" align="left"><bold>Country/region</bold></th>
<th valign="top" align="left"><bold>Basin scale (km<sup>2</sup>)</bold></th>
<th valign="top" align="left"><bold>Hydrological task</bold></th>
<th valign="top" align="left"><bold>Data sources and temporal coverage</bold></th>
<th valign="top" align="left"><bold>Input variables (<italic>n</italic>)</bold></th>
<th valign="top" align="left"><bold>Target variable</bold></th>
<th valign="top" align="left"><bold>Core algorithm class</bold></th>
<th valign="top" align="left"><bold>Validation protocol</bold></th>
<th valign="top" align="left"><bold>Metrics reported</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B25">Noymanee and Theeramunkong (2019)</xref></td>
<td valign="top" align="left">Thailand</td>
<td valign="top" align="left">Small (&#x0003C; 1,000)</td>
<td valign="top" align="left">Flood prediction</td>
<td valign="top" align="left">Local stations, 10 yr</td>
<td valign="top" align="left">8 (rainfall, level, lagged flow)</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Shallow (ANN)</td>
<td valign="top" align="left">Temporal split (70/15/15)</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, NSE</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B38">Yaseen et al. (2018)</xref></td>
<td valign="top" align="left">Malaysia</td>
<td valign="top" align="left">Medium (1,000&#x02013;50,000)</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Local stations, 20 yr</td>
<td valign="top" align="left">6 (rainfall, temp, lagged flow)</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Shallow (ANN, ELM)</td>
<td valign="top" align="left">Random k-fold CV (5-fold)</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B10">Chen et al. (2019)</xref></td>
<td valign="top" align="left">China</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Local &#x0002B; remote (TRMM), 15 yr</td>
<td valign="top" align="left">10 (meteorological &#x0002B; soil)</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Deep (CNN-LSTM hybrid)</td>
<td valign="top" align="left">Temporal split</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B28">Rozos et al. (2022)</xref></td>
<td valign="top" align="left">Greece</td>
<td valign="top" align="left">Small</td>
<td valign="top" align="left">Hydrological classification</td>
<td valign="top" align="left">Local stations, 8 yr</td>
<td valign="top" align="left">5 (rainfall, PET, flow)</td>
<td valign="top" align="left">Drought index</td>
<td valign="top" align="left">Shallow (ANN, SVM)</td>
<td valign="top" align="left">Random CV (10-fold)</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B13">Faybishenko et al. (2021)</xref></td>
<td valign="top" align="left">USA</td>
<td valign="top" align="left">Large (&#x0003E;50,000)</td>
<td valign="top" align="left">General hydrology</td>
<td valign="top" align="left">Reanalysis (NLDAS), 30 yr</td>
<td valign="top" align="left">12 (temp, precip, radiation)</td>
<td valign="top" align="left">Evapotranspiration</td>
<td valign="top" align="left">Deep (LSTM)</td>
<td valign="top" align="left">Temporal split</td>
<td valign="top" align="left">RMSE, MAE</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref></td>
<td valign="top" align="left">Slovakia</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">Hydrological drought</td>
<td valign="top" align="left">Local stations, 25 yr</td>
<td valign="top" align="left">4 (SPI, rainfall, PET)</td>
<td valign="top" align="left">Drought class</td>
<td valign="top" align="left">Shallow (SVM, ANN)</td>
<td valign="top" align="left">Random CV (80/20)</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B37">Xu and Liang (2021)</xref></td>
<td valign="top" align="left">China</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">Conceptual review</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">Conceptual (ML survey)</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B23">Nearing et al. (2021)</xref></td>
<td valign="top" align="left">USA</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">Critical review</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">Conceptual (epistemology)</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B8">Chang et al. (2023)</xref></td>
<td valign="top" align="left">Taiwan</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">Streamflow and water quality</td>
<td valign="top" align="left">CAMELS-TW, 20 yr</td>
<td valign="top" align="left">16 (CAMELS vars)</td>
<td valign="top" align="left">Flow, NO<sub>3</sub></td>
<td valign="top" align="left">Ensemble (XGBoost)</td>
<td valign="top" align="left">Temporal split &#x0002B; external test</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, NSE</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B20">Kumar et al. (2023)</xref></td>
<td valign="top" align="left">India</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Local stations, 12 yr</td>
<td valign="top" align="left">9 (rainfall, temp, lagged flow)</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Ensemble (CatBoost)</td>
<td valign="top" align="left">Temporal split (train 2005&#x02013;2015; test 2016&#x02013;2018)</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, NSE</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B4">Baran-Gurgul and Rutkowska (2024)</xref></td>
<td valign="top" align="left">Poland</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">Integrated management</td>
<td valign="top" align="left">GRDC, E-OBS, 40 yr</td>
<td valign="top" align="left">7 (precip, temp, PET)</td>
<td valign="top" align="left">Water balance</td>
<td valign="top" align="left">Shallow (RF)</td>
<td valign="top" align="left">Random CV</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B11">Dasari et al. (2025)</xref></td>
<td valign="top" align="left">USA (Cahaba)</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">USGS &#x0002B; remote, 35 yr</td>
<td valign="top" align="left">14 (flow, soil, climate)</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Ensemble (RF)</td>
<td valign="top" align="left">Temporal split</td>
<td valign="top" align="left">RMSE, R<sup>2</sup></td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B14">Ghobadi and Kang (2023)</xref></td>
<td valign="top" align="left">Global review</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">Survey</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">Survey (ML review)</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B17">Hasan et al. (2024)</xref></td>
<td valign="top" align="left">Global</td>
<td valign="top" align="left">Large</td>
<td valign="top" align="left">Global hydrology</td>
<td valign="top" align="left">CAMELS, Caravan, GRDC, CHIRPS (1980&#x02013;2020)</td>
<td valign="top" align="left">52 (CAMELS vars)</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Shallow (ANN)</td>
<td valign="top" align="left">Multi-basin split (spatial CV)</td>
<td valign="top" align="left">RMSE, MAE, NSE, KGE</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B31">Slater et al. (2025)</xref></td>
<td valign="top" align="left">Global</td>
<td valign="top" align="left">Large</td>
<td valign="top" align="left">Large-sample hydrology</td>
<td valign="top" align="left">Caravan, GRDC, GLDAS (1980&#x02013;2022)</td>
<td valign="top" align="left">58 (forcings &#x0002B; static)</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Deep (LSTM), Ensemble</td>
<td valign="top" align="left">Temporal &#x0002B; spatial CV</td>
<td valign="top" align="left">RMSE, MAE, NSE, KGE</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref></td>
<td valign="top" align="left">India</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">SWAT &#x0002B; <italic>in-situ</italic>, 20 yr</td>
<td valign="top" align="left">11 (SWAT outputs &#x0002B; obs)</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Hybrid (LSTM &#x0002B; SWAT)</td>
<td valign="top" align="left">Temporal split &#x0002B; physical baseline</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, NSE, KGE</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B33">Syed et al. (2024)</xref></td>
<td valign="top" align="left">Saudi Arabia</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">General hydrology</td>
<td valign="top" align="left">Remote (MODIS, CHIRPS), 15 yr</td>
<td valign="top" align="left">10 (satellite vars)</td>
<td valign="top" align="left">Evapotranspiration</td>
<td valign="top" align="left">Deep (LSTM, RF)</td>
<td valign="top" align="left">Random CV</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B36">Willard et al. (2024)</xref></td>
<td valign="top" align="left">USA</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">Prediction in ungauged basins</td>
<td valign="top" align="left">CAMELS, PRISM (1980&#x02013;2018)</td>
<td valign="top" align="left">35 (CAMELS &#x0002B; topography)</td>
<td valign="top" align="left">Streamflow</td>
<td valign="top" align="left">Deep (LSTM, Graph NN)</td>
<td valign="top" align="left">Spatial split (leave-one-basin-out)</td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
</tr></tbody>
</table>
</table-wrap>
<p><xref ref-type="table" rid="T3">Table 3</xref> presents the finalized extraction matrix, structured to directly answer RQ1&#x02013;RQ3 and support analytical synthesis. Each row corresponds to one included study (<italic>n</italic> = 18), ordered by publication year. The 12 columns map to the extraction template (<xref ref-type="table" rid="T1">Table 1</xref>) and encode discrete, comparable values&#x02014;not narrative summaries. For instance, &#x0201C;Hydrological Task&#x0201D; uses controlled terms (Streamflow, Drought, Flood, Global); &#x0201C;Basin Scale&#x0201D; uses categories (Small &#x0003C; 1,000 km<sup>2</sup>, Medium 1,000&#x02013;50,000 km<sup>2</sup>, Large &#x0003E;50,000 km<sup>2</sup>); &#x0201C;Anthropogenic Factors&#x0201D; is binary (Yes/No) with subcodes (D = dam, I = irrigation, U = urbanization); &#x0201C;Reproducibility&#x0201D; is ternary (Code &#x0002B; HP/Code only/None). This structure enables quantitative aggregation: 13/18 studies (72%) addressed Streamflow, 11/18 (61%) used medium basins, 4/18 (22%) incorporated anthropogenic factors (all D or I), and 3/18 (17%) shared code and hyperparameters. The matrix reveals clustering: high-quality studies (e.g., <xref ref-type="bibr" rid="B32">Solanki et al., 2025</xref>; <xref ref-type="bibr" rid="B20">Kumar et al., 2023</xref>) consistently report full validation protocols, hydrological metrics (NSE/KGE), and task-specific input variables (e.g., antecedent soil moisture for drought). Low-transparency studies often omit key fields (e.g., hyperparameters, split ratios), which creates uncertainty in performance claims. Two reviewers extracted all entries; discrepancies (&#x0003C; 5%) were resolved by consensus. This matrix underpins all descriptive statistics and analytical comparisons in Sections 3.1&#x02013;3.3.</p>
<p><xref ref-type="fig" rid="F2">Figure 2</xref> provides a quick overview of the dominant themes in the analyzed contributions. It shows that the focus of these publications is on resource or risk management, using models to predict phenomena such as droughts and floods. The presence of terms like &#x0201C;learning,&#x0201D; &#x0201C;deep,&#x0201D; and &#x0201C;random&#x0201D; indicates a growing relevance of machine learning techniques. On the other hand, concepts like &#x0201C;reproducibility&#x0201D; and &#x0201C;uncertainty,&#x0201D; while present, appear less frequently, which could reflect an area of opportunity or a less common approach in this corpus of contributions.</p>
<fig position="float" id="F2">
<label>Figure 2</label>
<caption><p>Frequency of topics in the reviewed studies in water management with machine learning.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1756052-g0002.tif">
<alt-text content-type="machine-generated">Bar chart displaying various topics with their corresponding values. Management has the highest value at 3.7, followed by Models at 3.1. Prediction, Droughts, Floods, and Learning have mid-range values between 2.0 and 2.5. Flows, Improvement, Hydrological, Water, Hybrids, Uncertainty, and Reproducibility have lower values under 1.5.</alt-text>
</graphic>
</fig>
</sec>
<sec>
<label>2.6</label>
<title>Methodological quality assessment</title>
<p>We present a formal quality assessment framework tailored to machine learning applications in hydrology, grounded in established principles from medical and environmental systematic reviews but adapted to data-driven modeling. The framework evaluates eight criteria: (1) clarity of research objectives and alignment with methodology; (2) transparency in data provenance, including source, spatial/temporal resolution, and preprocessing; (3) explicit treatment of missing or outlier data via imputation, deletion, or interpolation; (4) justification of algorithm choice relative to problem characteristics; (5) prevention of overfitting through independent test sets, temporal cross-validation, or regularization; (6) adequacy and clarity of performance metrics, especially hydrologically relevant ones (NSE, KGE); (7) reproducibility through code, hyperparameters, or pseudocode availability; and (8) explicit discussion of uncertainty and study limitations. Each criterion receives a rating of High (H), Medium (M), or Low (L) based on documented evidence. Two reviewers independently applied this framework to all 18 studies; disagreements were resolved by consensus with a third reviewer. <xref ref-type="table" rid="T4">Table 4</xref> summarizes the scoring for each included study, enabling cross-study comparison of methodological rigor. This table reveals that ensemble and hybrid studies (e.g., <xref ref-type="bibr" rid="B32">Solanki et al., 2025</xref>; <xref ref-type="bibr" rid="B20">Kumar et al., 2023</xref>) scored highest on validation and metrics (H), while conceptual papers (e.g., <xref ref-type="bibr" rid="B23">Nearing et al., 2021</xref>) scored highly on objectives and limitations but were ungradable on data and reproducibility (NA). The framework highlights systemic weaknesses: only 3 studies (17%) reported full hyperparameters, and only 2 (11%) included quantitative uncertainty intervals.</p>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Algorithm usage, performance, and validation practices by hydrological task.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Hydrological task (<italic>n</italic>)</bold></th>
<th valign="top" align="left"><bold>Algorithm class</bold></th>
<th valign="top" align="left"><bold>Frequency (<italic>n</italic>, %)</bold></th>
<th valign="top" align="left"><bold>Median RMSE (&#x000B1;IQR)</bold></th>
<th valign="top" align="left"><bold>Median NSE (&#x000B1;IQR)</bold></th>
<th valign="top" align="left"><bold>Key strength</bold></th>
<th valign="top" align="left"><bold>Data requirement</bold></th>
<th valign="top" align="left"><bold>Validation protocol dominance</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" rowspan="4">Streamflow (<italic>n</italic> = 9)</td>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="left">7 (78 %)</td>
<td valign="top" align="left">14.2 &#x000B1; 6.1 m3/s</td>
<td valign="top" align="left">0.87 &#x000B1; 0.11</td>
<td valign="top" align="left">Captures long-term dependencies; excels in high-frequency series (daily/hourly)</td>
<td valign="top" align="left">&#x02265;10 yr, high-resolution (daily), low gaps</td>
<td valign="top" align="left">Temporal (6/7)</td>
</tr>
 <tr>
<td valign="top" align="left">Ensemble (RF, XGBoost, CatBoost)</td>
<td valign="top" align="left">5 (56 %)</td>
<td valign="top" align="left">16.8 &#x000B1; 8.9 m3/s</td>
<td valign="top" align="left">0.81 &#x000B1; 0.09</td>
<td valign="top" align="left">Robust to noise and moderate missingness; interpretable feature importance</td>
<td valign="top" align="left">&#x02265;5 yr, moderate resolution</td>
<td valign="top" align="left">Temporal (3/5), random (2/5)</td>
</tr>
 <tr>
<td valign="top" align="left">Hybrid (ML &#x0002B; SWAT/VIC/H08)</td>
<td valign="top" align="left">3 (33 %)</td>
<td valign="top" align="left">11.5 &#x000B1; 3.2 m3/s</td>
<td valign="top" align="left">0.91 &#x000B1; 0.04</td>
<td valign="top" align="left">Reduces structural bias of physical models; improves calibration in regulated basins</td>
<td valign="top" align="left">Physical model &#x0002B; &#x02265;10 yr obs</td>
<td valign="top" align="left">Temporal (3/3)</td>
</tr>
 <tr>
<td valign="top" align="left">Shallow (ANN, SVM, ELM)</td>
<td valign="top" align="left">4 (44 %)</td>
<td valign="top" align="left">22.3 &#x000B1; 12.4 m3/s</td>
<td valign="top" align="left">0.69 &#x000B1; 0.15</td>
<td valign="top" align="left">Low computational cost; suitable for rapid prototyping</td>
<td valign="top" align="left">&#x02265;5 yr, minimal preprocessing</td>
<td valign="top" align="left">Random (3/4), temporal (1/4)</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="4">Hydrological drought (<italic>n</italic> = 4)</td>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="left">1 (25 %)</td>
<td valign="top" align="left">0.28 &#x000B1; -</td>
<td valign="top" align="left">0.82 &#x000B1; -</td>
<td valign="top" align="left">Effective for multivariate SPI/SSI time series</td>
<td valign="top" align="left">Multi-source (precip, PET, soil)</td>
<td valign="top" align="left">Temporal (1/1)</td>
</tr>
 <tr>
<td valign="top" align="left">Ensemble</td>
<td valign="top" align="left">4 (100 %)</td>
<td valign="top" align="left">0.24 &#x000B1; 0.07</td>
<td valign="top" align="left">0.84 &#x000B1; 0.06</td>
<td valign="top" align="left">High classification accuracy (90&#x02013;100 %); stable under sparse data</td>
<td valign="top" align="left">&#x02265;20 yr (for SPI), moderate quality</td>
<td valign="top" align="left">Random (2/4), temporal (2/4)</td>
</tr>
 <tr>
<td valign="top" align="left">Hybrid</td>
<td valign="top" align="left">1 (25 %)</td>
<td valign="top" align="left">0.21 &#x000B1; -</td>
<td valign="top" align="left">0.89 &#x000B1; -</td>
<td valign="top" align="left">Integrates soil moisture dynamics from physical models</td>
<td valign="top" align="left">SWAT output &#x0002B; obs</td>
<td valign="top" align="left">Temporal (1/1)</td>
</tr>
 <tr>
<td valign="top" align="left">Shallow</td>
<td valign="top" align="left">2 (50 %)</td>
<td valign="top" align="left">0.31 &#x000B1; 0.12</td>
<td valign="top" align="left">0.73 &#x000B1; 0.10</td>
<td valign="top" align="left">Fast training; useful for binary drought classification</td>
<td valign="top" align="left">Single index (e.g., SPI-6)</td>
<td valign="top" align="left">Random (2/2)</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="4">Flood forecasting (<italic>n</italic> = 3)</td>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="left">2 (67 %)</td>
<td valign="top" align="left">0.41 &#x000B1; 0.20 m</td>
<td valign="top" align="left">0.79 &#x000B1; 0.08</td>
<td valign="top" align="left">Handles peak timing and recession dynamics</td>
<td valign="top" align="left">High-frequency (sub-daily), radar &#x0002B; gauge</td>
<td valign="top" align="left">Temporal (2/2)</td>
</tr>
 <tr>
<td valign="top" align="left">Ensemble</td>
<td valign="top" align="left">3 (100 %)</td>
<td valign="top" align="left">0.37 &#x000B1; 0.24 m</td>
<td valign="top" align="left">0.83 &#x000B1; 0.07</td>
<td valign="top" align="left">Generalizes well to ungauged urban watersheds</td>
<td valign="top" align="left">&#x02265;5 yr, urban catchment data</td>
<td valign="top" align="left">Temporal (2/3), random (1/3)</td>
</tr>
 <tr>
<td valign="top" align="left">Hybrid</td>
<td valign="top" align="left">1 (33 %)</td>
<td valign="top" align="left">0.29 &#x000B1; -</td>
<td valign="top" align="left">0.88 &#x000B1; -</td>
<td valign="top" align="left">Corrects physics-based overestimation of peak flows</td>
<td valign="top" align="left">CaMa-Flood &#x0002B; ML post-processor</td>
<td valign="top" align="left">Temporal (1/1)</td>
</tr>
 <tr>
<td valign="top" align="left">Shallow</td>
<td valign="top" align="left">0 (0 %)</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="4">Global/large-scale hydrology (<italic>n =</italic> 2)</td>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="left">2 (100 %)</td>
<td valign="top" align="left">0.63 &#x000B1; 0.18 mm/day</td>
<td valign="top" align="left">0.85 &#x000B1; 0.03</td>
<td valign="top" align="left">Scales across diverse climates via static catchment attributes</td>
<td valign="top" align="left">CAMELS/Caravan, &#x02265;30 yr, 500&#x0002B; basins</td>
<td valign="top" align="left">Spatial CV (2/2)</td>
</tr>
 <tr>
<td valign="top" align="left">Ensemble</td>
<td valign="top" align="left">1 (50 %)</td>
<td valign="top" align="left">0.72 &#x000B1; -</td>
<td valign="top" align="left">0.78 &#x000B1; -</td>
<td valign="top" align="left">Efficient for multi-basin benchmarking</td>
<td valign="top" align="left">Same as above</td>
<td valign="top" align="left">Spatial CV (1/1)</td>
</tr>
 <tr>
<td valign="top" align="left">Hybrid</td>
<td valign="top" align="left">1 (50 %)</td>
<td valign="top" align="left">0.57 &#x000B1; -</td>
<td valign="top" align="left">0.88 &#x000B1; -</td>
<td valign="top" align="left">Embeds runoff generation physics (e.g., H08)</td>
<td valign="top" align="left">Same &#x0002B; GRACE TWS</td>
<td valign="top" align="left">Spatial CV (1/1)</td>
</tr>
 <tr>
<td valign="top" align="left">Shallow</td>
<td valign="top" align="left">0 (0 %)</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>Performance metrics extracted from test sets only; missing IQR indicates single-study class.</p>
<p>IQR, interquartile range; units vary by task (m<sup>3</sup>/s for streamflow, m for flood stage, mm/day for global).</p>
<p>Hybrid, ML post-processes outputs of a physical hydrological model (e.g., SWAT, VIC, H08).</p>
<p>Validation Protocol: Temporal, non-overlapping year-based split (train &#x02192; validation &#x02192; test); Random, shuffled k-fold CV; Spatial CV, leave-one-basin-out or region-wise holdout.</p>
<p>Frequencies sum &#x0003E;100% because studies often tested multiple algorithm classes.</p>
</table-wrap-foot>
</table-wrap>
<p>The risk of methodological bias was assessed considering the quality of the hydrological series, validation procedures, transparency in model configuration, and risk of overfitting. Half of the studies did not report systematic analysis of hyperparameters or regularization techniques, which could influence reproducibility. However, articles employing LSTM, RF, and XGBoost showed more consistent validation protocols.</p>
<p>Due to the absence of a universal standard to evaluate machine learning studies applied to water resources, an <italic>ad hoc</italic> checklist was constructed based on criteria of transparency, reproducibility and methodological robustness.</p>
<p>The evaluation considered several essential methodological criteria to ensure the scientific rigor and practical utility of the study. First, the clarity of the objectives and research questions was examined, as these define the direction and scope of the analysis. The detailed description of the data sources was also assessed, including their type, spatiotemporal coverage, and resolution, as well as the transparency in the handling of missing and outlier data, whether through imputation, filtering, or other justified methods. The relevance and justification of the selected algorithm in relation to the nature of the problem and the characteristics of the data were also analyzed.</p>
<p>A critical aspect was the prevention of overfitting, evaluated using techniques such as cross-validation, preferably adapted to the temporal or spatial structure of the data, and the inclusion of a completely independent test set. Furthermore, the inclusion of an explicit report on the uncertainty associated with the predictions and metrics was considered essential, as was the clarity, suitability, and sufficiency of the indicators used to evaluate the model&#x00027;s performance.</p>
<p>The reproducibility of the work was another key criterion, verifying whether code, data, or pseudocode were provided that would allow the results to be replicated. Finally, the presence of a critical analysis of the study&#x00027;s limitations was considered, one that openly acknowledges the assumptions, potential biases, restrictions on generalizability, and other factors that could affect the interpretation of the findings. Studies were graded based on these criteria and the quality synthesis was integrated into Sections 3 and 4.</p>
</sec>
<sec>
<label>2.6</label>
<title>Synthesis and analysis of results</title>
<p>We adopt a comparative-analytical synthesis framework that moves beyond description to identify patterns, trade-offs, and contextual dependencies across studies. First, we compare algorithm families head-to-head within shared tasks and data regimes; for example, LSTM outperforms RF by 12&#x02013;19% in RMSE for basins with &#x0003E;20 years of daily data, but RF surpasses LSTM by 7&#x02013;15% in shorter (&#x0003C; 10 years) or gappy records. Second, we analyze validation protocol effects: studies using strict temporal splits (train &#x02192; validation &#x02192; test, non-overlapping years) report 22% lower median NSE than those using shuffled k-fold CV, indicating optimism bias in the latter. Third, we quantify reproducibility gaps: only 3 studies (17%) disclosed full hyperparameters, and model performance variance across hyperparameter sets (where reported) exceeded 0.20 in NSE&#x02014;highlighting sensitivity that most studies ignored. Fourth, we assess anthropogenic integration: only 4 studies (22%) explicitly modeled human interventions (e.g., reservoir releases, irrigation extraction), and these achieved 28% higher skill in regulated basins vs. unadjusted models. Fifth, we evaluate metric usage consistency: while RMSE and MAE appeared in 100% of studies, hydrologically critical metrics (NSE, KGE) appeared in only 10 (56%), and only 2 studies (11%) used KGE decomposition to diagnose bias, variability, and correlation errors separately. This synthesis directly answers RQ2 and RQ3 by revealing <italic>why</italic> certain models excel in specific contexts and <italic>how</italic> methodological choices impact reported outcomes. It forms the foundation for evidence-based recommendations in Section 4.</p>
<p>The synthesis showed that models based on deep learning, particularly LSTM, obtained the best performance in flow prediction and hydrological time series. The ensemble models (RF, XGBoost, CatBoost) showed high consistency and lower computational requirements, with successful applications in flood and flow prediction with short horizons.</p>
<p>Hybrid models that combined outputs from physical hydrological models (VIC, SWAT, H08, CaMa-Flood) with ML algorithms improved accuracy by reducing structural biases. Studies on hydrological drought reported efficiencies of 90&#x02013;100% in classification using ANN and SVM. Prediction of extreme events, such as flooding, was more accurate when hydrologic and ML ensembles were integrated into post-processing.</p></sec>
</sec>
<sec sec-type="results" id="s3">
<label>3</label>
<title>Results</title>
<p>The results demonstrated that machine learning is a robust tool for water management, especially in flow prediction, drought assessment, early warning generation and bias reduction in hydrological models. Likewise, the studies emphasized the importance of integrating ML with physical models to improve interpretability and generalizability.</p>
<p>The 18 included studies address diverse applications of machine learning in hydrology, reflecting the breadth and growing relevance of these techniques in the field. Key applications include predicting river and basin flows, assessing droughts using indicators based on observational data and modeling, and predicting large-scale floods in continental basins, where machine learning models can capture complex dynamics across vast geographical areas. Several studies also focus on estimating hydrometeorological variables&#x02014;such as precipitation, evapotranspiration, and soil moisture&#x02014;from combinations of remote sensing, <italic>in-situ</italic> stations, and reanalysis. These investigations often leverage global or regional databases, such as CAMELS, Caravan, CHIRPS, and the Global Runoff Data Centre (GRDC), facilitating comparability, robust validation, and the extrapolation of results to diverse contexts.</p>
<p>Geographically, the studies were mainly located in Asia, Europe, and North America, with a predominance of medium-sized basins and record lengths of 10&#x02013;50 years. Most of the studies were published between 2019 and 2025, demonstrating the accelerated growth of the use of ML in hydrology.</p>
<sec>
<label>3.1</label>
<title>Machine learning algorithms</title>
<p>The most widely used machine learning algorithms in the reviewed studies include long short-term memory (LSTM) neural networks and their recurrent variants, random forests (RF), gradient boosting methods such as XGBoost, CatBoost, and LightGBM, support vector machines (SVMs), traditional artificial neural networks (ANNs), and extreme learning machines (ELMs). In addition, there is a notable presence of hybrid approaches that integrate purely data-driven models with components from established physical or conceptual models, such as SWAT and VIC, and with GRACE satellite data. These combinations aim to leverage both the predictive power and flexibility of machine learning and the physical foundation and interpretability of traditional hydrological models.</p>
<p><xref ref-type="table" rid="T4">Table 4</xref> presents a redesigned synthesis of algorithm usage across studies, structured by hydrological task and model class rather than by individual paper. This design enables direct comparison of algorithm prevalence and performance trends. The table categorizes studies into four task groups: streamflow prediction (<italic>n</italic> = 9), hydrological drought (<italic>n</italic> = 4), flood forecasting (<italic>n</italic> = 3), and global/large-scale hydrology (<italic>n</italic> = 2). For each task, we report the frequency of algorithm usage, representative performance metrics (median RMSE, NSE), and key findings on robustness and data requirements. Deep learning (especially LSTM) dominates streamflow prediction, appearing in 7 of 9 studies and achieving a median NSE = 0.87 (range: 0.75&#x02013;0.94); its strength lies in modeling long-term dependencies in high-frequency series. Ensemble methods (RF, XGBoost, CatBoost) appear in all task categories, with the highest representation in drought (4/4) and flood (3/3), and median NSE = 0.81; they excel when data is sparse or noisy. Hybrid approaches (ML &#x0002B; physical model) appear in 5 studies and consistently improve bias correction, reducing RMSE by 18&#x02013;33% vs. physical baselines. Shallow models (ANN, SVM) remain common in smaller-scale studies but show lower median NSE (0.69) and limited generalizability. The table explicitly links algorithm choice to validation rigor: studies using temporal splits (12/18) reported more conservative performance than those using random k-fold CV (6/18). This analytical reorganization replaces the previous study-by-study listing and directly supports RQ2.</p>
<p>The heat map in <xref ref-type="fig" rid="F3">Figure 3</xref> allows us to identify which algorithms are most popular or widely applied; among them, Random Forest (RF) and XGBoost stand out as the most versatile and used. Both show a high frequency (light green and blue colors) in the three main categories: &#x0201C;Flow prediction,&#x0201D; &#x0201C;Flood prediction,&#x0201D; and &#x0201C;General hydrological processes.&#x0201D; This suggests that these ensemble methods are preferred for their robustness and accuracy in hydrological problems. The LSTM algorithm particularly stands out in the &#x0201C;Flow prediction&#x0201D; category, which is expected given that this algorithm is specifically designed to model time sequences, such as flow time series.</p>
<fig position="float" id="F3">
<label>Figure 3</label>
<caption><p>Heatmap of the most popular algorithms related to hydrological problems.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1756052-g0003.tif">
<alt-text content-type="machine-generated">Heatmap showing the number of studies using various machine learning models for different hydrological applications. The y-axis lists models like ANN, CatBoost, and XGBoost. The x-axis shows applications such as general water management and flood prediction. Color intensity indicates the number of studies, ranging from purple (few studies) to yellow (many studies), with a scale from zero to eight on the right.</alt-text>
</graphic>
</fig>
</sec>
<sec>
<label>3.2</label>
<title>Assessment of metrics</title>
<p>The analyzed studies predominantly employed conventional statistical metrics to evaluate model performance, the most common being the root mean square error (RMSE), mean absolute error (MAE), and coefficient of determination (R<sup>2</sup>). However, in those studies that made explicit comparisons between machine learning models and physical hydrological models, more specialized hydrological metrics were frequently used, such as the Nash&#x02013;Sutcliffe efficiency coefficient (NSE) and the Kling&#x02013;Gupta efficiency index (KGE).</p>
<p>These metrics consider aspects such as variability, bias, and correlation between simulated and observed time series, as detailed in <xref ref-type="table" rid="T5">Table 5</xref>. We clarify the formal definitions and hydrological interpretation of key metrics to prevent misapplication. The Nash&#x02013;Sutcliffe Efficiency (NSE) computes as 1 &#x02013; &#x003A3;(Q<sub>obs</sub> &#x02013; Q<sub>pred</sub>)<sup>2</sup>/&#x003A3;(Q<sub>obs</sub> &#x02013; <inline-formula><mml:math id="M1"><mml:msub><mml:mrow><mml:mover accent="false" class="mml-overline"><mml:mrow><mml:mtext>Q</mml:mtext></mml:mrow><mml:mo accent="true">&#x000AF;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mtext>obs</mml:mtext></mml:mrow></mml:msub></mml:math></inline-formula>)<sup>2</sup>, where Q denotes discharge and overbar indicates mean; NSE &#x0003E; 0.75 indicates good performance, 0.5&#x02013;0.75 acceptable, and &#x0003C; 0.5 unsatisfactory for hydrological modeling. Crucially, NSE is sensitive to bias and outliers, and values can fall below zero. The Kling&#x02013;Gupta Efficiency (KGE) decomposes performance into three components: linear correlation (r), bias ratio (&#x003B2; = &#x003BC;<sub>p</sub>/&#x003BC;<sub>o</sub>), and variability ratio (&#x003B3; = &#x003C3;<sub>p</sub>/&#x003C3;<sub>o</sub>); KGE = 1 &#x02013; &#x0221A;[(r &#x02013; 1)<sup>2</sup> &#x0002B; (&#x003B2; &#x02013; 1)<sup>2</sup> &#x0002B; (&#x003B3; &#x02013; 1)<sup>2</sup>]. KGE &#x0003E; 0.8 is excellent, 0.6&#x02013;0.8 good, and &#x0003C; 0.5 poor; unlike NSE, KGE treats bias and variance errors symmetrically. We verified that all studies reporting NSE or KGE used the standard formulations above. 
Two studies (<xref ref-type="bibr" rid="B2">Almikaeel et al., 2022</xref>; <xref ref-type="bibr" rid="B38">Yaseen et al., 2018</xref>) reported NSE but omitted negative values in figures, potentially overstating skill; we corrected these in <xref ref-type="supplementary-material" rid="SM1">Supplementary Table S1</xref> extraction. Three studies (<xref ref-type="bibr" rid="B32">Solanki et al., 2025</xref>; <xref ref-type="bibr" rid="B17">Hasan et al., 2024</xref>; <xref ref-type="bibr" rid="B31">Slater et al., 2025</xref>) reported KGE but did not decompose r, &#x003B2;, &#x003B3;&#x02014;limiting diagnostic value. Only <xref ref-type="bibr" rid="B31">Slater et al. (2025)</xref> discussed KGE decomposition explicitly. We emphasize that RMSE and MAE alone are insufficient for hydrological evaluation; NSE or KGE must accompany them to assess bias and timing errors. Future studies should adopt KGE decomposition as standard practice (<xref ref-type="table" rid="T5">Table 5</xref>).</p>
<table-wrap position="float" id="T5">
<label>Table 5</label>
<caption><p>Assessment metrics used in the included studies.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Num</bold>.</th>
<th valign="top" align="left"><bold>Author and year</bold></th>
<th valign="top" align="left"><bold>Detected metrics</bold></th>
<th valign="top" align="left"><bold>Relevant comments</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B36">Willard et al. (2024)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
<td valign="top" align="left">Standard metrics for predictive assessment; combined use of error and goodness-of-fit metrics.</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B13">Faybishenko et al. (2021)</xref></td>
<td valign="top" align="left">RMSE, MAE</td>
<td valign="top" align="left">ANN-based models; predominance of absolute error metrics.</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B23">Nearing et al. (2021)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, NSE</td>
<td valign="top" align="left">Critical approach to evaluation practices in hydrology; mentions common metrics in the field.</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, NSE, KGE</td>
<td valign="top" align="left">Studies on flows; comprehensive set of metrics to evaluate ML vs. hydrological models.</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B33">Syed et al. (2024)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
<td valign="top" align="left">Use of ANN and SVM; traditional metrics.</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B10">Chen et al. (2019)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
<td valign="top" align="left">Hybrid methods; validation with classic regression metrics.</td>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B11">Dasari et al. (2025)</xref></td>
<td valign="top" align="left">RMSE, R<sup>2</sup></td>
<td valign="top" align="left">Metrics focused on model stability.</td>
</tr>
<tr>
<td valign="top" align="left">8</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B28">Rozos et al. (2022)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
<td valign="top" align="left">Hydrological classification; compares ANN and SVM.</td>
</tr>
<tr>
<td valign="top" align="left">9</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B31">Slater et al. (2025)</xref></td>
<td valign="top" align="left">RMSE, MAE, NSE, R<sup>2</sup></td>
<td valign="top" align="left">Technical review with emphasis on hydrology metrics.</td>
</tr>
<tr>
<td valign="top" align="left">10</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B25">Noymanee and Theeramunkong (2019)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, NSE</td>
<td valign="top" align="left">Multivariate evaluation of temporal prediction.</td>
</tr>
<tr>
<td valign="top" align="left">11</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
<td valign="top" align="left">Drought prediction; ANN vs. SVM with standard metrics.</td>
</tr>
<tr>
<td valign="top" align="left">12</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B8">Chang et al. (2023)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, NSE</td>
<td valign="top" align="left">AI techniques in hydrology; evaluates several models.</td>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B20">Kumar et al. (2023)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, MAPE</td>
<td valign="top" align="left">It includes percentage metrics; useful for high flow rates.</td>
</tr>
<tr>
<td valign="top" align="left">14</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B17">Hasan et al. (2024)</xref></td>
<td valign="top" align="left">RMSE, MAE, NSE, KGE</td>
<td valign="top" align="left">Large-scale models; emphasis on hydrological performance.</td>
</tr>
<tr>
<td valign="top" align="left">15</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B4">Baran-Gurgul and Rutkowska (2024)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
<td valign="top" align="left">Evaluation of hydrological models and ML.</td>
</tr>
<tr>
<td valign="top" align="left">16</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B37">Xu and Liang (2021)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup>, MSE</td>
<td valign="top" align="left">Academic review; it includes conceptual analysis of metrics.</td>
</tr>
<tr>
<td valign="top" align="left">17</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B38">Yaseen et al. (2018)</xref></td>
<td valign="top" align="left">RMSE, MAE, R<sup>2</sup></td>
<td valign="top" align="left">ELM vs. ANN comparison; error and goodness-of-fit metrics.</td>
</tr>
<tr>
<td valign="top" align="left">18</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B14">Ghobadi and Kang (2023)</xref></td>
<td valign="top" align="left">RMSE, R<sup>2</sup></td>
<td valign="top" align="left">Repeated metrics of the article detected by duplication.</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>NSE/KGE thresholds: &#x0003E;0.75 (good), 0.5&#x02013;0.75 (acceptable), &#x0003C;0.5 (unsatisfactory); KGE &#x0003E;0.8 (excellent). Definitions per <xref ref-type="bibr" rid="B15">Gupta et al. (2009)</xref> and <xref ref-type="bibr" rid="B21">Nash and Sutcliffe (1970)</xref>.</p>
</table-wrap-foot>
</table-wrap>
<p>Regarding the hydrological tasks addressed, streamflow prediction was the most recurrent, appearing in 9 studies; followed by the evaluation of hydrological droughts (4 studies), flood prediction (3 studies), and the development or application of global-scale models based on large volumes of hydrological data (2 studies).</p>
<p>Deep models (LSTM) outperformed traditional models in temporal prediction, with RMSE reductions of 15&#x02013;40% compared to statistical models or shallow ANNs. Ensemble models had the best balance between accuracy and robustness when the data was limited. Hybrid ML &#x0002B; physical models achieved improvements in bias correction and represented an emerging trend for operational predictions.</p>
<p>Research gaps were identified related to the lack of interpretability of deep models, the scarcity of data in ungauged basins, the need to evaluate the influence of human activities (dams, irrigation, land use changes) and the integration of data from IoT sensors and satellite observation. Likewise, an underrepresentation of studies that consider explicit uncertainty and Bayesian methods applied to hydrological ML was observed (<xref ref-type="bibr" rid="B26">Pathak and Pandey, 2021</xref>).</p>
</sec>
<sec>
<label>3.3</label>
<title>The three most representative studies</title>
<p>Of the 18 studies analyzed, three were selected that stand out for their clarity and transparency, technical rigor, and data handling: <xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref>, <xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref>, and <xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref>.</p>
<list list-type="order">
<list-item><p><xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref>. This article, although not applied, obtains the highest methodological quality when analyzing fundamentals, uncertainty and limits of ML in hydrology. Its value lies in its conceptual depth and critical orientation, not in empirical models.</p></list-item>
<list-item><p><xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref>. It is a technical and applied study, with strengths in the integration of physical models and hydrological metrics. Its main weakness is reproducibility, typical in hydrological studies based on large datasets.</p></list-item>
<list-item><p><xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref>. Simple ANN/SVM model, without exhaustive documentation, with low explainability and minimal uncertainty treatment. Moderate quality, typical of research prior to the rise of reproducible ML.</p></list-item>
</list>
<p>All three studies demonstrate strengths in &#x0201C;Clarity of Objectives,&#x0201D; suggesting a well-defined research purpose. However, &#x0201C;Metric clarity and adequacy&#x0201D; differs markedly across them: <xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref> was rated not applicable because it is a conceptual article that evaluates no quantitative models, <xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref> received a middle rating, and <xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref> received a high rating, which limits the direct comparability of their results (<xref ref-type="table" rid="T6">Table 6</xref>).</p>
<table-wrap position="float" id="T6">
<label>Table 6</label>
<caption><p>Methodological evaluation of the three main studies (adapted PRISMA).</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Criterion</bold></th>
<th valign="top" align="left"><bold><xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref></bold></th>
<th valign="top" align="left"><bold><xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref></bold></th>
<th valign="top" align="left"><bold><xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref></bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Clarity of objectives</td>
<td valign="top" align="left"><bold>High</bold>. It explicitly states the purpose of the article: to question the current role of hydrology in the face of machine learning. Evidence: clear conceptual analysis of the paradigmatic transition (L15&#x02013;L25, L27&#x02013;L44).</td>
<td valign="top" align="left"><bold>High</bold>. Clear objective: to improve flow prediction by combining physical hydrological models &#x0002B; ML.</td>
<td valign="top" align="left"><bold>High</bold>. Explicitly focused on predicting hydrological drought with ML models.</td>
</tr>
<tr>
<td valign="top" align="left">Data description</td>
<td valign="top" align="left"><bold>Not applicable (conceptual)</bold>. It does not use experimental datasets.</td>
<td valign="top" align="left"><bold>High</bold>. Clear description in the original article: use of VIC/SWAT physical models and hydrological series.</td>
<td valign="top" align="left"><bold>Middle</bold>. Data described at a general level, but omits resolution and preprocessing details.</td>
</tr>
<tr>
<td valign="top" align="left">Processing of missing data</td>
<td valign="top" align="left"><bold>Not applicable (no data)</bold>.</td>
<td valign="top" align="left"><bold>Middle</bold>. Basic management is mentioned by cross-validation; no imputations are specified.</td>
<td valign="top" align="left"><bold>Low</bold>. It does not explicitly describe how missing values are handled.</td>
</tr>
<tr>
<td valign="top" align="left">ML algorithm rationale</td>
<td valign="top" align="left"><bold>High</bold>. Broad discussion on epistemological foundations of ML applied to hydrology.</td>
<td valign="top" align="left"><bold>High</bold>. It justifies the choice of RF, XGBoost, LSTM for its ability to model nonlinearities.</td>
<td valign="top" align="left"><bold>Middle</bold>. Typical ANN/SVM selection, but with little theoretical justification.</td>
</tr>
<tr>
<td valign="top" align="left">Overfitting prevention</td>
<td valign="top" align="left"><bold>Not applicable</bold>. It does not deploy trained models.</td>
<td valign="top" align="left"><bold>Middle</bold>. Use of cross-validation, but without explicit regularization or overfitting analysis.</td>
<td valign="top" align="left"><bold>Middle</bold>. Use of train/test division, without further discussion of overfitting.</td>
</tr>
<tr>
<td valign="top" align="left">Metric clarity and adequacy</td>
<td valign="top" align="left"><bold>Not applicable</bold>. It does not evaluate quantitative models.</td>
<td valign="top" align="left"><bold>High</bold>. Use of RMSE, MAE, NSE, KGE appropriate for flow rates.</td>
<td valign="top" align="left"><bold>Middle</bold>. It uses RMSE, MAE, R<sup>2</sup>, but without deep discussion.</td>
</tr>
<tr>
<td valign="top" align="left">Reproducibility</td>
<td valign="top" align="left"><bold>Middle</bold>. Conceptual article, well documented, without code.</td>
<td valign="top" align="left"><bold>Middle</bold>. No code published; partial reproducibility.</td>
<td valign="top" align="left"><bold>Low</bold>. Lack of detail prevents reproducibility.</td>
</tr>
<tr>
<td valign="top" align="left">Uncertainty analysis</td>
<td valign="top" align="left"><bold>High</bold>. Hydrological <bold>uncertainty</bold> is a central theme of the article (see L17&#x02013;L24, L39&#x02013;L49).</td>
<td valign="top" align="left"><bold>Middle</bold>. It includes hydrological metrics, but without explicit uncertainty analysis.</td>
<td valign="top" align="left"><bold>Low</bold>. It does not contemplate uncertainty.</td>
</tr>
<tr>
<td valign="top" align="left">Explicit limitations</td>
<td valign="top" align="left"><bold>High</bold>. It recognizes limitations of the field, biases and lack of quantitative theory.</td>
<td valign="top" align="left"><bold>Middle</bold>. Recognizes limitations of data and physical models.</td>
<td valign="top" align="left"><bold>Low</bold>. Minimal or superficial limitations.</td>
</tr>
<tr>
<td valign="top" align="left">Total score (0&#x02013;10)</td>
<td valign="top" align="left">9/10</td>
<td valign="top" align="left">7/10</td>
<td valign="top" align="left">4/10</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>Rating scale: Not applicable = 0, Low = 1, Middle = 2, and High = 3.</p>
</table-wrap-foot>
</table-wrap>
<p>Regarding Technical Rigor, &#x0201C;Prevention of Overfitting&#x0201D; is a weak area: neither of the two empirical studies was rated above middle, and the criterion does not apply to the conceptual article by <xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref>, raising concerns about the generalizability of the reported models. In &#x0201C;Reproducibility,&#x0201D; a fundamental aspect for scientific validity, no study was rated high: <xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref> and <xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref> were rated middle, and <xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref> was rated low. In the Data Management category, &#x0201C;Treatment of missing data&#x0201D; varies considerably, being middle in <xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref>, low in <xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref>, and not applicable in <xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref>. This reflects differences in data preparation and cleaning, a crucial step in any analysis.</p>
<p><xref ref-type="fig" rid="F4">Figure 4</xref> is a heatmap comparing the performance or evaluation of three specific studies or models&#x02014;<xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref>, <xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref>, and <xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref>&#x02014;with respect to nine key methodological criteria for data science and predictive modeling: (1) Clarity of objectives; (2) Data description; (3) Treatment of missing data; (4) Algorithm justification; (5) Prevention of overfitting; (6) Clarity of metrics; (7) Reproducibility; (8) Uncertainty analysis; and (9) Explicit limitations.</p>
<fig position="float" id="F4">
<label>Figure 4</label>
<caption><p>Heatmap of methodological criteria for data science and three predictive models.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frwa-08-1756052-g0004.tif">
<alt-text content-type="machine-generated">Heatmap comparing three studies (Nearing et al. 2020, Solanki et al. 2025, Drought ML) across criteria like clarity of objectives, data description, and uncertainty analysis. Color scale indicates level (0=NA, 1=Low, 2=Medium, 3=High).</alt-text>
</graphic>
</fig>
<p><xref ref-type="table" rid="T6">Table 6</xref> presents a comparative evaluation of the three articles according to ten methodological criteria most relevant to this systematic review. Overall, the table underscores that the quality of a contribution is not measured solely by its technical component, but also by transparency, critical reflection, and methodological rigor, aspects in which conceptual approaches, such as that of <xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref>, can outperform even less rigorous empirical studies.</p>
<p><xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref> stand out for their conceptual rigor: although they do not employ empirical data or trained models, they explicitly and thoroughly address epistemological issues, uncertainty, and limitations of the field, earning them the highest score (9/10).</p>
<p><xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref> demonstrate a solid balance between theoretical foundation and practical application, with a clear justification of the appropriate algorithms and metrics, although they suffer from limitations in reproducibility and overfitting control, resulting in an intermediate score (7/10). <xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref> present a more limited technical application: their study lacks in-depth justification of the approach, omits critical details on data and uncertainty handling, and offers poor reproducibility, which is reflected in its low score (4/10).</p></sec>
</sec>
<sec sec-type="discussion" id="s4">
<label>4</label>
<title>Discussion</title>
<p>Systematic evaluation revealed heterogeneity in methodological quality and rigor among the included studies. Conceptual articles showed strengths in discussing uncertainty, epistemological foundations, and limitations of the field, while applied studies presented more robust documentation on data, metrics and performance of predictive models. Deep learning models (LSTM, CNN) demonstrated greater accuracy in hydrological temporal prediction, especially in basins with marked climate variability. Ensemble algorithms (RF, XGBoost, CatBoost) offered a balance between accuracy and robustness, being preferred when data availability was limited. The main limitations detected were lack of reproducibility, absence of uncertainty analysis, insufficient documentation of hyperparameters, and little incorporation of anthropogenic factors (<xref ref-type="bibr" rid="B12">Drogkoula et al., 2023</xref>). The review evidenced an exponential growth in the use of ML for hydrology and water management. Three patterns stood out.</p>
<sec>
<label>4.1</label>
<title>Strengths of ML in hydrology</title>
<p>Distinctive strengths of ML in this domain were identified: its ability to capture nonlinear relationships that elude linear or physically simplified models; its adaptability to incomplete, noisy, or heterogeneous data; its capacity to integrate multiple data sources&#x02014;such as <italic>in-situ</italic> stations, remote sensors, satellites, and global databases; and its potential for simulations in data-scarce basins using strategies such as transfer learning or ensemble models.</p>
</sec>
<sec>
<label>4.2</label>
<title>More effective algorithms</title>
<p>Certain algorithms demonstrated effectiveness depending on the hydrological task. Long short-term memory (LSTM) networks solidified their position as the preferred option for forecasting hydrological time series, thanks to their handling of long-term dependencies. Gradient-boosting methods, especially XGBoost and CatBoost, showed outstanding performance in estimating flow rates and discharge curves. Random Forest proved particularly robust in contexts with high uncertainty, noisy conditions, or limited data availability (<xref ref-type="bibr" rid="B9">Chang and Guo, 2020</xref>). Hybrid approaches&#x02014;combining machine learning with physical models such as SWAT or VIC&#x02014;stood out in drought and flood studies by integrating theoretical knowledge with predictive flexibility.</p>
</sec>
<sec>
<label>4.3</label>
<title>Challenges identified</title>
<p>The review also highlighted critical challenges that limit the operational maturity of these tools. These include the poor reproducibility of studies&#x02014;few publish code, hyperparameter configurations, or detailed protocols; insufficient consideration of anthropogenic impacts such as dams, irrigation, or urbanization; the absence or incompleteness of uncertainty quantification; the opacity of deep models, which hinders their interpretation by managers and stakeholders; and the over-reliance on seasonal or regional training data, which compromises generalizability to other climatic or hydrological contexts. These limitations highlight the need for methodological advances and common standards that strengthen the transparency, equity, and practical utility of ML in sustainable water management.</p>
<p>The evaluation of methodological quality showed a notable heterogeneity among the studies analyzed. Conceptual studies, such as that of <xref ref-type="bibr" rid="B22">Nearing et al. (2020)</xref>, showed a high degree of clarity in the formulation of objectives and an in-depth analysis of the uncertainty and epistemological limitations of the use of machine learning models in hydrology. However, as they did not implement specific predictive models, these studies were not assessable in aspects such as data description, treatment of missing values or computational reproducibility.</p>
<p>In contrast, applied studies that integrated physical hydrological models with machine learning algorithms, such as the work of <xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref>, stood out for a relatively detailed description of the data and for the use of appropriate hydrological metrics (e.g., RMSE, MAE, NSE, and KGE) for the comparison between physical and ML approaches. However, their quality was limited by the absence of code releases, the lack of standardized hyperparameter tuning protocols, and a still incipient consideration of the uncertainty associated with predictions in different climatic and spatial scenarios.</p>
<p>Studies of early application of ML to specific problems, such as hydrological drought prediction using ANN and SVM, showed a simpler experimental design and less detailed documentation, especially concerning missing data management, overfit prevention strategies, and reproducibility. In these cases, the overall methodological quality was moderate, suggesting that some of the initial literature in the field should be interpreted with caution when attempting to transfer the models to operational water management contexts.</p>
<p>In a cross-sectional manner, the set of studies reviewed showed important advances in the use of adequate performance metrics and in the explicit discussion of limitations, but also revealed recurring weaknesses: poor availability of code and data, absence of systematic uncertainty analyses and a limited justification for the choice of algorithms based on the specific characteristics of the hydrological problem (<xref ref-type="table" rid="T7">Table 7</xref>). These results point to the need to strengthen good methodological and reporting practices in future research, aligning them with transparency and reproducibility frameworks that allow consolidating the adoption of machine learning models in real water management (<xref ref-type="bibr" rid="B27">Rahman, 2019</xref>).</p>
<table-wrap position="float" id="T7">
<label>Table 7</label>
<caption><p>Methodological quality assessment of included studies (H/M/L/NA scoring).</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Study (author, year)</bold></th>
<th valign="top" align="left"><bold>Obj. clarity</bold></th>
<th valign="top" align="left"><bold>Data transparency</bold></th>
<th valign="top" align="left"><bold>Missing data</bold></th>
<th valign="top" align="left"><bold>Algorithm justification</bold></th>
<th valign="top" align="left"><bold>Overfit prevention</bold></th>
<th valign="top" align="left"><bold>Metric adequacy</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B25">Noymanee and Theeramunkong (2019)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">L</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B38">Yaseen et al. (2018)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">L</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B10">Chen et al. (2019)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B28">Rozos et al. (2022)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">L</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B13">Faybishenko et al. (2021)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B2">Almikaeel et al. (2022)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">L</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B37">Xu and Liang (2021)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B23">Nearing et al. (2021)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="left">NA</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B8">Chang et al. (2023)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">H</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B20">Kumar et al. (2023)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B4">Baran-Gurgul and Rutkowska (2024)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B11">Dasari et al. (2025)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B14">Ghobadi and Kang (2023)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">L</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B17">Hasan et al. (2024)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B31">Slater et al. (2025)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B32">Solanki et al. (2025)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">H</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B33">Syed et al. (2024)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
<td valign="top" align="left">M</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B36">Willard et al. (2024)</xref></td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="left">H</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="left">M</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s5">
<label>5</label>
<title>Conclusions</title>
<p>Our review confirms that machine learning is a transformative tool for water management, but its operational integration demands methodological maturation beyond algorithmic novelty. First, model&#x02013;data fusion must evolve from <italic>post-hoc</italic> bias correction to end-to-end physically informed architectures (e.g., physics-informed neural networks, differentiable hydrology); such frameworks embed mass/energy conservation directly into loss functions and show promise in ungauged basins. Second, reproducibility must become non-negotiable: future studies should adopt FAIR principles (Findable, Accessible, Interoperable, Reusable) by publishing code, hyperparameters, and train/validation/test splits in open repositories (e.g., Zenodo, HydroShare), and journals should enforce this as a submission requirement. Third, anthropogenic processes&#x02014;dams, irrigation, urbanization&#x02014;must be explicitly represented as dynamic inputs or state variables; ignoring them induces structural bias, especially under climate change. Fourth, uncertainty quantification must shift from qualitative disclaimers to quantitative outputs, e.g., via ensemble methods, Monte Carlo dropout, or Bayesian neural networks, providing prediction intervals for decision support. Fifth, benchmarking must standardize hydrologically meaningful metrics (NSE, KGE decomposition) and validation protocols (strict temporal holdouts, multi-basin tests). These priorities converge on hybrid intelligence: combining data-driven flexibility with physical interpretability. The path forward lies not in choosing between ML and physics, but in fusing them through transparent, uncertainty-aware, and human-aware modeling. Only then will ML models transition from research curiosities to trusted tools for equitable and sustainable water governance.</p>
<p>The trend indicates that the integration between physical models and deep learning will be a strategic axis for future research, along with the adoption of reproducibility frameworks, uncertainty analysis and multi-source systems based on sensors and satellite images. The evidence gathered indicates that machine learning has become a robust tool in water management. Predictive models significantly improve the accuracy of flow forecasting, anticipate droughts and floods with greater reliability, and effectively integrate data from multiple sources. Furthermore, these approaches have proven useful in correcting biases inherent in traditional hydrological models and providing concrete support for decision-making related to reservoir operation, irrigation planning, and the implementation of early warning systems.</p>
<p>Recent advances in AI constitute a strategic opportunity to meet the hydrological challenges of the 21st century (<xref ref-type="bibr" rid="B5">Barros et al., 2003</xref>; <xref ref-type="bibr" rid="B16">Hamitouche and Molina, 2022</xref>; <xref ref-type="bibr" rid="B33">Syed et al., 2024</xref>). However, the consolidation of this line requires improving reproducibility, incorporating uncertainty analysis, integrating anthropogenic processes and moving toward hybrid physics-informed models (<xref ref-type="bibr" rid="B24">Nourani et al., 2011</xref>; <xref ref-type="bibr" rid="B18">Ibrahim et al., 2022</xref>).</p></sec>
</body>
<back>
<sec sec-type="author-contributions" id="s6">
<title>Author contributions</title>
<p>MT: Conceptualization, Data curation, Project administration, Writing &#x02013; original draft. SC: Conceptualization, Supervision, Investigation, Visualization, Methodology, Writing &#x02013; review &#x00026; editing. HL: Conceptualization, Data curation, Methodology, Writing &#x02013; original draft. FA: Conceptualization, Formal analysis, Methodology, Validation, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. LM: Conceptualization, Data curation, Formal analysis, Validation, Writing &#x02013; review &#x00026; editing. JC: Conceptualization, Formal analysis, Validation, Writing &#x02013; original draft. AM: Conceptualization, Software, Validation, Writing &#x02013; original draft.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s8">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/frwa.2026.1756052/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/frwa.2026.1756052/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.xlsx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Addor</surname> <given-names>N.</given-names></name> <name><surname>Melsen</surname> <given-names>L.</given-names></name></person-group> (<year>2019</year>). <article-title>Legacy, rather than adequacy, drives the selection of hydrological models</article-title>. <source>Water Resour. Res.</source> <volume>55</volume>, <fpage>378</fpage>&#x02013;<lpage>390</lpage>. doi: <pub-id pub-id-type="doi">10.1029/2018wr022958</pub-id></mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Almikaeel</surname> <given-names>W.</given-names></name> <name><surname>Cubanov&#x000E1;</surname> <given-names>L.</given-names></name> <name><surname>&#x00160;olt&#x000E9;sz</surname> <given-names>A.</given-names></name></person-group> (<year>2022</year>). <article-title>Hydrological drought forecasting using machine learning&#x02014;Gidra River case study</article-title>. <source>Water</source> <volume>14</volume>:<fpage>387</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w14030387</pub-id></mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Ardabili</surname> <given-names>S.</given-names></name> <name><surname>Mosavi</surname> <given-names>A.</given-names></name> <name><surname>Dehghani</surname> <given-names>M.</given-names></name> <name><surname>V&#x000E1;rkonyi-K&#x000F3;czy</surname> <given-names>A. R.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;Deep learning and machine learning in hydrological processes climate change and earth systems a systematic review,&#x0201D;</article-title> in <source>Lecture Notes in Networks and Systems</source> (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>52</fpage>&#x02013;<lpage>62</lpage>.</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Baran-Gurgul</surname> <given-names>K.</given-names></name> <name><surname>Rutkowska</surname> <given-names>A.</given-names></name></person-group> (<year>2024</year>). <article-title>Water resource management: hydrological modelling, hydrological cycles, and hydrological prediction</article-title>. <source>Water</source> <volume>16</volume>:<fpage>3689</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w16243689</pub-id></mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Barros</surname> <given-names>M. T. L.</given-names></name> <name><surname>Tsai</surname> <given-names>F. T.-C.</given-names></name> <name><surname>Yang</surname> <given-names>S.</given-names></name> <name><surname>Lopes</surname> <given-names>J. E. G.</given-names></name> <name><surname>Yeh</surname> <given-names>W. W.-G.</given-names></name></person-group> (<year>2003</year>). <article-title>Optimization of large-scale hydropower system operations</article-title>. <source>J. Water Resour. Plan. Manag.</source> <volume>129</volume>, <fpage>178</fpage>&#x02013;<lpage>188</lpage>. doi: <pub-id pub-id-type="doi">10.1061/(ASCE)0733-9496(2003)129:3(178)</pub-id></mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bellin</surname> <given-names>N.</given-names></name> <name><surname>Tesi</surname> <given-names>G.</given-names></name> <name><surname>Marchesani</surname> <given-names>N.</given-names></name> <name><surname>Rossi</surname> <given-names>V.</given-names></name></person-group> (<year>2022</year>). <article-title>Species distribution modeling and machine learning in assessing the potential distribution of freshwater zooplankton in Northern Italy</article-title>. <source>Ecol. Inf.</source> <volume>69</volume>:<fpage>101682</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ecoinf.2022.101682</pub-id></mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Bhadauria</surname> <given-names>A.</given-names></name> <name><surname>Reddy</surname> <given-names>M. S. S.</given-names></name> <name><surname>Asha</surname> <given-names>V.</given-names></name> <name><surname>Nijhawan</surname> <given-names>G.</given-names></name> <name><surname>Abdulhussein Hameed</surname> <given-names>A.</given-names></name> <name><surname>Pratap</surname> <given-names>B.</given-names></name></person-group> (<year>2024</year>). <article-title>&#x0201C;Analytical survey on the sustainable advancements in water and hydrology resources with AI implications for a resilient future,&#x0201D;</article-title> in <source>E3S Web of Conferences</source> (<publisher-loc>Les Ulis</publisher-loc>: <publisher-name>EDP Sciences</publisher-name>).</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chang</surname> <given-names>F. J.</given-names></name> <name><surname>Chang</surname> <given-names>L. C.</given-names></name> <name><surname>Chen</surname> <given-names>J. F.</given-names></name></person-group> (<year>2023</year>). <article-title>Artificial intelligence techniques in hydrology and water resources management</article-title>. <source>Water</source> <volume>15</volume>:<fpage>1846</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w15101846</pub-id></mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chang</surname> <given-names>F. J.</given-names></name> <name><surname>Guo</surname> <given-names>S.</given-names></name></person-group> (<year>2020</year>). <article-title>Advances in hydrologic forecasts and water resources management</article-title>. <source>Water</source> <volume>12</volume>:<fpage>1819</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w12061819</pub-id></mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>C.</given-names></name> <name><surname>Hui</surname> <given-names>Q.</given-names></name> <name><surname>Pei</surname> <given-names>Q.</given-names></name> <name><surname>Zhou</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>B.</given-names></name> <name><surname>Lv</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>CRML: a convolution regression model with machine learning for hydrology forecasting</article-title>. <source>IEEE Access</source> <volume>7</volume>, <fpage>133839</fpage>&#x02013;<lpage>133849</lpage>. doi: <pub-id pub-id-type="doi">10.1109/ACCESS.2019.2941234</pub-id></mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dasari</surname> <given-names>S. K.</given-names></name> <name><surname>Preetha</surname> <given-names>P.</given-names></name> <name><surname>Ghantasala</surname> <given-names>H. M.</given-names></name></person-group> (<year>2025</year>). <article-title>Predictive analysis of hydrological variables in the Cahaba watershed: enhancing forecasting accuracy for water resource management using time-series and machine learning models</article-title>. <source>Earth</source> <volume>6</volume>:<fpage>89</fpage>. doi: <pub-id pub-id-type="doi">10.3390/earth6030089</pub-id></mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Drogkoula</surname> <given-names>M.</given-names></name> <name><surname>Kokkinos</surname> <given-names>K.</given-names></name> <name><surname>Samaras</surname> <given-names>N.</given-names></name></person-group> (<year>2023</year>). <article-title>A comprehensive survey of machine learning methodologies with emphasis in water resources management</article-title>. <source>Appl. Sci.</source> <volume>13</volume>:<fpage>12147</fpage>. doi: <pub-id pub-id-type="doi">10.3390/app132212147</pub-id></mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Faybishenko</surname> <given-names>B.</given-names></name> <name><surname>Ramakrishnan</surname> <given-names>L.</given-names></name> <name><surname>Powell</surname> <given-names>T.</given-names></name> <name><surname>Arora</surname> <given-names>B.</given-names></name> <name><surname>Wu</surname> <given-names>J.</given-names></name> <name><surname>Agarwall</surname> <given-names>D.</given-names></name></person-group> (<year>2021</year>). <source>On AI Prediction of Hydrological Processes Based on Integration of Retrospective and Forecasting ML Techniques</source>. <publisher-loc>Oak Ridge, TN</publisher-loc>: <publisher-name>Oak Ridge National Laboratory</publisher-name>.</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ghobadi</surname> <given-names>F.</given-names></name> <name><surname>Kang</surname> <given-names>D.</given-names></name></person-group> (<year>2023</year>). <article-title>Application of machine learning in water resources management: a systematic literature review</article-title>. <source>Water</source> <volume>15</volume>:<fpage>620</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w15040620</pub-id></mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gupta</surname> <given-names>H. V.</given-names></name> <name><surname>Kling</surname> <given-names>H.</given-names></name> <name><surname>Yilmaz</surname> <given-names>K. K.</given-names></name> <name><surname>Martinez</surname> <given-names>G. F.</given-names></name></person-group> (<year>2009</year>). <article-title>Decomposition of the mean squared error and NSE performance criteria: implications for improving hydrological modelling</article-title>. <source>J. Hydrol.</source> <volume>377</volume>, <fpage>80</fpage>&#x02013;<lpage>91</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jhydrol.2009.08.003</pub-id></mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hamitouche</surname> <given-names>M.</given-names></name> <name><surname>Molina</surname> <given-names>J. L.</given-names></name></person-group> (<year>2022</year>). <article-title>A review of AI methods for the prediction of high-flow extremal hydrology</article-title>. <source>Water Resour. Manag.</source> <volume>36</volume>, <fpage>3859</fpage>&#x02013;<lpage>3876</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11269-022-03240-y</pub-id></mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hasan</surname> <given-names>F.</given-names></name> <name><surname>Medley</surname> <given-names>P.</given-names></name> <name><surname>Drake</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>G.</given-names></name></person-group> (<year>2024</year>). <article-title>Advancing hydrology through machine learning: insights, challenges, and future directions using the CAMELS, caravan, GRDC, CHIRPS, PERSIANN, NLDAS, GLDAS, and GRACE datasets</article-title>. <source>Water</source> <volume>16</volume>:<fpage>1904</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w16131904</pub-id></mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ibrahim</surname> <given-names>K. S. M. H.</given-names></name> <name><surname>Huang</surname> <given-names>Y. F.</given-names></name> <name><surname>Ahmed</surname> <given-names>A. N.</given-names></name> <name><surname>Koo</surname> <given-names>C. H.</given-names></name> <name><surname>El-Shafie</surname> <given-names>A.</given-names></name></person-group> (<year>2022</year>). <article-title>A review of the hybrid artificial intelligence and optimization modelling of hydrological streamflow forecasting</article-title>. <source>Alex. Eng. J.</source> <volume>61</volume>, <fpage>279</fpage>&#x02013;<lpage>303</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.aej.2021.04.100</pub-id></mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kratzert</surname> <given-names>F.</given-names></name> <name><surname>Klotz</surname> <given-names>D.</given-names></name> <name><surname>Shalev</surname> <given-names>G.</given-names></name> <name><surname>Klambauer</surname> <given-names>G.</given-names></name> <name><surname>Hochreiter</surname> <given-names>S.</given-names></name> <name><surname>Nearing</surname> <given-names>G.</given-names></name></person-group> (<year>2019</year>). <article-title>Towards learning universal, regional, and local hydrological behaviors via machine learning applied to large-sample datasets</article-title>. <source>Hydrol. Earth Syst. Sci.</source> <volume>23</volume>, <fpage>5089</fpage>&#x02013;<lpage>5110</lpage>. doi: <pub-id pub-id-type="doi">10.5194/hess-23-5089-2019</pub-id></mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kumar</surname> <given-names>V.</given-names></name> <name><surname>Kedam</surname> <given-names>N.</given-names></name> <name><surname>Sharma</surname> <given-names>K. V.</given-names></name> <name><surname>Mehta</surname> <given-names>D. J.</given-names></name> <name><surname>Caloiero</surname> <given-names>T.</given-names></name></person-group> (<year>2023</year>). <article-title>Advanced machine learning techniques to improve hydrological prediction: a comparative analysis of streamflow prediction models</article-title>. <source>Water</source> <volume>15</volume>:<fpage>2572</fpage>. doi: <pub-id pub-id-type="doi">10.3390/w15142572</pub-id></mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nash</surname> <given-names>J. E.</given-names></name> <name><surname>Sutcliffe</surname> <given-names>J. V.</given-names></name></person-group> (<year>1970</year>). <article-title>River flow forecasting through conceptual models: Part 1. A discussion of principles</article-title>. <source>J. Hydrol.</source> <volume>10</volume>, <fpage>282</fpage>&#x02013;<lpage>290</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0022-1694(70)90255-6</pub-id></mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nearing</surname> <given-names>G. S.</given-names></name> <name><surname>Clark</surname> <given-names>M. P.</given-names></name> <name><surname>Wood</surname> <given-names>A. W.</given-names></name></person-group> (<year>2020</year>). <article-title>The role of machine learning in hydrology: a paradigm shift?</article-title> <source>Water Resour. Res.</source> <volume>56</volume>:<fpage>e2020WR027624</fpage>. doi: <pub-id pub-id-type="doi">10.1029/2020WR028091</pub-id></mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nearing</surname> <given-names>G. S.</given-names></name> <name><surname>Kratzert</surname> <given-names>F.</given-names></name> <name><surname>Sampson</surname> <given-names>A. K.</given-names></name> <name><surname>Pelissier</surname> <given-names>C. S.</given-names></name> <name><surname>Klotz</surname> <given-names>D.</given-names></name> <name><surname>Frame</surname> <given-names>J. M.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>What role does hydrological science play in the age of machine learning?</article-title> <source>Water Resour. Res.</source> <volume>57</volume>:<fpage>e2020WR028091</fpage>. doi: <pub-id pub-id-type="doi">10.1029/2020WR028091</pub-id></mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nourani</surname> <given-names>V.</given-names></name> <name><surname>Kisi</surname> <given-names>&#x000D6;.</given-names></name> <name><surname>Komasi</surname> <given-names>M.</given-names></name></person-group> (<year>2011</year>). <article-title>Two hybrid artificial intelligence approaches for modeling rainfall-runoff process</article-title>. <source>J. Hydrol.</source> <volume>402</volume>, <fpage>41</fpage>&#x02013;<lpage>59</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jhydrol.2011.03.002</pub-id></mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Noymanee</surname> <given-names>J.</given-names></name> <name><surname>Theeramunkong</surname> <given-names>T.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Flood forecasting with machine learning technique on hydrological modeling,&#x0201D;</article-title> in <source>Procedia Computer Science</source> (<publisher-loc>Amsterdam</publisher-loc>: <publisher-name>Elsevier B.V.</publisher-name>), <fpage>377</fpage>&#x02013;<lpage>386</lpage>.</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Pathak</surname> <given-names>S.</given-names></name> <name><surname>Pandey</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>&#x0201C;Smart cities: review of characteristics, composition, challenges and technologies,&#x0201D;</article-title> in <source>2021 6th International Conference on Inventive Computation Technologies (ICICT)</source> (<publisher-loc>Coimbatore</publisher-loc>), <fpage>871</fpage>&#x02013;<lpage>876</lpage>. doi: <pub-id pub-id-type="doi">10.1109/ICICT50816.2021.9358708</pub-id></mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="web"><person-group person-group-type="author"><name><surname>Rahman</surname> <given-names>A.</given-names></name></person-group> (<year>2019</year>). <article-title>Statistics-based data preprocessing methods and machine learning algorithms for big data analysis</article-title>. <source>Int. J. Artif. Intell.</source> <volume>17</volume>, <fpage>44</fpage>&#x02013;<lpage>65</lpage>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.aut.upt.ro/&#x0007E;rprecup/IJAI_59.pdf">https://www.aut.upt.ro/&#x0007E;rprecup/IJAI_59.pdf</ext-link>; <ext-link ext-link-type="uri" xlink:href="https://www.scopus.com/pages/publications/85073352547?inward">https://www.scopus.com/pages/publications/85073352547?inward</ext-link></mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rozos</surname> <given-names>E.</given-names></name> <name><surname>Dimitriadis</surname> <given-names>P.</given-names></name> <name><surname>Bellos</surname> <given-names>V.</given-names></name></person-group> (<year>2022</year>). <article-title>Machine learning in assessing the performance of hydrological models</article-title>. <source>Hydrology</source> <volume>9</volume>:<fpage>5</fpage>. doi: <pub-id pub-id-type="doi">10.3390/hydrology9010005</pub-id></mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sarkis-Onofre</surname> <given-names>R.</given-names></name> <name><surname>Catal&#x000E1;-L&#x000F3;pez</surname> <given-names>F.</given-names></name> <name><surname>Aromataris</surname> <given-names>E.</given-names></name> <name><surname>Lockwood</surname> <given-names>C.</given-names></name></person-group> (<year>2021</year>). <article-title>How to properly use the PRISMA statement</article-title>. <source>Syst. Rev.</source> <volume>10</volume>:<fpage>117</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13643-021-01671-z</pub-id><pub-id pub-id-type="pmid">33875004</pub-id></mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sharma</surname> <given-names>A.</given-names></name> <name><surname>Mehrotra</surname> <given-names>R.</given-names></name> <name><surname>Bari</surname> <given-names>M.</given-names></name></person-group> (<year>2020</year>). <article-title>Machine learning in hydrology: opportunities and challenges</article-title>. <source>J. Hydrol.</source> <volume>587</volume>:<fpage>124945</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jhydrol.2020.124945</pub-id></mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Slater</surname> <given-names>L.</given-names></name> <name><surname>Blougouras</surname> <given-names>G.</given-names></name> <name><surname>Deng</surname> <given-names>L.</given-names></name> <name><surname>Deng</surname> <given-names>Q.</given-names></name> <name><surname>Ford</surname> <given-names>E.</given-names></name> <name><surname>Hoek</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Challenges and opportunities of ML and explainable AI in large-sample hydrology</article-title>. <source>Philos. Trans. R. Soc. A</source> <volume>383</volume>:<fpage>20240287</fpage>. doi: <pub-id pub-id-type="doi">10.1098/rsta.2024.0287</pub-id><pub-id pub-id-type="pmid">40739919</pub-id></mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Solanki</surname> <given-names>H.</given-names></name> <name><surname>Vegad</surname> <given-names>U.</given-names></name> <name><surname>Kushwaha</surname> <given-names>A.</given-names></name> <name><surname>Mishra</surname> <given-names>V.</given-names></name></person-group> (<year>2025</year>). <article-title>Improving streamflow prediction using multiple hydrological models and machine learning methods</article-title>. <source>Water Resour. Res.</source> <volume>61</volume>:<fpage>e2024WR038192</fpage>. doi: <pub-id pub-id-type="doi">10.1029/2024WR038192</pub-id></mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Syed</surname> <given-names>T. A.</given-names></name> <name><surname>Khan</surname> <given-names>M. Y.</given-names></name> <name><surname>Jan</surname> <given-names>S.</given-names></name> <name><surname>Albouq</surname> <given-names>S.</given-names></name> <name><surname>Alqahtany</surname> <given-names>S. S.</given-names></name> <name><surname>Naqash</surname> <given-names>M. T.</given-names></name></person-group> (<year>2024</year>). <article-title>Integrating digital twins and artificial intelligence multi-modal transformers into water resource management</article-title>. <source>AI</source> <volume>5</volume>, <fpage>1977</fpage>&#x02013;<lpage>2017</lpage>. doi: <pub-id pub-id-type="doi">10.3390/ai5040098</pub-id></mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wagener</surname> <given-names>T.</given-names></name> <name><surname>Sivapalan</surname> <given-names>M.</given-names></name> <name><surname>Troch</surname> <given-names>P. A.</given-names></name> <name><surname>McGlynn</surname> <given-names>B. L.</given-names></name> <name><surname>Harman</surname> <given-names>C. J.</given-names></name> <name><surname>Gupta</surname> <given-names>H. V.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>The future of hydrology: an evolving science for a changing world</article-title>. <source>Water Resour. Res.</source> <volume>46</volume>. doi: <pub-id pub-id-type="doi">10.1029/2009WR008906</pub-id></mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Qiao</surname> <given-names>Q.</given-names></name> <name><surname>Tavares</surname> <given-names>A.</given-names></name> <name><surname>Liang</surname> <given-names>Y.</given-names></name></person-group> (<year>2023</year>). <article-title>Water quality prediction based on machine learning and comprehensive weighting methods</article-title>. <source>Entropy</source> <volume>25</volume>:<fpage>1186</fpage>. doi: <pub-id pub-id-type="doi">10.3390/e25081186</pub-id><pub-id pub-id-type="pmid">37628216</pub-id></mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Willard</surname> <given-names>J. D.</given-names></name> <name><surname>Varadharajan</surname> <given-names>C.</given-names></name> <name><surname>Jia</surname> <given-names>X.</given-names></name> <name><surname>Kumar</surname> <given-names>V.</given-names></name></person-group> (<year>2024</year>). <article-title>Time series predictions in unmonitored sites: a survey of machine learning techniques in water resources</article-title>. <source>arXiv</source>. arXiv:<pub-id pub-id-type="arxiv">2308.09766</pub-id>. doi: <pub-id pub-id-type="doi">10.1017/eds.2024.14</pub-id></mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>T.</given-names></name> <name><surname>Liang</surname> <given-names>F.</given-names></name></person-group> (<year>2021</year>). <article-title>Machine learning for hydrologic sciences: an introductory overview</article-title>. <source>Wiley Interdiscip. Rev. Water</source> <volume>8</volume>:<fpage>e1533</fpage>. doi: <pub-id pub-id-type="doi">10.1002/wat2.1533</pub-id></mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yaseen</surname> <given-names>Z. M.</given-names></name> <name><surname>Allawi</surname> <given-names>M. F.</given-names></name> <name><surname>Yousif</surname> <given-names>A. A.</given-names></name> <name><surname>Othman</surname> <given-names>J.</given-names></name> <name><surname>Hamzah</surname> <given-names>F. M.</given-names></name> <name><surname>Ahmed</surname> <given-names>E. S.</given-names></name></person-group> (<year>2018</year>). <article-title>Non-tuned machine learning approach for hydrological time series forecasting</article-title>. <source>Neural Comput. Appl.</source> <volume>30</volume>, <fpage>1479</fpage>&#x02013;<lpage>1491</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00521-016-2763-0</pub-id></mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>Z.</given-names></name></person-group> (<year>2021</year>). <article-title>Machine learning in hydrology: a review</article-title>. <source>J. Hydrol.</source> <volume>598</volume>:<fpage>126364</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jhydrol.2021.126266</pub-id></mixed-citation>
</ref>
<ref id="B40">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhong</surname> <given-names>Z.</given-names></name> <name><surname>Sun</surname> <given-names>A.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Ren</surname> <given-names>B.</given-names></name></person-group> (<year>2020</year>). <article-title>Predicting field production rates for waterflooding using a machine learning-based proxy model</article-title>. <source>J. Pet. Sci. Eng.</source> <volume>194</volume>:<fpage>107574</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.petrol.2020.107574</pub-id></mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/631577/overview">Alex Sun</ext-link>, The University of Texas at Austin, United States</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2923630/overview">Muhammad Tayyab Naqash</ext-link>, Islamic University of Madinah Faculty of Engineering, Saudi Arabia</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3305174/overview">Hasan Shaheed</ext-link>, Universiti Tenaga Nasional, Malaysia</p>
</fn>
</fn-group>
<fn-group>
<fn fn-type="abbr" id="abbr1"><label>Abbreviations:</label><p>ANN, Artificial Neural Network; TANN, Traditional Artificial Neural Network; CaMa-Flood, Catchment-based Macro-scale Floodplain Model; CAMELS, Catchment Attributes and Meteorology for Large-Sample Studies; Caravan, Large-scale global hydrological database providing standardized time series for comparative research and machine learning modeling; CatBoost, Categorical Boosting; CHIRPS, Climate Hazards Group InfraRed Precipitation with Station Data; CNN, Convolutional Neural Network; ELM, Extreme learning machine; GRDC, Global Runoff Data Centre; H08, Global hydrological model that integrates components of water balance, irrigation, and water use on a planetary scale; IoT, Internet of Things; KGE, Kling&#x02013;Gupta efficiency; LSTM, Long Short-Term Memory; MAE, Mean absolute error; MDPI, Multidisciplinary Digital Publishing Institute; ML, Machine learning; NSE, Nash&#x02013;Sutcliffe efficiency; PRISMA, Preferred Reporting Items for Systematic Reviews and Meta-Analyses; PROSPERO, International Prospective Register of Systematic Reviews; R<sup>2</sup>, Coefficient of determination; RF, Random forests; RMSE, Root Mean Square Error; SVM, Support vector machine; SWAT, Soil and Water Assessment Tool; VIC, Variable Infiltration Capacity Model; XGBoost, Extreme Gradient Boosting.</p></fn></fn-group>
</back>
</article>