<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Remote Sens.</journal-id>
<journal-title>Frontiers in Remote Sensing</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Remote Sens.</abbrev-journal-title>
<issn pub-type="epub">2673-6187</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1622360</article-id>
<article-id pub-id-type="doi">10.3389/frsen.2025.1622360</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Remote Sensing</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Artificial intelligence for groundwater recharge prediction in an arid region: application of tabular deep learning models in the Feija Basin, Morocco</article-title>
<alt-title alt-title-type="left-running-head">Elmotawakkil et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/frsen.2025.1622360">10.3389/frsen.2025.1622360</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Elmotawakkil</surname>
<given-names>Abdessamad</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3054887/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Moumane</surname>
<given-names>Adil</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3054781/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zahi</surname>
<given-names>Assia</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sadiki</surname>
<given-names>Abdelkhalik</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Karkouri</surname>
<given-names>Jamal Al</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Batchi</surname>
<given-names>Mouhcine</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Bhagat</surname>
<given-names>Suraj Kumar</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2843018/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tiyasha</surname>
<given-names>Tiyasha</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Enneya</surname>
<given-names>Nourddine</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Computer Science</institution>, <institution>Faculty of Sciences</institution>, <institution>University Ibn Tofail</institution>, <addr-line>Kenitra</addr-line>, <country>Morocco</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Geography</institution>, <institution>Faculty of Humanities and Social Sciences</institution>, <institution>University Ibn Tofail</institution>, <addr-line>Kenitra</addr-line>, <country>Morocco</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Marwadi University Research Center</institution>, <institution>Department of Civil Engineering</institution>, <institution>Faculty of Engineering &#x26; Technology</institution>, <institution>Marwadi University</institution>, <addr-line>Gujarat</addr-line>, <addr-line>Rajkot</addr-line>, <country>India</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Faculty of Civil Engineering</institution>, <institution>Ton Duc Thang University</institution>, <addr-line>Ho Chi Minh City</addr-line>, <country>Vietnam</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1158924/overview">Romulus Costache</ext-link>, National Institute of Hydrology and Water Management, Romania</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1306238/overview">Salim Heddam</ext-link>, University of Skikda, Algeria</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3066153/overview">Burhan Bezekci</ext-link>, Kilis 7 Aral&#x131;k University, T&#xfc;rkiye</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Suraj Kumar Bhagat, <email>drsurajenv@gmail.com</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>03</day>
<month>09</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>6</volume>
<elocation-id>1622360</elocation-id>
<history>
<date date-type="received">
<day>03</day>
<month>05</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>29</day>
<month>07</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Elmotawakkil, Moumane, Zahi, Sadiki, Karkouri, Batchi, Bhagat, Tiyasha and Enneya.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Elmotawakkil, Moumane, Zahi, Sadiki, Karkouri, Batchi, Bhagat, Tiyasha and Enneya</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Groundwater recharge mapping is crucial for sustainable water resource management in arid and semi-arid regions, particularly in hydro-climatically stressed areas such as the Feija Basin in southeastern Morocco. Characterized by shallow aquifers, irregular rainfall, and over-extraction for agriculture, this region faces increasing groundwater depletion. Recent extreme rainfall events during the 2024&#x2013;2025 season have highlighted both the vulnerability and opportunity for recharge, emphasizing the need for data-driven, proactive strategies.</p>
</sec>
<sec>
<title>Methods</title>
<p>This study introduces a GeoAI-based framework combining remote sensing, geospatial analysis, and advanced artificial intelligence (AI) models to predict optimal groundwater recharge zones. Ten conditioning factors (e.g., elevation, slope, topographic wetness index, NDVI, rainfall, soil permeability, geomorphology) were used to construct the input dataset. Five AI models TabNet, TabTransformer, Multilayer Perceptron (MLP), CatBoost, and AdaBoost were trained and optimized using grid search and particle swarm optimization (PSO). Performance was evaluated using accuracy, AUC-ROC, Cohen&#x2019;s Kappa, and feature importance. Spatial validation was conducted using in-situ borehole data.</p>
</sec>
<sec>
<title>Results</title>
<p>Among the tested models, TabNet achieved the highest performance (accuracy = 97.8%, AUC = 0.99), followed closely by TabTransformer (accuracy = 97.6%). Both models demonstrated strong generalization and produced spatially coherent recharge maps. Predicted optimal zones corresponded with low-lying, vegetated, and permeable areas, aligning with known hydrogeological features.</p>
</sec>
<sec>
<title>Discussion</title>
<p>This study presents a novel application of tabular deep learning models in groundwater science, enhancing the precision and interpretability of recharge zone mapping. The results provide actionable insights for water resource planners, especially in light of recent anomalous hydrological events. The proposed framework supports the development of rainwater harvesting and artificial recharge systems to ensure long-term groundwater sustainability in climate-sensitive areas.</p>
</sec>
</abstract>
<abstract abstract-type="graphical">
<title>Graphical Abstract</title>
<p>
<graphic xlink:href="FRSEN_frsen-2025-1622360_wc_abs.tif">
<alt-text content-type="machine-generated">Workflow diagram illustrating an AI-driven methodology for groundwater analysis. Includes conditioning factors like rainfall and elevation, data maps, and analysis results using TabNet. Displays graphs for factor importance and confusion matrices, with outcomes indicated on geographical maps.</alt-text>
</graphic>
</p>
</abstract>
<kwd-group>
<kwd>machine learning</kwd>
<kwd>groundwater research</kwd>
<kwd>arid region</kwd>
<kwd>TabNet</kwd>
<kwd>Morocco</kwd>
</kwd-group>
<counts>
<page-count count="22"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Data Fusion and Assimilation</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Groundwater is a fundamental component of water security in arid and semi-arid regions, acting as a buffer against the variability and scarcity of surface water resources. A global synthesis of well data reveals rapid declines often exceeding 0.5&#xa0;m/year in dry-region aquifers, underscoring their crucial role in sustaining ecosystems, agriculture, and livelihoods in the absence of reliable rivers or reservoirs (<xref ref-type="bibr" rid="B34">Jasechko et al., 2024</xref>). In Morocco&#x2019;s southern and southeastern provinces, including the Middle Dr&#xe2;a Valley, groundwater similarly underpins agricultural activity, domestic supply, and ecological balance. For example, the Feija watershed is overwhelmingly reliant on pumped groundwater, and intensifying farming and aridity have led to overexploitation of the aquifers (<xref ref-type="bibr" rid="B50">Moumane et al., 2021</xref>).</p>
<p>Although agriculture remains central to the Feija Plain&#x2019;s economy, the shift toward large-scale, export-driven watermelon cultivation has dramatically intensified groundwater pumping. Socio-hydrological research (<xref ref-type="bibr" rid="B14">Bossenbroek et al., 2023</xref>; <xref ref-type="bibr" rid="B24">Fico and Kenti, 2023</xref>; <xref ref-type="bibr" rid="B23">Fico, 2024</xref>; <xref ref-type="bibr" rid="B66">Silva-Novoa S&#xe1;nchez et al., 2025</xref>) confirms that this expansion has not only depleted aquifers but also aggravated social inequities and ecological fragility. Crucially, this over-extraction has diminished the aquifer&#x2019;s natural buffering capacity, making the system highly susceptible to both prolonged drought and episodic floods. Between late 2024 and early 2025, southern Morocco experienced a spate of intense flash floods even as the region faced one of the worst droughts in decades, the most striking being the September 7&#x2013;8, 2024 Atlantic-origin extratropical cyclone that dumped more than a year&#x2019;s worth of rain in only 2&#xa0;days (<xref ref-type="bibr" rid="B52">Moumane et al., 2025</xref>; <xref ref-type="bibr" rid="B19">Egbejule, 2024</xref>; <xref ref-type="bibr" rid="B53">NASA Earth Observatory, 2024</xref>), temporarily filling Lake Iriqui after more than 50&#xa0;years (<xref ref-type="bibr" rid="B52">Moumane et al., 2025</xref>). Yet, despite this dramatic influx, key oases like Ternata remain groundwater-stressed, weakened by persistent extraction pressure and upstream dam regulation. In May 2025, a violent 10-min storm in Zagora Province destroyed fields and thousands of watermelon crops (<xref ref-type="bibr" rid="B25">Freshplaza, 2025</xref>), illustrating that even extreme, short-duration rainfall events fail to recharge deep aquifers without intentional capture and storage systems. These compounding factors highlight the urgent need for targeted infrastructure such as managed aquifer recharge, retention basins, and infiltration ponds to convert episodic floods into reliable groundwater reserves and enhance both water security and agricultural resilience (<xref ref-type="bibr" rid="B51">Moumane et al., 2024</xref>).</p>
<p>Recent studies have shown that deep learning techniques are increasingly used across various scientific fields, including hydrology, physics, and speech recognition (<xref ref-type="bibr" rid="B39">Kheddar, Hemis, and Himeur, 2024</xref>; <xref ref-type="bibr" rid="B69">Tripathy and Mishra, 2024</xref>; <xref ref-type="bibr" rid="B9">Bezekci, 2025</xref>; <xref ref-type="bibr" rid="B11">Bezekci and Kuru, 2025</xref>; <xref ref-type="bibr" rid="B10">Bezek&#xe7;i, 2025</xref>), demonstrating their flexibility and problem-solving potential across disciplines. They have also proven effective in extracting water surfaces from satellite imagery using semantic segmentation models such as U-Net (<xref ref-type="bibr" rid="B20">Elmotawakkil and Enneya, 2025</xref>).</p>
<p>While machine learning techniques have gained considerable attention in hydrogeological studies, most conventional models, such as random forest, support vector machines, or decision trees, are limited in their ability to capture complex, nonlinear interactions among environmental variables (<xref ref-type="bibr" rid="B45">Maity et al., 2024</xref>; <xref ref-type="bibr" rid="B12">Biazar et al., 2025</xref>). These models often rely on predefined feature hierarchies and may struggle to generalize in heterogeneous, data-scarce contexts like arid and semi-arid regions (<xref ref-type="bibr" rid="B13">Borz&#xec;, 2025</xref>). Furthermore, traditional machine learning (ML) approaches frequently lack mechanisms for automated feature selection and spatial awareness, which are critical for accurately delineating recharge zones (<xref ref-type="bibr" rid="B58">Roy et al., 2025</xref>). This gap highlights the need for more sophisticated models capable of learning intricate spatial and hydrological patterns directly from structured data without extensive manual preprocessing.</p>
<p>To address the pressing challenges of groundwater recharge assessment in the Feija Basin, this study presents an integrated GeoAI-based modeling framework. The approach leverages five advanced AI algorithms: TabNet, TabTransformer, MLP, CatBoost, and AdaBoost. Despite the growing availability of geospatial data in structured tabular formats derived from environmental layers such as soil, geomorphology, and hydrology, there remains a significant research gap in applying tabular deep learning models to groundwater recharge prediction, particularly in arid regions. While ML methods have gained traction in hydrogeology (<xref ref-type="bibr" rid="B33">Jari et al., 2023</xref>; <xref ref-type="bibr" rid="B2">Al Atawneh et al., 2024</xref>; <xref ref-type="bibr" rid="B44">Liu et al., 2024;</xref> <xref ref-type="bibr" rid="B60">Sarkar et al., 2024</xref>; <xref ref-type="bibr" rid="B28">Hosseini et al., 2025</xref>), deep learning (DL) architectures like TabNet and TabTransformer are rarely explored in this field. These models offer a distinct advantage in handling high-dimensional, heterogeneous tabular data. Their application in this study represents a novel attempt to adapt state-of-the-art DL techniques to the specific demands of recharge zone mapping in arid, fragile environments such as the Middle Dr&#xe2;a Valley.</p>
<p>This study pursues two principal aims. First, it explores the novel application of tabular DL architectures, specifically TabNet and TabTransformer, for hydrogeological modeling in arid environments, leveraging structured geospatial datasets to predict groundwater recharge zones with enhanced spatial accuracy. These models are systematically evaluated using robust performance metrics and validated against <italic>in situ</italic> borehole data to ensure empirical reliability. Second, the study aims to develop high-resolution groundwater recharge maps capable of identifying priority zones for artificial recharge. These outputs are intended to inform and accelerate the design of strategic water harvesting infrastructure, such as infiltration ponds and recharge basins, particularly in anticipation of increasing numbers of flood events projected under future climate scenarios (<xref ref-type="bibr" rid="B3">Amiha et al., 2024</xref>; <xref ref-type="bibr" rid="B57">Rieder et al., 2025</xref>). By aligning advanced AI techniques with geospatial intelligence, the research provides actionable insights to support sustainable water management and reduce the vulnerability of agriculture, especially watermelon production, in the water-stressed Feija Basin.</p>
</sec>
<sec id="s2">
<title>Related work</title>
<p>Groundwater resources in arid and semi-arid regions are increasingly under pressure due to anthropogenic overuse and climate variability. In southeastern Morocco, particularly the Feija Basin and the wider Middle Dr&#xe2;a Valley, this issue is acute. <xref ref-type="bibr" rid="B42">Lamqadem and Pradhan (2019)</xref> employed multi-temporal Landsat imagery to monitor land use transformations, documenting a shift from traditional pastoralism to agriculture, driven primarily by informal groundwater abstraction. Complementing this, <xref ref-type="bibr" rid="B50">Moumane et al. (2021)</xref> used a combination of remote sensing and geostatistical tools to assess groundwater salinization and drawdown in the Feija region, revealing significant degradation between 2013 and 2018.</p>
<p>Beyond hydrological metrics, sociopolitical studies such as those by <xref ref-type="bibr" rid="B14">Bossenbroek et al. (2023)</xref> and <xref ref-type="bibr" rid="B23">Fico (2024)</xref> have highlighted the role of land commodification, the expansion of commercial crops (e.g., watermelon), and unequal water access in intensifying the groundwater crisis in the region. Although these studies provide critical insights, they predominantly rely on GIS-based multi-criteria evaluation or qualitative assessments, with limited incorporation of predictive, data-driven modeling tools such as machine learning (ML) or deep learning (DL).</p>
<p>In other parts of the world, machine learning and deep learning have been successfully applied to groundwater potential mapping. <xref ref-type="bibr" rid="B54">Nugroho et al. (2024)</xref> evaluated the performance of random forest (RF), support vector machine (SVM), and artificial neural network (ANN) for predicting groundwater zones in West Java, Indonesia, using GIS and remote sensing layers. RF was found to outperform the other models in both accuracy and spatial coherence. <xref ref-type="bibr" rid="B60">Sarkar et al. (2024)</xref> applied a suite of ML models, including ANN and logistic regression, to assess groundwater potential in Bangladesh under climate change scenarios, demonstrating that integrating hydroclimatic variables into the modeling framework enhances spatial prediction accuracy. In Morocco, <xref ref-type="bibr" rid="B56">Ragragui et al. (2024)</xref> compared multiple ML classifiers and concluded that a voting ensemble model yielded the highest predictive accuracy for groundwater potential mapping, underscoring the effectiveness of ensemble strategies in data-scarce arid regions. Similarly, <xref ref-type="bibr" rid="B21">Elmotawakkil et al. (2024)</xref> explored the integration of geospatial data and ML techniques to improve groundwater level prediction and support sustainable water resource management in the Rabat&#x2013;Sal&#xe9;&#x2013;K&#xe9;nitra region.</p>
<p>Recent developments in deep learning have led to the emergence of models tailored specifically for tabular data, such as TabNet and TabTransformer. These architectures address limitations of traditional CNN and LSTM models when applied to non-sequential, structured datasets (<xref ref-type="bibr" rid="B5">Arik and Pfister, 2021</xref>; <xref ref-type="bibr" rid="B30">Huang et al., 2021</xref>) by enabling efficient feature selection and improved interpretability. While DL approaches like ANN have been adopted in recent groundwater studies, most applications continue to focus on conventional ML techniques such as random forest or logistic regression. Few studies attempt to compare these models statistically or explore newer tabular DL frameworks like <xref ref-type="bibr" rid="B32">Igwebuike et al. (2024)</xref>. Moreover, model evaluation remains largely dependent on singular performance metrics such as receiver operating characteristic (ROC)-AUC or accuracy, without multi-criteria decision-making or significance testing. Tools such as the Friedman test and the Technique for Order Preference by Similarity to Ideal Solution (TOPSIS) method, which enable rigorous model comparison and selection, are rarely employed in this context (<xref ref-type="bibr" rid="B73">Yariyan et al., 2021</xref>; <xref ref-type="bibr" rid="B6">Atenidegbe and Mogaji, 2023</xref>). This study introduces TabNet and other advanced models for groundwater potential mapping in the Feija Basin, offering a novel contribution by integrating tabular deep learning with rigorous statistical validation and spatial performance assessment.</p>
<p>In summary, the literature reveals that while GIS- and multi-criteria decision analysis (MCDA)-based approaches are commonly used for groundwater potential mapping in southeastern Morocco, the adoption of machine learning and DL techniques remains limited. International studies highlight the potential of these models, yet they often lack rigorous comparative validation and spatial assessment. To address these gaps, the present study implements and compares five advanced models, including TabNet, TabTransformer, MLP, CatBoost, and AdaBoost, for groundwater potential mapping in the Feija Basin. By integrating spatial accuracy evaluation with robust statistical techniques such as confusion matrices, ROC analysis, the Friedman test, and the TOPSIS ranking method, this study provides a comprehensive and reproducible framework for groundwater assessment in complex arid environments.</p>
</sec>
<sec sec-type="methods" id="s3">
<title>Methodology</title>
<p>This study presents a comprehensive ML pipeline designed to classify groundwater potential zones based on remote sensing and geospatial features. The methodology consists of sequential stages, including data preprocessing, augmentation, feature scaling, model selection, hyperparameter optimization, model training, and performance evaluation <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Methodological flowchart of the AI-driven framework for groundwater potential mapping.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g001.tif">
<alt-text content-type="machine-generated">Flowchart depicting the process of using groundwater conditioning factors to achieve final results. It starts with dataset creation from factors like elevation and rainfall, followed by pre-processing and cleaning. The dataset is split for training, validation, and testing. Model selection involves algorithms like AdaBoost and CatBoost. Hyperparameters are optimized using swarm optimization and grid search. Model training and evaluation are conducted using metrics such as accuracy and F1-score, leading to final results.</alt-text>
</graphic>
</fig>
<sec id="s3-1">
<title>Study area description</title>
<p>The Feija Plain is located in southeastern Morocco within the Middle Dr&#xe2;a Valley (MDV). This region, historically characterized by subsistence agriculture and seasonal pastoralism, is ecologically fragile and climatically arid (<xref ref-type="bibr" rid="B62">Schulz and Manfred, 2013</xref>). It lies along the western flank of the Dr&#xe2;a River near the city of Zagora and forms part of an interconnected oasis system extending over 200&#xa0;km (<xref ref-type="bibr" rid="B36">Karmaoui and Adil, 2016</xref>).</p>
<p>Over the past 2&#xa0;decades, Feija has undergone a rapid transformation toward intensive, export-oriented agriculture (<xref ref-type="bibr" rid="B42">Lamqadem and Pradhan, 2019</xref>). In particular, watermelon farming has emerged as the dominant land use, incentivized by government-subsidized drip irrigation systems and the widespread availability of high-yield hybrid seeds from international agribusinesses (<xref ref-type="bibr" rid="B22">Fico, 2022</xref>; <xref ref-type="bibr" rid="B65">Silva-Novoa S&#xe1;nchez, 2024</xref>). The region&#x2019;s warm winter climate allows for two harvests per season prior to the main production peaks in competing regions, granting it a comparative advantage in the national market (<xref ref-type="bibr" rid="B14">Bossenbroek et al., 2023</xref>).</p>
<p>Hydrogeologically, the Feija Plain is primarily underlain by shallow, unconfined phreatic aquifers hosted in Quaternary alluvial deposits, which have traditionally been accessed through hand-dug wells (<xref ref-type="bibr" rid="B4">Aoubouazza and Elmeknassi, 1996</xref>; <xref ref-type="bibr" rid="B40">Klose, 2013</xref>; <xref ref-type="bibr" rid="B7">Bassin Hydraulique de Souss Massa et de DraaABHSMD Agence du, 2014</xref>). However, the intensification of irrigated agriculture, particularly for high-demand crops such as watermelon, has triggered a dramatic increase in groundwater abstraction. As a result, deep boreholes, often exceeding 100&#xa0;m in depth, are now being drilled into older, confined aquifer systems embedded within Ordovician and Cambrian geological formations. These deep aquifers exhibit low recharge rates due to their lithological composition and structural confinement, rendering them highly vulnerable to overexploitation. The cumulative impact has been a significant decline in piezometric levels, raising critical concerns over long-term aquifer sustainability, ecological degradation, and the socioeconomic viability of agricultural livelihoods in the region (<xref ref-type="bibr" rid="B50">Moumane et al., 2021</xref>; <xref ref-type="bibr" rid="B51">2024</xref>).</p>
<p>The area is also traversed by ephemeral watercourses, including Oued Feija and Oued Boutious, which become active during high-intensity rainfall events. During the 2024&#x2013;2025 hydrological season, both streams experienced significant flash floods <xref ref-type="fig" rid="F2">Figures 2</xref>, <xref ref-type="fig" rid="F3">3</xref>, with at least five episodic flow events recorded. A particularly destructive storm occurred in early May 2025, when torrential rains and hail struck the Feija Plain. This event devastated nearly 4,000 to 5,000 tons of watermelon crops, only 1&#xa0;week before the main harvest. According to field reports, more than 700 farmers lost 90%&#x2013;95% of their production, leading to severe financial distress and widespread concerns about the repayment of agricultural loans (<xref ref-type="bibr" rid="B25">Freshplaza, 2025</xref>). Many cultivation areas were rendered inaccessible due to waterlogged tracks, and no water harvesting or artificial recharge systems were in place to capture the millions of cubic meters of floodwater lost to the desert.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Delineation of the Feija Watershed and ephemeral stream network on Sentinel-2 imagery (18 March 2025). This map delineates the Feija watershed in southeastern Morocco, outlined in red and overlaid on a Sentinel-2 L2A true color image acquired on 18 March 2025. The background satellite imagery illustrates the topographic and land use contrasts. The map highlights the ephemeral stream network (in blue), including Oued El Feija and Oued Bou Tiouas, which are typically dry but become active during flash flood events. Several key localities, such as Lmghader, Bouzkar, and Foum Lachar, are marked. These transient channels played a major role in surface runoff transport during storm events, underscoring the urgent need for floodwater harvesting and aquifer recharge infrastructure in the plain.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g002.tif">
<alt-text content-type="machine-generated">Map highlighting an area in Morocco with ephemeral streams in blue and key localities marked with yellow dots. Towns such as Bouzkar, Argab-n-tal, Foum Lachar, Lmghader, Djinia, and Anagam are labeled within the outlined region. A compass rose indicates direction, and a scale bar is provided for distance measurement. An inset map shows the location within Morocco.</alt-text>
</graphic>
</fig>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Post-flood Sentinel-2 image of the Feija Plain (2 May 2025) depicting agricultural damage following the early May 2025 flash floods. This Sentinel-2 L2A true color image, acquired on 2 May 2025, captures the Feija Plain in the immediate aftermath of severe flash floods that struck the region in early May. The area, including the agricultural zones around the village of Lmghader, was heavily impacted by torrential rains and hail. The ephemeral streams Oued Feija and Oued Boutious, visible as bright sediment-laden channels, overflowed and inundated surrounding farmland. According to field reports, approximately 4,000 to 5,000 tonnes of watermelon were destroyed 1&#xa0;week before harvest, affecting more than 700 farmers who lost up to 95% of their crop. The absence of floodwater retention infrastructure resulted in widespread waterlogging and the total loss of cultivable land parcels across the plain.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g003.tif">
<alt-text content-type="machine-generated">Satellite image showing the area around Lmghader with a desert landscape. Numerous small, dark green agricultural plots are scattered across the terrain. A scale bar at the bottom indicates distances in kilometers, and coordinates are along the edges. A green triangle marks the location of Lmghader.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3-2">
<title>Dataset description</title>
<p>The dataset used in this study integrates both remote sensing-derived features and <italic>in situ</italic> observations to support accurate classification of groundwater potential zones. The <italic>in situ</italic> component consists of field-based groundwater potential assessments or borehole productivity data, which serve as ground-truth labels for supervised machine learning. Predictor variables were extracted from multiple geospatial and satellite data sources, including stream distance, drainage density, soil permeability, rainfall, topographic wetness index (TWI), geomorphology, lineament density, curvature, slope, elevation (DEM), and the Normalized Difference Vegetation Index (NDVI). These features were obtained from processed satellite imagery (e.g., Sentinel-2), digital elevation models (e.g., SRTM), and thematic layers such as geological or hydrological maps. All spatial layers were resampled and reprojected to a common spatial resolution and coordinate system to ensure consistency. After preprocessing and integration, the dataset was formatted as a structured table where each entry corresponds to a geospatial unit associated with the input variables and a labeled groundwater potential class. Summary statistics for all input features, including their mean, standard deviation, minimum, and maximum values, are presented in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Descriptive statistics of input features.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Factors</th>
<th align="right">Mean</th>
<th align="right">Std Dev</th>
<th align="right">Min</th>
<th align="right">Max</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">NDVI</td>
<td align="right">0.0746</td>
<td align="right">0.0425</td>
<td align="right">0.0294</td>
<td align="right">0.3379</td>
</tr>
<tr>
<td align="left">Stream distance</td>
<td align="right">816.4746</td>
<td align="right">799.6260</td>
<td align="right">0.0000</td>
<td align="right">3786.2095</td>
</tr>
<tr>
<td align="left">Soil permeability</td>
<td align="right">1.4568</td>
<td align="right">1.2221</td>
<td align="right">0.0000</td>
<td align="right">3.0000</td>
</tr>
<tr>
<td align="left">Rainfall</td>
<td align="right">92.7709</td>
<td align="right">6.0181</td>
<td align="right">79.5719</td>
<td align="right">98.8845</td>
</tr>
<tr>
<td align="left">TWI</td>
<td align="right">7.3940</td>
<td align="right">2.2004</td>
<td align="right">3.9654</td>
<td align="right">19.4476</td>
</tr>
<tr>
<td align="left">Geomorphology</td>
<td align="right">1.5463</td>
<td align="right">0.8407</td>
<td align="right">1.0000</td>
<td align="right">5.0000</td>
</tr>
<tr>
<td align="left">Lineament density</td>
<td align="right">0.1346</td>
<td align="right">0.3070</td>
<td align="right">0.0000</td>
<td align="right">1.4887</td>
</tr>
<tr>
<td align="left">Curvature</td>
<td align="right">&#x2212;0.0856</td>
<td align="right">0.6359</td>
<td align="right">&#x2212;4.1250</td>
<td align="right">1.9479</td>
</tr>
<tr>
<td align="left">Slope</td>
<td align="right">7.7233</td>
<td align="right">8.6287</td>
<td align="right">0.3428</td>
<td align="right">32.7110</td>
</tr>
<tr>
<td align="left">Elevation</td>
<td align="right">859.9074</td>
<td align="right">186.9025</td>
<td align="right">664.0000</td>
<td align="right">1348.0000</td>
</tr>
</tbody>
</table>
</table-wrap>
<sec id="s3-2-1">
<title>Data preprocessing</title>
<p>The preprocessing workflow began with handling missing values, ensuring consistent data formats, and detecting and removing outliers to improve data quality. The dataset was then partitioned into training (64%), validation (16%), and testing (20%) subsets using stratified sampling to maintain a balanced distribution of groundwater potential classes across all sets.</p>
<p>To address class imbalance and improve model robustness, data augmentation was applied exclusively to the training set. Synthetic samples were generated by injecting Gaussian noise into the original features, with noise parameters constrained within the observed feature ranges. This technique preserved the statistical characteristics of the original data while increasing the diversity of training samples, thereby reducing the risk of overfitting and improving model generalization in underrepresented classes.</p>
<p>Feature scaling was performed using the StandardScaler from Scikit-learn. The scaler was fitted on the training data and then applied consistently to the validation and testing sets to prevent data leakage and ensure uniform scaling across the entire modeling pipeline.</p>
</sec>
<sec id="s3-2-2">
<title>Selection of predictor variables for groundwater modeling</title>
<p>Groundwater recharge is fundamentally controlled by hydrological, hydrogeological, and land-surface characteristics that affect infiltration, flow paths, and storage. We selected ten conditioning factors: elevation, slope, curvature, TWI, soil permeability, geomorphology, rainfall, NDVI, stream distance, and lineament density, based on their established roles in recharge processes and support in recent hydrogeological studies:</p>
<p>Elevation, slope, curvature, and TWI: These topographic indices determine runoff potential and soil moisture accumulation. The use of TWI and slope as recharge proxies is demonstrated in global hydrology models and distributed watershed frameworks (<xref ref-type="bibr" rid="B46">Mathewos et al., 2024</xref>; <xref ref-type="bibr" rid="B55">Patel et al., 2024</xref>; <xref ref-type="bibr" rid="B1">Ajayakumar and Reghunath, 2025</xref>).</p>
<p>Rainfall: As the principal source of recharge, precipitation is universally included in recharge assessments across Indian, African, and Chinese basins (<xref ref-type="bibr" rid="B35">Kaewdum and Chotpantarat, 2021</xref>; <xref ref-type="bibr" rid="B49">Mezali et al., 2025</xref>; <xref ref-type="bibr" rid="B68">Tabassum et al., 2025</xref>).</p>
<p>Soil permeability and geomorphology: Soil texture and landform types strongly influence infiltration rates. These factors have been weighted heavily in analytical hierarchy process (AHP) and MCDA studies (<xref ref-type="bibr" rid="B52">Moumane et al., 2025</xref>).</p>
<p>NDVI and LULC: Vegetation significantly impacts evapotranspiration and soil moisture. Plant cover, estimated via NDVI, is essential in recharge studies (<xref ref-type="bibr" rid="B48">Meng et al., 2024</xref>).</p>
<p>Stream (drainage) distance: Areas close to streams or with low drainage density often indicate greater infiltration potential (<xref ref-type="bibr" rid="B63">Sedghi and Zhan, 2023</xref>).</p>
<p>Lineament density: Fracture and fault frequency control subsurface fluid pathways. High-density lineament zones positively correlate with recharge (<xref ref-type="bibr" rid="B59">Sander, 2007</xref>).</p>
<p>These factors are widely recognized across hydrological literature, from GIS-based MCDA/AHP frameworks to data-driven predictive schemes. <xref ref-type="table" rid="T2">Table 2</xref> includes a detailed summary of each variable&#x2019;s data source, unit type, and hydrological relevance, citing these foundational studies to enhance transparency and methodological robustness.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Groundwater conditioning factors used in the study, along with their data characteristics and hydrological relevance.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Factor</th>
<th align="left">Type</th>
<th align="left">Unit/Class</th>
<th align="left">Source</th>
<th align="left">Hydrological relevance</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Elevation</td>
<td align="left">Continuous</td>
<td align="left">Meters (m)</td>
<td align="left">USGS EarthExplorer (30&#xa0;m)</td>
<td align="left">Governs flow direction and recharge zone location</td>
</tr>
<tr>
<td align="left">Slope</td>
<td align="left">Continuous</td>
<td align="left">Degrees (&#xb0;)</td>
<td align="left">Derived from DEM (USGS)</td>
<td align="left">Influences runoff intensity and infiltration</td>
</tr>
<tr>
<td align="left">Curvature</td>
<td align="left">Continuous</td>
<td align="left">Unitless</td>
<td align="left">Derived from DEM (USGS)</td>
<td align="left">Identifies concave/convex zones affecting accumulation</td>
</tr>
<tr>
<td align="left">TWI</td>
<td align="left">Continuous</td>
<td align="left">Unitless</td>
<td align="left">Derived from DEM (USGS)</td>
<td align="left">Highlights areas of potential saturation</td>
</tr>
<tr>
<td align="left">Soil permeability</td>
<td align="left">Categorical</td>
<td align="left">Low, medium, high</td>
<td align="left">
<xref ref-type="bibr" rid="B51">Moumane et al. (2024)</xref>
</td>
<td align="left">Controls percolation and subsurface infiltration rate</td>
</tr>
<tr>
<td align="left">Geomorphology</td>
<td align="left">Categorical</td>
<td align="left">Landform classes</td>
<td align="left">Topographic maps (El Gloa and Zagora, 1:100,000)</td>
<td align="left">Reflects lithology and terrain influencing recharge</td>
</tr>
<tr>
<td align="left">NDVI</td>
<td align="left">Continuous</td>
<td align="left">0&#x2013;1</td>
<td align="left">Landsat 8<break/>Landsat 9 (30&#xa0;m)</td>
<td align="left">Proxy for vegetation health and evapotranspiration</td>
</tr>
<tr>
<td align="left">Rainfall</td>
<td align="left">Continuous</td>
<td align="left">mm/year</td>
<td align="left">NASA POWER<break/>Local station (Zagora)</td>
<td align="left">Represents direct recharge potential from precipitation</td>
</tr>
<tr>
<td align="left">Stream distance</td>
<td align="left">Continuous</td>
<td align="left">Meters (m)</td>
<td align="left">Derived from DEM and topographic maps</td>
<td align="left">Indicates surface water proximity and indirect recharge zones</td>
</tr>
<tr>
<td align="left">Lineament density</td>
<td align="left">Continuous</td>
<td align="left">km/km<sup>2</sup>
</td>
<td align="left">Derived from DEM (USGS) using GIS</td>
<td align="left">Indicates fractures and pathways aiding infiltration</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s3-3">
<title>Feature selection</title>
<p>To improve model robustness and reduce redundancy in the input space, feature selection was conducted using both linear and nonlinear dependency analyses. First, a Pearson correlation matrix (<xref ref-type="fig" rid="F4">Figure 4</xref>) was computed to identify pairs of features with high collinearity. Features exhibiting strong correlations (i.e., <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mfenced open="|" close="" separators="|">
<mml:mrow>
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mfenced open="|" close="" separators="|">
<mml:mrow>
<mml:mo>&#x3e;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>0.9</mml:mn>
</mml:mrow>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</inline-formula>) were examined, and one feature from each correlated pair was removed to avoid multicollinearity, which can distort model learning and increase variance.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Feature correlation matrix among input variables.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g004.tif">
<alt-text content-type="machine-generated">Correlation matrix with a color scale from -0.5 (purple) to 1.0 (yellow). Variables include NDVI, Stream Distance, Soil Permeability, and others. Diagonal values show perfect correlation (1.0).</alt-text>
</graphic>
</fig>
<p>In parallel, mutual information (MI) was computed between each input feature and the target groundwater potential class to capture nonlinear dependencies <xref ref-type="fig" rid="F5">Figure 5</xref>. Features with low MI scores, indicating weak predictive relevance, were excluded from the final feature set. This dual approach allowed for the retention of variables that were both independent and informative, thereby optimizing the input space used for model training and reducing computational complexity.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Mutual information scores between features and groundwater potential classes.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g005.tif">
<alt-text content-type="machine-generated">Bar chart showing mutual information scores for various features. Slope has the highest score, followed by lineament density and curvature. Other features include elevation, rainfall, soil permeability, stream distance, TWI, NDVI, and geomorphology, with descending scores. The horizontal axis represents the mutual information score, while the vertical axis lists the features.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3-4">
<title>Machine learning and deep learning models</title>
<p>In this study, a combination of traditional ML algorithms and modern DL architectures was employed to classify groundwater potential zones based on a set of geospatial and environmental features. The chosen models were selected to provide a comprehensive comparison between interpretable, efficient classifiers and more complex, representation-learning-based models. Specifically, the ML models used include CatBoost and AdaBoost. These algorithms are known for their robustness, generalization capabilities, and suitability for structured data.</p>
<p>To complement these, three DL models, MLP, TabNet, and TabTransformer, were implemented to evaluate their ability to capture high-order feature interactions and complex patterns. TabNet and TabTransformer are recent architectures designed specifically for tabular data, offering attention-based mechanisms that improve interpretability and learning efficiency. The diversity of models allows for a comprehensive evaluation of predictive performance, computational cost, and interpretability across different learning paradigms.</p>
</sec>
<sec id="s3-5">
<title>AdaBoost classifier</title>
<p>AdaBoost (adaptive boosting) is an ensemble method that combines multiple weak classifiers, typically decision stumps, to form a strong classifier. It improves performance by focusing on the training instances that were previously misclassified. At each iteration, AdaBoost assigns a weight to the weak learner based on its accuracy and updates the weights of the training samples to emphasize difficult examples.</p>
<p>Given a dataset of <inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> samples <inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:mfenced open="{" close="}" separators="|">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</inline-formula>, where <inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mrow>
<mml:mfenced open="{" close="}" separators="|">
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, the final strong classifier <inline-formula id="inf5">
<mml:math id="m5">
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is defined as follows:<disp-formula id="equ1">
<mml:math id="m6">
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>sign</mml:mtext>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>T</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b1;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>where:<list list-type="simple">
<list-item>
<p>&#x2022; <inline-formula id="inf6">
<mml:math id="m7">
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the total number of boosting rounds,</p>
</list-item>
<list-item>
<p>&#x2022; <inline-formula id="inf7">
<mml:math id="m8">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the weak learner at iteration <inline-formula id="inf8">
<mml:math id="m9">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>,</p>
</list-item>
<list-item>
<p>&#x2022; <inline-formula id="inf9">
<mml:math id="m10">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b1;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:mfrac>
<mml:mi>ln</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x3f5;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mrow>
<mml:msub>
<mml:mi>&#x3f5;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the weight assigned to <inline-formula id="inf10">
<mml:math id="m11">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>,</p>
</list-item>
<list-item>
<p>&#x2022; <inline-formula id="inf11">
<mml:math id="m12">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3f5;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the weighted error of <inline-formula id="inf12">
<mml:math id="m13">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</list-item>
</list>
</p>
<p>After each iteration, the weights of the training samples are updated according to their classification outcome, thereby guiding the model to focus on harder-to-classify examples. This adaptive mechanism helps AdaBoost improve the overall prediction accuracy while maintaining good generalization.</p>
<p>AdaBoost has demonstrated robust performance across various classification tasks and has solid theoretical foundations, particularly in reducing both bias and variance (<xref ref-type="bibr" rid="B61">Schapire, 1999</xref>).</p>
</sec>
<sec id="s3-6">
<title>CatBoost</title>
<p>CatBoost is a gradient boosting decision tree (GBDT) algorithm developed to handle categorical features efficiently without extensive preprocessing (<xref ref-type="bibr" rid="B18">Dorogush, Ershov, and Gulin, 2018</xref>). The model constructs an ensemble of decision trees, where each tree <inline-formula id="inf13">
<mml:math id="m14">
<mml:mrow>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> corrects the errors of its predecessors by minimizing a differentiable loss function <inline-formula id="inf14">
<mml:math id="m15">
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>:<disp-formula id="equ2">
<mml:math id="m16">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">F</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold">x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold">F</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold">x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi>&#x3b3;</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold">x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf15">
<mml:math id="m17">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b3;</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the learning rate. CatBoost incorporates ordered boosting and novel techniques to mitigate prediction shift, making it highly effective for heterogeneous tabular datasets with mixed data types.</p>
</sec>
<sec id="s3-7">
<title>Multilayer perceptron (MLP)</title>
<p>MLP is a fundamental DL architecture composed of multiple layers of interconnected neurons, where each neuron applies an affine transformation followed by a nonlinear activation function (<xref ref-type="bibr" rid="B27">Goodfellow, Bengio, and Courville, 2016</xref>). Given an input feature vector <inline-formula id="inf16">
<mml:math id="m18">
<mml:mrow>
<mml:mi mathvariant="bold">x</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi mathvariant="double-struck">R</mml:mi>
<mml:mi>d</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, the hidden layer output <inline-formula id="inf17">
<mml:math id="m19">
<mml:mrow>
<mml:mi mathvariant="bold">h</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is computed as follows:<disp-formula id="equ3">
<mml:math id="m20">
<mml:mrow>
<mml:mi mathvariant="bold">h</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>&#x3c3;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">W</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mi mathvariant="bold">x</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold">b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf18">
<mml:math id="m21">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">W</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf19">
<mml:math id="m22">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are the weight matrix and bias vector, respectively, and <inline-formula id="inf20">
<mml:math id="m23">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mo>&#xb7;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is a nonlinear activation function such as a rectified linear unit (ReLU). This hidden representation is then passed through additional layers or directly to the output layer for final prediction:<disp-formula id="equ4">
<mml:math id="m24">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>&#x3d5;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">W</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mi mathvariant="bold">h</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold">b</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf21">
<mml:math id="m25">
<mml:mrow>
<mml:mi>&#x3d5;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mo>&#xb7;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> denotes the activation function used in the output layer (e.g., softmax for classification or identity for regression). MLPs are powerful function approximators capable of modeling complex nonlinear relationships between input features and target variables.</p>
<sec id="s3-7-1">
<title>TabNet</title>
<p>TabNet is a unified DL architecture that employs a sequential multi-step decision process to enhance both feature selection and the representation of high-dimensional data (<xref ref-type="bibr" rid="B5">Arik and Pfister, 2021</xref>). At each step in the sequence, a D-dimensional feature vector is processed and passed through a Feature Transformer module. This module comprises several layers that may be either shared across all decision steps or uniquely assigned to individual steps. Within each Transformer block, fully connected layers are integrated with batch normalization and gated linear unit (GLU) activations. The GLU is further enhanced with a residual connection followed by normalization, which contributes to maintaining stable variance across the network. This hierarchical structure not only facilitates effective feature selection but also optimizes the model&#x2019;s parameter usage.</p>
<p>At each decision step, TabNet uses an Attentive Transformer to generate a sparse mask that selects relevant features. This mask is computed as follows:<disp-formula id="equ5">
<mml:math id="m26">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold">M</mml:mi>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>Sparsemax</mml:mtext>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold">P</mml:mi>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>&#xb7;</mml:mo>
<mml:msup>
<mml:mi mathvariant="bold">a</mml:mi>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf22">
<mml:math id="m27">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold">P</mml:mi>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> is a learnable projection matrix and <inline-formula id="inf23">
<mml:math id="m28">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold">a</mml:mi>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> is the aggregated context from the previous step. The selected features are element-wise multiplied with the input and passed through a Feature Transformer block, producing outputs <inline-formula id="inf24">
<mml:math id="m29">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold">h</mml:mi>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, which are aggregated over <inline-formula id="inf25">
<mml:math id="m30">
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> steps:<disp-formula id="equ6">
<mml:math id="m31">
<mml:mrow>
<mml:mi mathvariant="bold">z</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>T</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:msup>
<mml:mi mathvariant="bold">h</mml:mi>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>The final prediction is computed as follows:<disp-formula id="equ7">
<mml:math id="m32">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>&#x3c3;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">W</mml:mi>
<mml:mi>o</mml:mi>
</mml:msub>
<mml:mo>&#xb7;</mml:mo>
<mml:mi mathvariant="bold">z</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold">b</mml:mi>
<mml:mi>o</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>This step-wise attention mechanism enables TabNet to focus on the most informative features at each stage, offering both high predictive performance and interpretability for structured datasets.</p>
</sec>
</sec>
<sec id="s3-8">
<title>TabTransformer with self-supervised learning</title>
<p>The TabTransformer is a DL architecture tailored for tabular data, effectively modeling both categorical and numerical features through contextual embeddings and self-attention mechanisms (<xref ref-type="bibr" rid="B30">Huang et al., 2021</xref>). In this framework, each categorical feature <inline-formula id="inf26">
<mml:math id="m33">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is mapped to a dense embedding vector <inline-formula id="inf27">
<mml:math id="m34">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">e</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi mathvariant="double-struck">R</mml:mi>
<mml:mi>d</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, forming an embedding matrix <inline-formula id="inf28">
<mml:math id="m35">
<mml:mrow>
<mml:mi mathvariant="bold">E</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi mathvariant="double-struck">R</mml:mi>
<mml:mrow>
<mml:mi>C</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> for <inline-formula id="inf29">
<mml:math id="m36">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> categorical features:<disp-formula id="equ8">
<mml:math id="m37">
<mml:mrow>
<mml:mi mathvariant="bold">E</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">e</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold">e</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>;</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold">e</mml:mi>
<mml:mi>C</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>These embeddings are processed through Transformer encoder layers utilizing multi-head self-attention to capture inter-feature dependencies. The output embeddings are then concatenated with normalized numerical features <inline-formula id="inf30">
<mml:math id="m38">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">x</mml:mi>
<mml:mtext>num</mml:mtext>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> to form a combined representation <inline-formula id="inf31">
<mml:math id="m39">
<mml:mrow>
<mml:mi mathvariant="bold">h</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>:<disp-formula id="equ9">
<mml:math id="m40">
<mml:mrow>
<mml:mi mathvariant="bold">h</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mtext>Flatten</mml:mtext>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mtext>Transformer</mml:mtext>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold">E</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold">x</mml:mi>
<mml:mtext>num</mml:mtext>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>This representation <inline-formula id="inf32">
<mml:math id="m41">
<mml:mrow>
<mml:mi mathvariant="bold">h</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is subsequently passed through an MLP for downstream tasks such as classification or regression. The architecture supports self-supervised pretraining strategies, including masked feature modeling, to enhance performance on tasks with limited labeled data (<xref ref-type="bibr" rid="B70">Vyas and Bertsimas, 2024</xref>).</p>
</sec>
<sec id="s3-9">
<title>Model optimization</title>
<p>Hyperparameter optimization was critical for maximizing the predictive performance of the models. Two different strategies were applied depending on the model type: grid search for DL models and particle swarm optimization (PSO) for classical ML models.</p>
<sec id="s3-9-1">
<title>Grid search optimization</title>
<p>Grid search (<xref ref-type="bibr" rid="B8">Bergstra and Bengio, 2012</xref>) is a systematic approach that exhaustively explores a manually defined subset of the hyperparameter space. In <xref ref-type="table" rid="T3">Table 3</xref>, grid search was applied to optimize DL models such as TabNet, TabTransformer, and MLP. Although computationally intensive, grid search guarantees the identification of the optimal hyperparameter combination within the predefined grid. It is particularly effective when the search space is moderate in size and model training times are relatively manageable. Cross-validation was used during the search process to ensure the robustness and generalization capability of the selected hyperparameters.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Grid search: hyperparameter ranges and best settings for deep learning models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Model</th>
<th align="left">Hyperparameter</th>
<th align="left">Search space</th>
<th align="left">Best value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="5" align="left">TabNet</td>
<td align="left">n_steps</td>
<td align="left">[3, 5]</td>
<td align="left">3</td>
</tr>
<tr>
<td align="left">n_d, n_a</td>
<td align="left">[8, 16, 32]</td>
<td align="left">32</td>
</tr>
<tr>
<td align="left">gamma</td>
<td align="left">[1.0, 1.3, 1.5]</td>
<td align="left">1.3</td>
</tr>
<tr>
<td align="left">lambda_sparse</td>
<td align="left">[1e-3, 1e-4]</td>
<td align="left">0.0001</td>
</tr>
<tr>
<td align="left">lr</td>
<td align="left">[0.005, 0.01, 0.02]</td>
<td align="left">0.01</td>
</tr>
<tr>
<td rowspan="5" align="left">TabTransformer</td>
<td align="left">num_layers</td>
<td align="left">[1, 2, 3]</td>
<td align="left">1</td>
</tr>
<tr>
<td align="left">num_heads</td>
<td align="left">[2, 4, 8]</td>
<td align="left">2</td>
</tr>
<tr>
<td align="left">hidden_dim</td>
<td align="left">[64, 128, 256]</td>
<td align="left">64</td>
</tr>
<tr>
<td align="left">dropout</td>
<td align="left">[0.1, 0.2, 0.3]</td>
<td align="left">0.1</td>
</tr>
<tr>
<td align="left">lr</td>
<td align="left">[0.0001, 0.001, 0.01]</td>
<td align="left">0.001</td>
</tr>
<tr>
<td rowspan="5" align="left">MLP</td>
<td align="left">hidden_size1</td>
<td align="left">[32, 64, 128]</td>
<td align="left">128</td>
</tr>
<tr>
<td align="left">hidden_size2</td>
<td align="left">[16, 32, 64]</td>
<td align="left">32</td>
</tr>
<tr>
<td align="left">dropout</td>
<td align="left">[0.2, 0.3, 0.4]</td>
<td align="left">0.3</td>
</tr>
<tr>
<td align="left">lr</td>
<td align="left">[0.0001, 0.0005, 0.001]</td>
<td align="left">0.001</td>
</tr>
<tr>
<td align="left">weight_decay</td>
<td align="left">[1e-4, 1e-5]</td>
<td align="left">0.0001</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-9-2">
<title>Swarm optimization</title>
<p>Particle swarm optimization (PSO) (<xref ref-type="bibr" rid="B38">Kennedy and Russell, 1995</xref>) was utilized for classical ML models, including support vector machine (SVM) and AdaBoost. PSO is a nature-inspired metaheuristic algorithm modeled after the collective behavior of bird flocking and fish schooling. It optimizes hyperparameters by initializing a swarm of candidate solutions that move through the search space guided by their own best-known positions and the global best-known position <xref ref-type="table" rid="T4">Table 4</xref>. PSO is particularly advantageous for efficiently exploring large, non-convex, and multi-modal search spaces, offering faster convergence and better avoidance of local minima than grid-based methods.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Swarm optimization: hyperparameter ranges and best settings for machine learning models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Model</th>
<th align="left">Hyperparameter</th>
<th align="left">Search space</th>
<th align="left">Best value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="4" align="left">CatBoost</td>
<td align="left">depth</td>
<td align="left">[4, 5, 6, 7, 8]</td>
<td align="left">7</td>
</tr>
<tr>
<td align="left">learning_rate</td>
<td align="left">[0.01, 0.1]</td>
<td align="left">0.0971</td>
</tr>
<tr>
<td align="left">iterations</td>
<td align="left">[50, 150]</td>
<td align="left">99</td>
</tr>
<tr>
<td align="left">l2_leaf_reg</td>
<td align="left">[1, 2, 3, 4, 5]</td>
<td align="left">2</td>
</tr>
<tr>
<td rowspan="3" align="left">AdaBoost</td>
<td align="left">n_estimators</td>
<td align="left">[50, 150]</td>
<td align="left">150</td>
</tr>
<tr>
<td align="left">learning_rate</td>
<td align="left">[0.01, 0.1]</td>
<td align="left">0.01</td>
</tr>
<tr>
<td align="left">algorithm</td>
<td align="left">[&#x2018;SAMME&#x2019;, &#x2018;SAMME.R&#x2019;]</td>
<td align="left">&#x2018;SAMME.R&#x2032;</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The reason PSO, and more generally, swarm optimization (SO), is often preferred for ML models rather than DL models comes down to efficiency, scalability, and internal training complexity. ML models typically have fewer parameters and faster evaluation cycles, making SO-based tuning more computationally feasible. In contrast, DL models involve expensive gradient-based internal optimization during training, making external swarm-based hyperparameter tuning impractical due to high computational cost and time requirements.</p>
</sec>
</sec>
<sec id="s3-10">
<title>Model evaluation</title>
<p>We employed several standard evaluation metrics to comprehensively assess the performance of the developed classification models, including accuracy, precision, recall (sensitivity), F1-score, specificity, and Cohen&#x2019;s kappa score. These metrics are essential for evaluating both overall and class-wise performance, especially in the presence of class imbalance (<xref ref-type="bibr" rid="B67">Sokolova and Lapalme, 2009</xref>; <xref ref-type="bibr" rid="B15">Chicco and Jurman, 2020</xref>; <xref ref-type="bibr" rid="B41">Kumar and Singh, 2022</xref>).</p>
<p>The following equations define the metrics used:</p>
<p>
<xref ref-type="table" rid="T4">Table 4</xref> evaluation metrics (mathematical definitions).<disp-formula id="equ10">
<mml:math id="m42">
<mml:mrow>
<mml:mtext>Accuracy</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mtext>&#x2009;Precision</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mtext>&#x2009;Recall</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="equ11">
<mml:math id="m43">
<mml:mrow>
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mo>1</mml:mo>
<mml:mo>&#x2010;</mml:mo>
<mml:mtext>Score</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#xb7;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>Precision</mml:mtext>
<mml:mo>&#xb7;</mml:mo>
<mml:mtext>Recall</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>Precision</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mtext>Recall</mml:mtext>
</mml:mrow>
</mml:mfrac>
<mml:mtext>&#x2009;Specificity</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mtext>&#x2009;Kappa</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>o</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>e</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>e</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf33">
<mml:math id="m44">
<mml:mrow>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>o</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the observed accuracy and <inline-formula id="inf34">
<mml:math id="m45">
<mml:mrow>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>e</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the expected accuracy under random chance. Here, <inline-formula id="inf35">
<mml:math id="m46">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf36">
<mml:math id="m47">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf37">
<mml:math id="m48">
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf38">
<mml:math id="m49">
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> denote true positives, true negatives, false positives, and false negatives, respectively. The kappa score evaluates the degree of agreement beyond chance, where a value of <inline-formula id="inf39">
<mml:math id="m50">
<mml:mrow>
<mml:mi>&#x3ba;</mml:mi>
<mml:mo>&#x3e;</mml:mo>
<mml:mn>0.6</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> generally indicates substantial agreement (<xref ref-type="bibr" rid="B47">McHugh, 2012</xref>).</p>
<p>All metrics were computed using weighted averages to accommodate class imbalance, and models were evaluated on both training and testing data to ensure generalization. In addition, receiver operating characteristic (ROC) and precision-recall (PR) curves were plotted to assess classification thresholds and model discrimination capacity (<xref ref-type="bibr" rid="B16">Davis and Goadrich, 2006</xref>).</p>
<sec id="s3-10-1">
<title>Model selection using the Friedman test and TOPSIS</title>
<p>To identify the best-performing ML model among multiple candidates, we adopted a dual evaluation strategy based on (1) the Friedman test with <italic>post hoc</italic> ranking and (2) TOPSIS. These methods were chosen for their robustness in multi-metric and multi-model comparison scenarios, where conventional single-metric evaluations may lead to biased or inconsistent conclusions.</p>
<p>The Friedman test is a nonparametric statistical test used to detect significant differences in the performance rankings of models across multiple metrics or datasets. It does not assume normality and is particularly suitable for ML experiments involving repeated measures. In our case, we applied the Friedman test across six performance metrics (accuracy, recall, specificity, precision, F1-score, and Cohen&#x2019;s kappa) to evaluate six models. A significant test result indicates that at least one model performs differently. If significance is confirmed, <italic>post hoc</italic> analyses (e.g., the Nemenyi test) can identify which models differ significantly (<xref ref-type="bibr" rid="B17">Dem&#x161;ar, 2006</xref>).</p>
<p>The Friedman test was employed in parallel to compare the performance of each model based on multiple evaluation metrics. This test ranks the models by considering their performance across all metrics (classification accuracy, AUC-ROC, Cohen&#x2019;s kappa, and feature importance) and identifies statistically significant differences between them (<xref ref-type="bibr" rid="B31">Hwang and Yoon, 1981</xref>). This approach allows for the selection of the best-performing model without the need for aggregation into a single composite score.</p>
<p>Combining both the Friedman test and TOPSIS allows for statistically grounded, robust, and interpretable model selection. The former ensures that differences are not due to randomness, while the latter facilitates holistic evaluation across all performance aspects.</p>
<p>The proposed methodology integrates advanced data preparation techniques, including cleaning, augmentation, and feature scaling, with tailored optimization strategies adapted to each model type. Deep learning models (TabNet, TabTransformer, and MLP) are fine-tuned using grid search, while machine learning models (CatBoost and AdaBoost) benefit from swarm optimization to efficiently explore large hyperparameter spaces. Finally, model evaluation is conducted using a comprehensive set of metrics to ensure robust and interpretable groundwater potential classification.</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="s4">
<title>Results</title>
<sec id="s4-1">
<title>Groundwater conditioning factors</title>
<p>The spatial distribution of the selected groundwater conditioning factors is illustrated in <xref ref-type="fig" rid="F6">Figures 6</xref>&#x2013;<xref ref-type="fig" rid="F8">8</xref>. These factors, derived from remote sensing and geospatial datasets, were carefully selected based on their relevance to groundwater recharge dynamics in arid and semi-arid environments. Topographic features such as elevation, slope, curvature, and the TWI influence surface runoff, water accumulation, and infiltration capacity. Soil permeability and geomorphological classes reflect lithological and structural controls that govern the percolation of water through subsurface formations. The Normalized Difference Vegetation Index (NDVI) serves as an ecological proxy for vegetation cover, which is often indicative of groundwater availability in shallow aquifers. Hydrological parameters, including rainfall, lineament density, and stream distance, capture climatic inputs and structural pathways that facilitate recharge. Together, these twelve factors provide a comprehensive representation of the hydro-environmental variability across the Feija Basin and form a robust input set for data-driven groundwater potential modeling.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Spatial distribution of four of the ten groundwater conditioning factors used in the study: rainfall, elevation, stream distance, and soil permeability.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g006.tif">
<alt-text content-type="machine-generated">Top left map shows rainfall distribution with high values in dark blue and low in light purple. Top right map depicts elevation with a gradient from red (high) to pink (low). Bottom left map illustrates stream distance with high values in purple and low in red. Bottom right map presents soil permeability, ranging from high in dark blue to very low in gray. Each map is set over a satellite terrain image with scale bars and compass roses.</alt-text>
</graphic>
</fig>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Spatial distribution of four of the ten groundwater conditioning factors used in the study: slope, TWI, drainage density, and NDVI.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g007.tif">
<alt-text content-type="machine-generated">Four maps illustrating topographical and vegetation data of a region. Top-left shows slope values in green to red, high to low. Top-right displays Topographic Wetness Index (TWI) in bright green. Bottom-left presents geomorphology with various colors indicating features like plains and channels. Bottom-right shows NDVI values, with red indicating low vegetation and green for high. Each map has a compass rose, scale bar in kilometers, and legends indicating data ranges.</alt-text>
</graphic>
</fig>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Spatial distribution of two of the ten groundwater conditioning factors used in the study: curvature and lineament density.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g008.tif">
<alt-text content-type="machine-generated">Two side-by-side maps showing lineament density and curvature in a region. The left map highlights areas of high lineament density in red. The right map displays curvature values with varying intensity, predominantly in green and yellow. Both maps include a compass and a scale in kilometers.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s4-2">
<title>Model performance evaluation</title>
<p>All performance results presented in this section are based on the optimal hyperparameter configurations obtained through the tuning procedures outlined in the Methodology section. To ensure a comprehensive evaluation, the classification performance of the five models (TabNet, TabTransformer, MLP, CatBoost, and AdaBoost) was assessed separately on the training and testing datasets. A range of standard evaluation metrics was computed, including accuracy, recall, specificity, precision, F1-score, and Cohen&#x2019;s kappa. <xref ref-type="fig" rid="F9">Figure 9</xref> presents radar plots that visualize and compare the performance of each model across these metrics for both phases, providing clear insight into learning effectiveness and generalization capability.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Radar plots of performance metrics for training (left) and testing (right) sets across all models.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g009.tif">
<alt-text content-type="machine-generated">Two radar charts compare the performance of machine learning models during training and testing. Models include AdaBoost, CatBoost, TabNet, TabTransformer, and MLP. Metrics measured are accuracy, recall, specificity, precision, F1 score, and Kappa. Each model&#x27;s performance is plotted with different colored lines corresponding to each metric. The charts illustrate variations in model performance across different metrics.</alt-text>
</graphic>
</fig>
<p>Overall, TabNet and TabTransformer exhibited superior and consistent performance, attaining high scores across all evaluation metrics during the testing phase. AdaBoost and CatBoost also demonstrated competitive results, whereas MLP displayed moderate performance, reflecting limited generalization capacity.</p>
<p>
<xref ref-type="fig" rid="F10">Figure 10</xref> presents the confusion matrices for each model on the test dataset. TabNet and TabTransformer achieved the most balanced predictions across the three groundwater potential (GWP) classes, misclassifying only a small number of samples. CatBoost also performed reasonably well but showed minor misclassification between Class 2 and Class 3. MLP and especially AdaBoost displayed noticeable confusion, particularly with Class 2 instances being predicted as Class 3.</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>Confusion matrices for each model evaluated on the test set.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g010.tif">
<alt-text content-type="machine-generated">Five confusion matrices compare the performance of CatBoost, MLP, TabNet, TabTransformer, and AdaBoost models. Each matrix shows actual versus predicted classes. The diagonal indicates correct predictions, with CatBoost and TabNet showing higher accuracy, while AdaBoost has more off-diagonal misclassifications.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s4-3">
<title>Receiver operating characteristic (ROC) analysis</title>
<p>To assess the discriminative power of the classifiers beyond accuracy-based metrics, we conducted a ROC analysis using the micro-average AUC approach, suitable for multi-class classification scenarios. <xref ref-type="fig" rid="F11">Figure 11</xref> presents the ROC curves for all models on both training and testing datasets.</p>
<fig id="F11" position="float">
<label>FIGURE 11</label>
<caption>
<p>ROC curves (micro-average) for all models on <bold>(a)</bold> training and <bold>(b)</bold> testing datasets.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g011.tif">
<alt-text content-type="machine-generated">Two ROC curve charts compare the performance of machine learning models. Chart (a) shows TabNet and TabTransformer with AUC of 0.99, MLP and AdaBoost with 0.96, CatBoost with 0.99. Chart (b) shows TabNet and CatBoost with AUC of 0.98, TabTransformer and AdaBoost with 0.97, MLP with 0.96. Dashed lines represent different models.</alt-text>
</graphic>
</fig>
<p>The ensemble-based and DL models (TabNet, TabTransformer, and CatBoost) achieved near-perfect AUC values of 0.99 on both training and testing phases, reflecting excellent separability among the GWP classes. MLP and AdaBoost exhibited slightly lower AUC scores, with values of 0.96 and 0.97 on the test set, respectively. These results corroborate earlier observations from confusion matrices and classification metrics, indicating that TabNet and TabTransformer not only classify accurately but also maintain strong discriminatory performance across all classes.</p>
</sec>
<sec id="s4-4">
<title>Feature influence and model sensitivity</title>
<p>The correlation matrix and mutual information analysis (not shown here) provided insights into the relationships and relevance of input features. These analyses highlighted that factors such as elevation, slope, and soil permeability have a strong influence on GWP classification. Feature importance scores obtained from each model (<xref ref-type="fig" rid="F12">Figure 12</xref>) further confirmed these findings, with elevation consistently ranked as the most influential variable.</p>
<fig id="F12" position="float">
<label>FIGURE 12</label>
<caption>
<p>Feature importance scores across all models.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g012.tif">
<alt-text content-type="machine-generated">Five bar charts display feature importance for different models: AdaBoost, TabNet, TabTransformer, MLP, and CatBoost. Each evaluates nine features, with &#x27;Elevation&#x27; consistently showing the highest importance across models. The importance varies for other features like &#x27;Soil Permeability&#x27;, &#x27;NDVI&#x27;, &#x27;Slope&#x27;, and &#x27;Stream Distance&#x27;.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s4-5">
<title>Groundwater class distribution and spatial mapping</title>
<p>The distribution of predicted groundwater classes across models is visualized in <xref ref-type="fig" rid="F13">Figure 13</xref>. Most models exhibited relatively balanced classifications among the three GWP categories. However, AdaBoost disproportionately predicted Class 3 (42.2%), indicating bias toward higher groundwater potential zones.</p>
<fig id="F13" position="float">
<label>FIGURE 13</label>
<caption>
<p>Percentage distribution of groundwater potential classes for each model on the test set.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g013.tif">
<alt-text content-type="machine-generated">Stacked bar chart comparing five models: TabNet, TabTransformer, MLP, CatBoost, and AdaBoost. Each bar is divided into three classes. Class 1 in blue ranges from 31.8% to 35.1%, Class 2 in green ranges from 26.0% to 32.0%, and Class 3 in gray ranges from 33.1% to 42.2%.</alt-text>
</graphic>
</fig>
<p>The spatial predictions generated by each model are presented in <xref ref-type="fig" rid="F13">Figures 13</xref>, <xref ref-type="fig" rid="F14">14</xref>, <xref ref-type="fig" rid="F15">15</xref>. Models such as TabNet, TabTransformer, and CatBoost produced coherent and geographically consistent patterns that aligned well with known hydrogeological and topographic features of the study area. These models accurately delineated high-potential groundwater zones typically located in low-lying alluvial plains, valley corridors, and areas characterized by high soil permeability and vegetation density features often associated with groundwater accumulation. The spatial transitions between different GWP classes were smooth and well-localized, reflecting each model&#x2019;s capacity to learn complex spatial and geophysical relationships from the input data.</p>
<fig id="F14" position="float">
<label>FIGURE 14</label>
<caption>
<p>Spatial prediction maps of groundwater potential generated by AdaBoost, CatBoost, MLP, and TabTransformer.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g014.tif">
<alt-text content-type="machine-generated">Four maps showing land classification using different machine learning models: TabTransformer, MLP, CatBoost, and AdaBoost. Each map uses color coding&#x2014;gray for low, cyan for medium, and dark blue for high classification areas. Each map includes a scale bar and compass.</alt-text>
</graphic>
</fig>
<fig id="F15" position="float">
<label>FIGURE 15</label>
<caption>
<p>Spatial prediction maps of groundwater potential generated by Tabnet.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g015.tif">
<alt-text content-type="machine-generated">Map highlighting a geographic area with different levels of intensity. A legend indicates &#x22;Low&#x22; in gray, &#x22;Medium&#x22; in light blue, and &#x22;High&#x22; in dark blue. A compass rose shows orientation, and a scale bar displays distance in kilometers.</alt-text>
</graphic>
</fig>
<p>From a technical standpoint, these models exhibited stronger generalization capabilities, benefiting from deep representation learning (TabNet), ensemble-based robustness (TabTransformer), and gradient-boosted refinement (CatBoost). In contrast, MLP and AdaBoost produced noisier and more fragmented spatial outputs. These inconsistencies were particularly evident in transition zones, such as the interfaces between moderate and high GWP areas, where these models often failed to capture subtle environmental gradients. AdaBoost tended to overpredict Class 3 (high potential), generating spatial overestimation and reducing practical utility for hydrogeological planning. These results emphasize the necessity of selecting models that are not only accurate in classification metrics but also capable of preserving spatial coherence and geographic relevance in the context of groundwater potential mapping.</p>
</sec>
<sec id="s4-6">
<title>Statistical comparison and model ranking</title>
<p>Two robust evaluation methods were applied to provide a statistically grounded comparison of model performance: the Friedman test and the TOPSIS ranking method. The Friedman test (<xref ref-type="fig" rid="F16">Figure 16</xref>, left) showed statistically significant differences among models (<inline-formula id="inf40">
<mml:math id="m51">
<mml:mrow>
<mml:msup>
<mml:mi>&#x3c7;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>30.0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>; <inline-formula id="inf41">
<mml:math id="m52">
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>0.001</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>), with TabNet achieving the best average rank (1.00), followed by CatBoost (3.00), TabTransformer (4.00), and MLPr (5.00). AdaBoost ranked the lowest (6.00), confirming its underperformance.</p>
<fig id="F16" position="float">
<label>FIGURE 16</label>
<caption>
<p>Friedman test average ranking (left) and TOPSIS closeness score (right) for all models.</p>
</caption>
<graphic xlink:href="frsen-06-1622360-g016.tif">
<alt-text content-type="machine-generated">Bar charts compare the performance of models. Left chart shows AdaBoost with six, MLP with five, TabTransformer with four, CatBoost with three, TabNet with one. Right chart shows TabNet with one, CatBoost at zero point eight nine, TabTransformer at zero point eight, MLP at zero point two three, AdaBoost at zero.</alt-text>
</graphic>
</fig>
<p>To complement this analysis, the TOPSIS method was employed to evaluate the closeness of each model to the ideal solution across all metrics. The results (<xref ref-type="fig" rid="F16">Figure 16</xref>, right) aligned with the Friedman rankings. TabNet scored highest (1.0000), indicating optimal performance, followed closely by CatBoost (0.8935) and TabTransformer (0.80). MLP and AdaBoost were assigned significantly lower scores, reinforcing their inferior metric consistency.</p>
<p>The aggregated evaluation from both tests is summarized in <xref ref-type="table" rid="T5">Table 5</xref>, where models were qualitatively categorized based on their combined scores.</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Model comparison using TOPSIS score and Friedman test ranking.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Model</th>
<th align="center">TOPSIS score</th>
<th align="center">Friedman Avg. Rank</th>
<th align="center">Performance verdict</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">TabNet</td>
<td align="center">1.0000</td>
<td align="center">1.00</td>
<td align="center">Excellent</td>
</tr>
<tr>
<td align="left">CatBoost</td>
<td align="center">0.8935</td>
<td align="center">3.00</td>
<td align="center">Good</td>
</tr>
<tr>
<td align="left">TabTransformer</td>
<td align="center">0.8016</td>
<td align="center">4.00</td>
<td align="center">Good</td>
</tr>
<tr>
<td align="left">MLP</td>
<td align="center">0.2316</td>
<td align="center">5.00</td>
<td align="center">Moderate</td>
</tr>
<tr>
<td align="left">AdaBoost</td>
<td align="center">0.0000</td>
<td align="center">6.00</td>
<td align="center">Poor</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>
<xref ref-type="table" rid="T5">Table 5</xref> summarizes the integrated ranking of models based on statistical (Friedman) and multi-criteria (TOPSIS) evaluations. TabNet achieved the best overall performance, while AdaBoost was ranked lowest in both methods.</p>
</sec>
</sec>
<sec sec-type="discussion" id="s5">
<title>Discussion</title>
<p>This study systematically evaluated five advanced machine learning and DL models, TabNet, TabTransformer, MLP, CatBoost, and AdaBoost, for predicting groundwater potential zones in the Feija Basin. Among these, TabNet demonstrated superior predictive capabilities. Specifically, it achieved a test accuracy of 97.8%, a recall of 97.8%, and a kappa coefficient of 0.97. TabNet&#x2019;s sparse attention mechanism enabled selective prioritization of relevant features from heterogeneous tabular datasets, thereby enhancing both interpretability and performance (<xref ref-type="bibr" rid="B5">Arik and Pfister, 2021</xref>; <xref ref-type="bibr" rid="B64">Shah et al., 2022</xref>).</p>
<p>The methodological framework was comprehensive and data-driven. A structured dataset was constructed using field sampling and remote sensing-derived features and was subjected to rigorous preprocessing and stratification. Feature relevance and independence were ensured using both linear (Pearson correlation) and nonlinear (mutual information) techniques. DL models were fine-tuned via grid search, while classical models were optimized using PSO. This dual optimization strategy mitigated overfitting while preserving computational efficiency (<xref ref-type="bibr" rid="B72">Wu et al., 2025</xref>).</p>
<p>TabNet&#x2019;s strong performance underscores the promise of tabular DL architectures in environmental modeling (<xref ref-type="bibr" rid="B43">Li et al., 2025</xref>). Compared to MLP, which lacks embedded attention and feature selection capabilities, TabNet effectively captured complex interactions within structured environmental data. While TabTransformer and CatBoost also performed well, their outputs lacked the spatial consistency observed in TabNet.</p>
<p>In terms of interpretability, this study also provides insights into both global and local model behavior. Globally, feature importance scores and mutual information analysis revealed that elevation, slope, and soil permeability were consistently influential across all models. At the local level, models such as TabNet and TabTransformer demonstrated stable and context-aware predictions in transition zones between moderate and high groundwater potential areas. These models were able to respond adaptively to subtle variations in input features, resulting in smoother spatial transitions. This highlights their suitability not only for overall prediction accuracy but also for context-specific decision-making in spatially heterogeneous environments.</p>
<p>Previous groundwater studies in the Feija region, such as those by <xref ref-type="bibr" rid="B51">Moumane et al. (2024)</xref>, primarily employed GIS-based and multi-criteria decision analysis (MCDA) approaches. While effective for integrating thematic layers and expert judgment, these methods generally lack the dynamic learning capacity and predictive accuracy of data-driven models. Additionally, they are inherently static and less responsive to evolving climatic or land use conditions.</p>
<p>This study represents a methodological advance by integrating tabular deep learning with rigorous model evaluation. To date, few studies have simultaneously combined spatial validation and holistic evaluation frameworks (e.g., Friedman and TOPSIS) in a hydrogeologically vulnerable, data-scarce environment like the Feija Basin.</p>
<p>Beyond its methodological contributions, this work addresses a critical issue in the Feija Basin: the sustainable management of rainwater and groundwater resources. By accurately identifying recharge-prone zones, the models offer actionable tools for policymakers and engineers to optimize the allocation and capture of scarce hydrological inputs. Targeting these high-potential zones for the implementation of artificial recharge basins, percolation tanks, subsurface dams, or rainwater harvesting ponds would allow for the strategic retention of stormwater that would otherwise be lost through runoff or deep infiltration. Even partial capture could substantially augment aquifer recharge (<xref ref-type="bibr" rid="B37">Kebede et al., 2024</xref>), particularly in geomorphological zones with favorable permeability characteristics.</p>
<p>From an economic standpoint, improved groundwater recharge would increase irrigation reliability for high-value crops such as watermelon, reduce dependence on costly deep-well pumping, and safeguard yields during drought periods. Additionally, increased groundwater availability would alleviate pressure on potable water systems in rural communities (<xref ref-type="bibr" rid="B26">Gebreslassie et al., 2025</xref>), contributing to economic resilience. This strategy also helps mitigate land degradation, supports ecosystem services, and contributes to the long-term hydrological balance of the basin (<xref ref-type="bibr" rid="B29">Howard et al., 2023</xref>; <xref ref-type="bibr" rid="B71">Woldearegay et al., 2024</xref>). Moreover, the modeling approach enhances institutional capacity by delivering a replicable and interpretable framework that can inform similar groundwater planning efforts across other arid, semi-arid, and drought-prone regions.</p>
<p>Despite its contributions, this study has a few limitations. First, the sparse availability of <italic>in situ</italic> monitoring wells constrains the capacity for comprehensive validation. Second, class imbalance within the training dataset may have impacted model stability, particularly for MLP and AdaBoost.</p>
</sec>
<sec sec-type="conclusion" id="s6">
<title>Conclusion</title>
<p>This study presents a robust GeoAI-based framework for groundwater recharge zone mapping in the Feija Basin, a climate-vulnerable and agriculturally stressed region in southeastern Morocco. By integrating multi-source geospatial data with advanced ML and DL algorithms, the framework achieved high predictive accuracy and spatial consistency. Among the five evaluated models, TabNet exhibited superior performance, accurately delineating recharge-prone zones that closely aligned with known hydrogeological features. The methodology incorporated <italic>in situ</italic> borehole validation, feature importance analysis, and comprehensive evaluation metrics (e.g., accuracy, AUC-ROC, and Cohen&#x2019;s kappa), confirming both the reliability and interpretability of the modeling outputs. The results particularly highlight the strength of tabular DL models, especially TabNet, in capturing complex environmental interactions within structured datasets. The resulting high-resolution recharge potential maps provide actionable insights for groundwater managers and decision-makers, supporting the strategic planning of artificial recharge structures, rainwater harvesting systems, and sustainable land use practices. These tools are especially timely in light of the unusually high rainfall recorded during the 2024&#x2013;2025 hydrological year, offering a critical opportunity to increase aquifer replenishment and improve long-term water resilience.</p>
<p>Looking ahead, future work should incorporate temporal groundwater monitoring, including piezometric time series, to enable dynamic and predictive modeling. The inclusion of socio-economic factors, land use changes, and climate change projections would further improve model realism and policy relevance. Moreover, hybridizing data-driven models with physically based hydrological simulations may enhance interpretability and facilitate scenario-based planning. Collaborating with local stakeholders such as farmers, water authorities, and development agencies will be key to translating technical insights into practical, adaptive groundwater governance. Ultimately, this study contributes to the growing body of evidence supporting the integration of artificial intelligence in groundwater resource assessment, particularly in arid and data-scarce environments.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s7">
<title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. These data can be found here: NA.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>AE: Writing &#x2013; original draft, Data curation, Conceptualization, Writing &#x2013; review and editing. AM: Writing &#x2013; review and editing, Writing &#x2013; original draft, Data curation, Conceptualization. AZ: Writing &#x2013; original draft, Writing &#x2013; review and editing, Visualization, Methodology. AS: Writing &#x2013; review and editing, Writing &#x2013; original draft, Methodology, Visualization. JK: Formal Analysis, Investigation, Writing &#x2013; review and editing, Writing &#x2013; original draft. MB: Writing &#x2013; review and editing, Investigation, Writing &#x2013; original draft, Formal Analysis. SB: Writing &#x2013; review and editing, Investigation, Supervision, Writing &#x2013; original draft. TT: Writing &#x2013; original draft, Formal Analysis, Investigation, Writing &#x2013; review and editing. NE: Writing &#x2013; review and editing, Writing &#x2013; original draft, Supervision, Investigation.</p>
</sec>
<sec sec-type="funding-information" id="s9">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research and/or publication of this article.</p>
</sec>
<ack>
<p>The authors would like to express their sincere gratitude to all contributors who supported the development of this research. Special thanks are extended to the Faculty of Sciences and the Faculty of Humanities and Social Sciences at Ibn Tofail University for providing technical resources and academic guidance. The authors also thank the Marwadi University Research Centre for its valuable methodological input, particularly in the domain of artificial intelligence.</p>
</ack>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s11">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s12">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s13">
<title>Abbreviations</title>
<p>AI, artificial intelligence; ANN, artificial neural network; AUC-ROC, area under the receiver operating characteristic curve; CHIRPS, Climate Hazards Group InfraRed Precipitation with Station Data; DEM, digital elevation model; DL, deep learning; FAO, Food and Agriculture Organization; GeoAI, geospatial artificial intelligence; GIS, geographic information system; GWP, groundwater potential; kappa, Cohen&#x2019;s kappa coefficient; LULC, land use/land cover; MCDA, multi-criteria decision analysis; MDV, Middle Dr&#xe2;a Valley; ML, machine learning; MLP, multilayer perceptron; MODIS, Moderate Resolution Imaging Spectroradiometer; NASA POWER, Prediction of Worldwide Energy Resources (NASA); NDVI, Normalized Difference Vegetation Index; PSO, particle swarm optimization; RF, random forest; SVM, support vector machine; TOPSIS, Technique for Order Preference by Similarity to Ideal Solution; TWI, topographic wetness index; USGS, United States Geological Survey.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ajayakumar</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Reghunath</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Delineation of groundwater recharge zones in lateritic terrains using geospatial techniques</article-title>. <source>Discov. Geosci.</source> <volume>3</volume>, <fpage>6</fpage>. <pub-id pub-id-type="doi">10.1007/s44288-025-00110-z</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Al Atawneh</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Cartwright</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Doble</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Janardhanan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bertone</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2024</year>). &#x201c;<article-title>Predicting groundwater net recharge using machine learning models</article-title>&#x201d;. <pub-id pub-id-type="doi">10.2139/ssrn.4848392</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Amiha</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kabbachi</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ait Haddou</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hamma</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Bouchriti</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Gougueni</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Climate vulnerability and adaptation strategies in the Zagora oasis, southern Morocco: a time series analysis and projection to 2050</article-title>. <source>Theor. Appl. Climatol.</source> <volume>155</volume>, <fpage>9767</fpage>&#x2013;<lpage>9781</lpage>. <pub-id pub-id-type="doi">10.1007/s00704-024-05213-0</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Aoubouazza</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Elmeknassi</surname>
<given-names>Y. E.</given-names>
</name>
</person-group> (<year>1996</year>). &#x201c;<article-title>Hydrologie Et Hydrog&#xe9;ologie Du Bassin de La Feija de Zagora (Province de Ouarzazate)</article-title>,&#x201d; in <source>Maroc: &#xe9;tude sur la lutte contre la d&#xe9;sertification dans la vall&#xe9;e moyenne de l&#x2019;Oued Dr&#xe2;a</source>.</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arik</surname>
<given-names>S. &#xd6;.</given-names>
</name>
<name>
<surname>Pfister</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>TabNet: attentive interpretable Tabular learning</article-title>. <source>Proc. AAAI Conf. Artif. Intell.</source> <volume>35</volume>, <fpage>6679</fpage>&#x2013;<lpage>6687</lpage>. <pub-id pub-id-type="doi">10.1609/aaai.v35i8.16826</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Atenidegbe</surname>
<given-names>O. F.</given-names>
</name>
<name>
<surname>Mogaji</surname>
<given-names>K. A.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Modeling assessment of groundwater vulnerability to contamination risk in a typical basement terrain using TOPSIS-Entropy developed vulnerability data mining technique</article-title>. <source>Heliyon</source> <volume>9</volume> (<issue>7</issue>), <fpage>e18371</fpage>. <pub-id pub-id-type="doi">10.1016/j.heliyon.2023.e18371</pub-id>
<pub-id pub-id-type="pmid">37539304</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<collab>Bassin Hydraulique de Souss Massa et de Draa, ABHSMD Agence du</collab> (<year>2014</year>). &#x201c;<article-title>Etude Hydrologique de La Nappe de La Feija</article-title>.&#x201d; <comment>Morocco: Agence du Bassin Hydraulique de Souss Massa et de Draa</comment>.</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bergstra</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bengio</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Random search for hyper-parameter optimization</article-title>. <source>J. Mach. Learn. Res.</source> <volume>13</volume>, <fpage>281</fpage>&#x2013;<lpage>305</lpage>. <comment>JMLR</comment>.</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bezekci</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Deep learning-enhanced regularization of irregular traveling pulses in the FitzHugh-Nagumo model</article-title>. <source>SN Comput. Sci.</source> <volume>6</volume>, <fpage>206</fpage>. <pub-id pub-id-type="doi">10.1007/s42979-025-03752-5</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bezek&#xe7;i</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>The refined physics-informed neural networks for nonlinear convection-reaction-diffusion equations using exponential schemes</article-title>. <source>Black Sea J. Eng. Sci.</source> <volume>8</volume>, <fpage>7</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.34248/bsengineering.1645207</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bezekci</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Kuru</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Deep learning-based approach for modeling threshold curves</article-title>. <source>Alexandria Eng. J.</source> <volume>129</volume>, <fpage>40</fpage>&#x2013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1016/j.aej.2025.05.072</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Biazar</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Golmohammadi</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Nedhunuri</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Shaghaghi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mohammadi</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Artificial intelligence in hydrology: advancements in soil, water resource management, and sustainable development</article-title>. <source>Sustainability</source> <volume>17</volume> (<issue>5</issue>), <fpage>2250</fpage>. <pub-id pub-id-type="doi">10.3390/su17052250</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Borz&#xec;</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Modeling groundwater resources in data-scarce regions for sustainable management: methodologies and limits</article-title>. <source>Hydrology</source> <volume>12</volume> (<issue>1</issue>), <fpage>11</fpage>. <pub-id pub-id-type="doi">10.3390/hydrology12010011</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bossenbroek</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ftouhi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Kadiri</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Kuper</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Watermelons in the desert in Morocco: struggles around a groundwater commons-in-the-making</article-title>. <source>Water Altern.</source> <volume>16</volume> (<issue>February</issue>), <fpage>87</fpage>&#x2013;<lpage>107</lpage>.</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chicco</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Jurman</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The advantages of the Matthews Correlation Coefficient (MCC) over F1 Score and accuracy in binary classification evaluation</article-title>. <source>BMC Genomics</source> <volume>21</volume> (<issue>1</issue>), <fpage>6</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-019-6413-7</pub-id>
<pub-id pub-id-type="pmid">31898477</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Davis</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Goadrich</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2006</year>). &#x201c;<article-title>The relationship between precision-recall and ROC curves</article-title>,&#x201d; in <source>Proceedings of the 23rd international conference on machine learning (ICML)</source>, <fpage>233</fpage>&#x2013;<lpage>240</lpage>. <pub-id pub-id-type="doi">10.1145/1143844.1143874</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dem&#x161;ar</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Statistical comparisons of classifiers over multiple data sets</article-title>. <source>J. Mach. Learn. Res.</source> <volume>7</volume> (<issue>Jan</issue>), <fpage>1</fpage>&#x2013;<lpage>30</lpage>.</citation>
</ref>
<ref id="B18">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Dorogush</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Ershov</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Gulin</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). &#x201c;<article-title>CatBoost: gradient boosting with categorical features support</article-title>,&#x201d; in <source>Proceedings of the workshop on ML systems at NeurIPS</source>. <pub-id pub-id-type="doi">10.48550/arXiv.1810.11363</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Egbejule</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Dramatic images show the first floods in the sahara in half a century</article-title>. <source>Guard</source>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.theguardian.com/environment/2024/oct/11/dramatic-images-show-the-first-floods-in-the-sahara-in-half-a-century">https://www.theguardian.com/environment/2024/oct/11/dramatic-images-show-the-first-floods-in-the-sahara-in-half-a-century</ext-link>.</comment>
</citation>
</ref>
<ref id="B20">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Elmotawakkil</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Enneya</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2025</year>). &#x201c;<article-title>Boosting artificial intelligence performance in Sentinel-2 imagery analysis: a DL approach for water bodies detection</article-title>,&#x201d; in <source>Remote sensing and GIS techniques in hydrology</source>. Editors <person-group person-group-type="editor">
<name>
<surname>Batchi,</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Moumane</surname>
<given-names>A.</given-names>
</name>
</person-group> (<publisher-loc>Hershey, PA</publisher-loc>: <publisher-name>IGI Global</publisher-name>), <fpage>133</fpage>&#x2013;<lpage>152</lpage>. <pub-id pub-id-type="doi">10.4018/979-8-3693-9651-3.ch005</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Elmotawakkil</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sadiki</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Enneya</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Predicting groundwater level based on remote sensing and machine learning: a case study in the Rabat-K&#xe9;nitra region</article-title>. <source>J. Hydroinformatics</source> <volume>26</volume> (<issue>10</issue>), <fpage>2639</fpage>&#x2013;<lpage>2667</lpage>. <pub-id pub-id-type="doi">10.2166/hydro.2024.494</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Fico</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2022</year>). <source>Watering the desert, draining the oasis: navigating drought, development, and irrigation politics in the draa Valley, Morocco</source>. <comment>Master&#x27;s thesis. Syracuse: Syracuse University. Available online at: <ext-link ext-link-type="uri" xlink:href="https://surface.syr.edu/thesis/693/">https://surface.syr.edu/thesis/693/</ext-link>
</comment>.</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fico</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Frontiers of fortune: mobilising land, water, and collective identity for watermelon production in Southeastern Morocco</article-title>. <source>
<italic>J. North Afr. Stud.</italic> Sept.</source>, <fpage>1</fpage>&#x2013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.1080/13629387.2024.2404952</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fico</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kenti</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Living on luck: the story behind Zagora&#x2019;s watermelons</article-title>. <source>Heinrich B&#xf6;ll Stift. Rabat Maroc</source>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://ma.boell.org/fr/node/1283">https://ma.boell.org/fr/node/1283</ext-link>.</comment>
</citation>
</ref>
<ref id="B25">
<citation citation-type="web">
<collab>Freshplaza</collab> (<year>2025</year>). <article-title>A storm hits Zagora and destroys watermelon plantations</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.freshplaza.com/north-america/article/9728581/a-storm-hits-zagora-and-destroys-watermelon-plantations/">https://www.freshplaza.com/north-america/article/9728581/a-storm-hits-zagora-and-destroys-watermelon-plantations/</ext-link>.</comment>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gebreslassie</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Berhane</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Gebreyohannes</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Hagos</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hussien</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Walraevens</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Water harvesting and groundwater recharge: a comprehensive review and synthesis of Current practices</article-title>. <source>Water</source> <volume>17</volume>, <fpage>976</fpage>. <pub-id pub-id-type="doi">10.3390/w17070976</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Goodfellow</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Bengio</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Courville</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). <source>Deep learning</source>. <publisher-name>MIT Press</publisher-name>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.deeplearningbook.org/">https://www.deeplearningbook.org/</ext-link>.</comment>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hosseini</surname>
<given-names>F. S.</given-names>
</name>
<name>
<surname>Jafari</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zandi</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Alesheikh</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Rezaie</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Groundwater potential mapping using optimized decision tree-based ensemble learning model with local and global explainability</article-title>. <source>Water</source> <volume>17</volume> (<issue>10</issue>), <fpage>1520</fpage>. <pub-id pub-id-type="doi">10.3390/w17101520</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Howard</surname>
<given-names>J. K.</given-names>
</name>
<name>
<surname>Dooley</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Brauman</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Klausmeyer</surname>
<given-names>K. R.</given-names>
</name>
<name>
<surname>Rohde</surname>
<given-names>M. M.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Ecosystem services produced by groundwater dependent ecosystems: a framework and case Study in California</article-title>. <source>Front. Water</source> <volume>5</volume>, <fpage>1115416</fpage>. <pub-id pub-id-type="doi">10.3389/frwa.2023.1115416</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Khetan</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cvitkovic</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Karnin</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>TabTransformer: tabular data modeling using contextual embeddings</article-title>. <source>Proc. AAAI Conf. Artif. Intell.</source> <volume>35</volume>, <fpage>5669</fpage>&#x2013;<lpage>76</lpage>.</citation>
</ref>
<ref id="B31">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hwang</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Yoon</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>1981</year>). <source>Multiple attribute decision making: methods and applications</source>. <publisher-name>Springer-Verlag</publisher-name>.</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Igwebuike</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Ajayi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Okolie</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Kanyerere</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Todd</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Application of machine learning and deep learning for predicting groundwater levels in the West Coast Aquifer System, South Africa</article-title>. <source>Earth Sci. Inf.</source> <volume>18</volume> (<issue>1</issue>), <fpage>6</fpage>. <pub-id pub-id-type="doi">10.1007/s12145-024-01623-w</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jari</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bachaoui</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Hajaj</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Khaddari</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Khandouch</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>El Harti</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Investigating machine learning and ensemble learning models in groundwater potential mapping in arid Region: case Study from Tan-Tan water-scarce Region, Morocco</article-title>. <source>Front. Water</source> <volume>5</volume>, <fpage>1305998</fpage>. <pub-id pub-id-type="doi">10.3389/frwa.2023.1305998</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jasechko</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Seybold</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Perrone</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shamsudduha</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Taylor</surname>
<given-names>R. G.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Rapid groundwater decline and some cases of recovery in aquifers globally</article-title>. <source>Nature</source> <volume>625</volume> (<issue>7996</issue>), <fpage>715</fpage>&#x2013;<lpage>721</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-023-06879-8</pub-id>
<pub-id pub-id-type="pmid">38267682</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kaewdum</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Chotpantarat</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Mapping potential zones for groundwater recharge using a GIS technique in the lower khwae hanuman sub-basin area, prachin Buri Province, Thailand</article-title>. <source>Front. Earth Sci.</source> <volume>9</volume>, <fpage>717313</fpage>. <pub-id pub-id-type="doi">10.3389/feart.2021.717313</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Karmaoui</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Adil</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Changes in the environmental vulnerability of Oasean System (Desert oasis), pilot Study in middle draa Valley, Morocco</article-title>. <source>Expert Opin. Environ. Biol.</source> <volume>5</volume> (<issue>January</issue>). <pub-id pub-id-type="doi">10.4172/2325-9655.1000135</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kebede</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mekonnen</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Clement</surname>
<given-names>T. P.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Enhancing groundwater recharge through nature-based solutions: benefits and barriers</article-title>. <source>Hydrology</source> <volume>11</volume>, <fpage>195</fpage>. <pub-id pub-id-type="doi">10.3390/hydrology11110195</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kennedy</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Russell</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>1995</year>). &#x201c;<article-title>Particle swarm optimization</article-title>,&#x201d;<source>Proc. ICNN&#x2019;95 - Int. Conf. Neural Netw</source>, <volume>4</volume>, <fpage>1942</fpage>&#x2013;<lpage>1948</lpage>. <pub-id pub-id-type="doi">10.1109/ICNN.1995.488968</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kheddar</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hemis</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Himeur</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Automatic speech recognition using advanced Deep Learning Approaches: a Survey</article-title>. <source>Inf. Fusion</source> <volume>109</volume>, <fpage>102422</fpage>. <pub-id pub-id-type="doi">10.1016/j.inffus.2024.102422</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Klose</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2013</year>). <source>Regional hydrogeology and groundwater budget modeling in the arid middle draa catchment (South-Morocco)</source>. <publisher-loc>Bonn, Germany</publisher-loc>: <publisher-name>Universit&#xe4;ts- und Landesbibliothek Bonn</publisher-name>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://bonndoc.ulb.uni-bonn.de/xmlui/handle/20.500.11811/5752">https://bonndoc.ulb.uni-bonn.de/xmlui/handle/20.500.11811/5752</ext-link>.</comment>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kumar</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Performance evaluation metrics for machine learning classification models: a comparative analysis</article-title>. <source>Int. J. Sci. Res. Comput. Sci.</source> <volume>10</volume> (<issue>1</issue>).</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lamqadem</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pradhan</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Pradhan</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2019</year>). &#x201c;<article-title>Long-term monitoring of transformation from pastoral to agricultural land use using time-series landsat data in the feija Basin Southeast Morocco</article-title>.&#x201d; <source>
<italic>Earth Syst. Environ.</italic> 3</source>. <volume>3</volume>, <fpage>525</fpage>, <lpage>538</lpage>. <pub-id pub-id-type="doi">10.1007/s41748-019-00110-3</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bian</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>HSDT-TabNet: a dual-path deep learning model for severity grading of soybean frogeye leaf spot</article-title>. <source>Agronomy</source> <volume>15</volume>, <fpage>1530</fpage>. <pub-id pub-id-type="doi">10.3390/agronomy15071530</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Enhancing groundwater recharge prediction: a feature selection-based Deep Forest model with bayesian optimisation</article-title>. <source>Hydrol. Process.</source> <volume>38</volume>, <fpage>e15309</fpage>. <pub-id pub-id-type="doi">10.1002/hyp.15309</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maity</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Srivastava</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sarkar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Khan</surname>
<given-names>M. I.</given-names>
</name>
</person-group> (<year>2024</year>). &#x201c;<article-title>Revolutionizing the future of hydrological science: impact of machine learning and deep learning amidst emerging explainable AI and transfer learning</article-title>.&#x201d; <source>Appl. Comput. Geosciences</source> <volume>24</volume>: <fpage>100206</fpage>. <pub-id pub-id-type="doi">10.1016/j.acags.2024.100206</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mathewos</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Abate</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Dadi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mathewos</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Evaluation of the groundwater prospective Zone by coupling hydro-meteorological and geospatial evidence in Wabe River catchment omo Gibe River Basin, Ethiopia</article-title>. <source>Water Cycle</source> <volume>5</volume>, <fpage>37</fpage>&#x2013;<lpage>58</lpage>. <pub-id pub-id-type="doi">10.1016/j.watcyc.2024.01.002</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McHugh</surname>
<given-names>M. L.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Interrater reliability: the Kappa statistic</article-title>. <source>Biochem. Medica</source> <volume>22</volume> (<issue>3</issue>), <fpage>276</fpage>&#x2013;<lpage>282</lpage>. <pub-id pub-id-type="doi">10.11613/bm.2012.031</pub-id>
<pub-id pub-id-type="pmid">23092060</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Meng</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Khan</surname>
<given-names>M. I.</given-names>
</name>
<name>
<surname>Naqvi</surname>
<given-names>S. A. A.</given-names>
</name>
<name>
<surname>Sarwar</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Islam</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ali</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Identification and mapping of groundwater recharge zones using multi influencing factor and analytical hierarchy process</article-title>. <source>Sci. Rep.</source> <volume>14</volume>, <fpage>19240</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-024-70324-7</pub-id>
<pub-id pub-id-type="pmid">39164369</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mezali</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Chetibi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Naima</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Derdour</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Benmamar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Almohamad</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2025</year>). <article-title>Enhancing groundwater recharge assessment in mediterranean regions: a comparative Study using analytical hierarchy process and fuzzy analytical hierarchy process integrated with geographic information systems for the algiers watershed</article-title>. <source>Sustainability</source> <volume>17</volume>, <fpage>3242</fpage>. <pub-id pub-id-type="doi">10.3390/su17073242</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moumane</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>El Ghazali</surname>
<given-names>F. E.</given-names>
</name>
<name>
<surname>Jamal</surname>
<given-names>Al K.</given-names>
</name>
<name>
<surname>Delorme</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Batchi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chafiki</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Monitoring spatiotemporal variation of groundwater level and salinity under land use change using integrated field measurements, GIS, geostatistical, and remote-sensing approach: case Study of the feija aquifer, middle draa watershed, Moroccan Sahara</article-title>. <source>Environ. Monit. Assess.</source> <volume>193</volume> (<issue>December</issue>), <fpage>769</fpage>. <pub-id pub-id-type="doi">10.1007/s10661-021-09581-2</pub-id>
<pub-id pub-id-type="pmid">34735624</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moumane</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Enajar</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>El Ghazali</surname>
<given-names>F. E.</given-names>
</name>
<name>
<surname>Khouz</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ahmed</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Jamal</surname>
<given-names>Al K.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>GIS, remote sensing, and analytical hierarchy Process (AHP) approach for rainwater harvesting site selection in arid regions: feija Plain case Study, Zagora (Morocco)</article-title>. <source>Appl. Geomatics</source> <volume>16</volume> (<issue>September</issue>), <fpage>861</fpage>&#x2013;<lpage>880</lpage>. <pub-id pub-id-type="doi">10.1007/s12518-024-00585-4</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moumane</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bahouq</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ahmed</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Laghfiri</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Mohamed</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Karkouri</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2025</year>). <article-title>Lake iriqui&#x2019;s remarkable revival: field observations and a Google Earth engine analysis of its recovery after over half a century of desiccation</article-title>. <source>Land</source> <volume>14</volume> (<issue>1</issue>), <fpage>104</fpage>. <pub-id pub-id-type="doi">10.3390/land14010104</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="web">
<collab>NASA Earth Observatory</collab> (<year>2024</year>). <article-title>A deluge for the Sahara</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://earthobservatory.nasa.gov/images/153320/a-deluge-for-the-sahara">https://earthobservatory.nasa.gov/images/153320/a-deluge-for-the-sahara</ext-link>.</comment>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nugroho</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Indah Lestari</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gustiandi</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Sofan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Suwarsono</surname>
<given-names>I. P.</given-names>
</name>
<name>
<surname>Rahmi</surname>
<given-names>K. I. N.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). &#x201c;<article-title>Groundwater potential mapping using machine learning approach in West Java, Indonesia</article-title>.&#x201d; <source>Groundw. Sustain. Dev.</source> <volume>27</volume>: <fpage>101382</fpage>. <pub-id pub-id-type="doi">10.1016/j.gsd.2024.101382</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Patel</surname>
<given-names>D. K.</given-names>
</name>
<name>
<surname>Thakur</surname>
<given-names>T. K.</given-names>
</name>
<name>
<surname>Thakur</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Karuppannan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Swamy</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Pant</surname>
<given-names>R. R.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Groundwater potential Zone mapping using AHP and geospatial techniques in the upper Narmada Basin, central India</article-title>. <source>Discov. Sustain.</source> <volume>5</volume>, <fpage>355</fpage>. <pub-id pub-id-type="doi">10.1007/s43621-024-00560-4</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ragragui</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Aouragh</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>El-Hmaidi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ouali</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Saouita</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Iallamen</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). &#x201c;<article-title>Mapping and modeling groundwater potential using machine learning, deep learning and ensemble learning models in the saiss Basin (Fez-Meknes Region, Morocco)</article-title>.&#x201d; <source>Groundw. Sustain. Dev.</source> <volume>26</volume>: <fpage>101281</fpage>. <pub-id pub-id-type="doi">10.1016/j.gsd.2024.101281</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rieder</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Aemisegger</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Dente</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Armon</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Meteorological ingredients of heavy precipitation and subsequent lake-filling episodes in the northwestern Sahara</article-title>. <source>Hydrology Earth Syst. Sci.</source> <volume>29</volume>, <fpage>1395</fpage>&#x2013;<lpage>1427</lpage>. <pub-id pub-id-type="doi">10.5194/hess-29-1395-2025</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roy</surname>
<given-names>D. K.</given-names>
</name>
<name>
<surname>Kumar Sarkar</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Hossain Munmun</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Paul</surname>
<given-names>C. R.</given-names>
</name>
<name>
<surname>Datta</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>A review on the applications of machine learning and deep learning to groundwater salinity modeling: present status, challenges, and future directions</article-title>. <source>Discov. Water</source> <volume>5</volume>, <fpage>16</fpage>. <pub-id pub-id-type="doi">10.1007/s43832-025-00207-z</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sander</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Lineaments in groundwater exploration: a review of applications and limitations</article-title>. <source>Hydrogeology J.</source> <volume>15</volume>, <fpage>71</fpage>&#x2013;<lpage>74</lpage>. <pub-id pub-id-type="doi">10.1007/s10040-006-0138-9</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sarkar</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Rudra</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Talukdar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chandra Das</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sadmin Nur</surname>
<given-names>Md.</given-names>
</name>
<name>
<surname>Alam</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Future groundwater potential mapping using machine learning algorithms and climate change scenarios in Bangladesh</article-title>. <source>Sci. Rep.</source> <volume>14</volume> (<issue>1</issue>), <fpage>10328</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-024-60560-2</pub-id>
<pub-id pub-id-type="pmid">38710767</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Schapire</surname>
<given-names>R. E.</given-names>
</name>
</person-group> (<year>1999</year>). &#x201c;<article-title>A brief introduction to boosting</article-title>,&#x201d; in <source>International joint conference on artificial intelligence (IJCAI)</source>, <fpage>1401</fpage>&#x2013;<lpage>1406</lpage>.</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schulz</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Manfred</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2013</year>). &#x201c;<article-title>IMPETUS Atlas Morocco (digital versions in English and French)</article-title>,&#x201d;<source>Unknown</source> Editors <person-group person-group-type="editor">
<name>
<surname>Schulz,</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Judex</surname>
<given-names>M.</given-names>
</name>
</person-group>, <pub-id pub-id-type="doi">10.1594/PANGAEA.821918</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sedghi</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Zhan</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Groundwater mounding due to recharge from ephemeral streams</article-title>. <source>Adv. Water Resour.</source> <volume>174</volume>, <fpage>104421</fpage>. <pub-id pub-id-type="doi">10.1016/j.advwatres.2023.104421</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shah</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Enhanced TabNet: attentive interpretable tabular learning for hyperspectral image classification</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <fpage>716</fpage>. <pub-id pub-id-type="doi">10.3390/rs14030716</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Silva-Novoa S&#xe1;nchez</surname>
<given-names>L. M.</given-names>
</name>
</person-group> (<year>2024</year>). <source>Water governance challenges in the middle dr&#xe2;a Valley of Morocco: analysing policies, practices and conflict</source>. <comment>Doctoral dissertation. Rheinland-Pf&#x00E4;lzische Technische Universit&#x00E4;t Kaiserslautern-Landau.</comment>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Silva-Novoa S&#xe1;nchez</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Schilling</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bossenbroek</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ezzayyat</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Berger</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Drivers of conflict over customary land in the Middle Dr&#xe2;a Valley of Morocco</article-title>. <source>World Dev.</source> <volume>188</volume>, <fpage>106872</fpage>. <pub-id pub-id-type="doi">10.1016/j.worlddev.2024.106872</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sokolova</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lapalme</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>A systematic analysis of performance measures for classification tasks</article-title>. <source>Inf. Process. and Manag.</source> <volume>45</volume> (<issue>4</issue>), <fpage>427</fpage>&#x2013;<lpage>437</lpage>. <pub-id pub-id-type="doi">10.1016/j.ipm.2009.03.002</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tabassum</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sajjad</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sajid</surname>
<given-names>G. H.</given-names>
</name>
<name>
<surname>Ahmad</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Iqbal</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Khan</surname>
<given-names>A. H. A.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Assessing recharge zones for groundwater potential in Dera Ismail Khan (Pakistan): a GIS-Based analytical hierarchy process approach</article-title>. <source>Water</source> <volume>17</volume>, <fpage>1586</fpage>. <pub-id pub-id-type="doi">10.3390/w17111586</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tripathy</surname>
<given-names>K. P.</given-names>
</name>
<name>
<surname>Mishra</surname>
<given-names>A. K.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Deep learning in hydrology and water resources disciplines: concepts, methods, applications, and research directions</article-title>. <source>J. Hydrology</source> <volume>628</volume>, <fpage>130458</fpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2023.130458</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vyas</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bertsimas</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Deep learning with tabular data: a self-supervised approach</article-title>. <source>arXiv</source>. <pub-id pub-id-type="doi">10.48550/arXiv.2401.15238</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Woldearegay</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Grum</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Hessel</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Van Steenbergen</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Fleskens</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yazew</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Watershed management, groundwater recharge and drought resilience: an integrated approach to adapt to rainfall variability in Northern Ethiopia</article-title>. <source>Int. Soil Water Conservation Res.</source> <volume>12</volume>, <fpage>663</fpage>&#x2013;<lpage>683</lpage>. <pub-id pub-id-type="doi">10.1016/j.iswcr.2023.08.009</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2025</year>). <article-title>Predicting groundwater level dynamics and evaluating the impact of the south-to-north water diversion Project using stacking ensemble learning</article-title>. <source>Sustainability</source> <volume>17</volume>, <fpage>6120</fpage>. <pub-id pub-id-type="doi">10.3390/su17136120</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yariyan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Avand</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Omidvar</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Pham</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Linh</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Tiefenbacher</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Optimization of statistical and machine learning hybrid models for groundwater potential mapping</article-title>. <source>Geocarto Int.</source> <volume>36</volume> (<issue>February</issue>), <fpage>3877</fpage>&#x2013;<lpage>3911</lpage>. <pub-id pub-id-type="doi">10.1080/10106049.2020.1870164</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>