<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="discussion" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1599826</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2025.1599826</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Opinion</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>From bites to bytes: understanding how and why individual malaria risk varies using artificial intelligence and causal inference</article-title>
<alt-title alt-title-type="left-running-head">Ribeiro et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fgene.2025.1599826">10.3389/fgene.2025.1599826</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Ribeiro</surname>
<given-names>Ad&#xe8;le Helena</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2748177/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Soler</surname>
<given-names>J&#xfa;lia M. P.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/67420/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Corder</surname>
<given-names>Rodrigo M.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3059892/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes">
<name>
<surname>Ferreira</surname>
<given-names>Marcelo U.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1868266/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes">
<name>
<surname>Heider</surname>
<given-names>Dominik</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/59798/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Institute of Medical Informatics</institution>, <institution>University of M&#xfc;nster</institution>, <addr-line>M&#xfc;nster</addr-line>, <country>Germany</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Institute of Mathematics and Statistics</institution>, <institution>University of S&#xe3;o Paulo</institution>, <addr-line>S&#xe3;o Paulo</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Institute of Biomedical Sciences</institution>, <institution>University of S&#xe3;o Paulo</institution>, <addr-line>S&#xe3;o Paulo</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Institute of Hygiene and Tropical Medicine and Global Health and Tropical Medicine Research Center</institution>, <institution>NOVA University of Lisbon</institution>, <addr-line>Lisbon</addr-line>, <country>Portugal</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/991531/overview">Kenta Nakai</ext-link>, The University of Tokyo, Japan</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2268958/overview">Andrija Tomovic</ext-link>, Novartis, Bulgaria</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Marcelo U. Ferreira, <email>muferrei@usp.br</email>; Dominik Heider, <email>dominik.heider@uni-muenster.de</email>
</corresp>
<fn fn-type="equal" id="fn001">
<label>
<sup>&#x2020;</sup>
</label>
<p>These authors share last authorship</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>16</day>
<month>05</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1599826</elocation-id>
<history>
<date date-type="received">
<day>25</day>
<month>03</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>30</day>
<month>04</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Ribeiro, Soler, Corder, Ferreira and Heider.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Ribeiro, Soler, Corder, Ferreira and Heider</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>With an estimated 263 million cases recorded worldwide in 2023, malaria remains a major global health challenge, particularly in tropical regions with limited healthcare access. Beyond its health impact, malaria disrupts education, economic development, and social equality. While traditional research has focused on biological factors underlying human-mosquito interactions, growing evidence highlights the complex interplay of environmental, behavioral, and socioeconomic factors, alongside mobility and both human and parasite genetics, in shaping transmission dynamics, recurrence patterns, and control effectiveness. This work shows how integrating Artificial Intelligence (AI), Machine Learning (ML), and Causal Inference can advance malaria research by identifying context-specific risk factors, uncovering causal mechanisms, and informing more effective, targeted interventions. Drawing on the M&#xe2;ncio Lima cohort, a longitudinal, multimodal study of malaria risk in Brazil&#x2019;s main urban hotspot, and related studies in the Amazon, we highlight how rigorous, data-driven approaches can address the substantial variability in malaria risk across individuals and communities. AI-driven methods facilitate the integration of diverse high-dimensional datasets to uncover intricate patterns and improve individual risk stratification. Federated learning enables collaborative analysis across regions while preserving data privacy. Meanwhile, causal discovery and effect identification tools further strengthen these approaches by distinguishing genuine causal relationships from spurious associations. Together, these approaches offer a principled, scalable, and privacy-preserving framework that enables researchers to move beyond predictive modeling toward actionable causal insights. This shift supports precision public health strategies tailored to vulnerable populations, fostering more equitable and sustainable malaria control and contributing to the reduction of the global malaria burden.</p>
</abstract>
<kwd-group>
<kwd>artificial intelligence</kwd>
<kwd>causality</kwd>
<kwd>causal modelling</kwd>
<kwd>malaria</kwd>
<kwd>infectious diseases</kwd>
<kwd>public health</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Computational Genomics</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Malaria remains a major health challenge, particularly in tropical and subtropical regions facing poverty, limited healthcare access, and harsh environments, such as the Amazon rainforest. In 2023, an estimated 263 million malaria cases occurred across 83 countries and territories &#x2013; 37 million more than in 2015 (<xref ref-type="bibr" rid="B48">World Health Organization, 2024</xref>). Conflicts, humanitarian crises, climate change, drug and insecticide resistance, and resource constraints are among the threats to malaria control efforts.</p>
<p>
<italic>P. falciparum</italic> predominates in sub-Saharan Africa, causing the most severe form of human malaria (<xref ref-type="bibr" rid="B35">Poespoprodjo et al., 2023</xref>). <italic>P. vivax</italic> is the most geographically widespread parasite, responsible for over 80% of infections in the Amazon and causing recurrent infections. Malaria&#x2019;s impact extends beyond health, disrupting education, hindering economic growth, straining healthcare systems, and perpetuating poverty. Effective control is crucial for public health, equity and global prosperity, requiring a shift from the traditional human-mosquito transmission model to a broader understanding of biological, environmental, and socioeconomic factors.</p>
<p>We take as an example the M&#xe2;ncio Lima cohort study, which focuses on urban malaria in the Brazilian Amazon (<xref ref-type="bibr" rid="B22">Johansen et al., 2021</xref>). Approximately 20% of households in M&#xe2;ncio Lima, Brazil&#x2019;s primary urban hotspot near the Peruvian border, were randomly selected from census data, resulting in 2,774 participants tested for malaria parasites during seven cross-sectional surveys (2018&#x2013;2021) using conventional microscopy and highly sensitive, species-specific molecular techniques (<xref ref-type="bibr" rid="B41">Rodrigues et al., 2024</xref>). The study gathered data on demographics, health, housing conditions, occupation, lifestyle, and mobility, alongside blood samples for human genetics research, including genome-wide association studies.</p>
<p>Complementary longitudinal studies across Latin America have investigated the genomic diversity of <italic>P. vivax</italic> and <italic>P. falciparum</italic> (<xref ref-type="bibr" rid="B11">de Oliveira et al., 2020</xref>; <xref ref-type="bibr" rid="B4">Cabrera-Sosa et al., 2024</xref>; <xref ref-type="bibr" rid="B24">Kattenberg et al., 2024</xref>). Conducted in both urban and rural areas around M&#xe2;ncio Lima (2018&#x2013;2021) and the Peruvian Amazon (2007&#x2013;2020), these studies support integrative genomic surveillance to track transmission intensity, imported cases, and drug resistance markers. By linking human and parasite data across diverse settings, these efforts support research on malaria dynamics and the evolution of key traits, such as virulence, resistance, and local adaptation, while accounting for ecological and socio-demographic variation.</p>
<p>The M&#xe2;ncio Lima cohort has yielded several insights (<xref ref-type="bibr" rid="B10">Corder et al., 2019</xref>; <xref ref-type="bibr" rid="B9">Corder et al., 2020b</xref>; <xref ref-type="bibr" rid="B11">de Oliveira et al., 2020</xref>; <xref ref-type="bibr" rid="B7">Corder et al., 2023</xref>; <xref ref-type="bibr" rid="B41">Rodrigues et al., 2024</xref>). Of 11,730 samples screened using molecular methods, 4.0% were positive for <italic>P. vivax</italic> and 0.9% for <italic>P. falciparum</italic>, whereas standard microscopy detected much lower rates (0.4% for <italic>P. vivax</italic> and 0.2% for <italic>P. falciparum</italic>) (<xref ref-type="bibr" rid="B41">Rodrigues et al., 2024</xref>). Despite the low prevalence, <italic>P. vivax</italic> infections were recurrent (<xref ref-type="bibr" rid="B8">Corder et al., 2020a</xref>; <xref ref-type="bibr" rid="B7">Corder et al., 2023</xref>), with model simulations indicating that 20% of individuals at highest risk of infection accounted for 86% of the infection burden (<xref ref-type="bibr" rid="B9">Corder et al., 2020b</xref>). This highlights that malaria burden is often heterogeneously distributed within communities, following the 20/80 rule, where approximately 20% of individuals carry 80% of infections (<xref ref-type="bibr" rid="B7">Corder et al., 2023</xref>). Adult men face the highest risk (<xref ref-type="bibr" rid="B10">Corder et al., 2019</xref>), and most laboratory-confirmed infections were asymptomatic (<xref ref-type="bibr" rid="B41">Rodrigues et al., 2024</xref>). Human mobility between urban and rural areas appears to sustain malaria transmission (<xref ref-type="bibr" rid="B21">Johansen et al., 2020</xref>). Additionally, genetic analyses of <italic>P. vivax</italic> revealed diverse, spatially and temporally structured lineages, highlighting heterogeneous transmission dynamics across different settings (<xref ref-type="bibr" rid="B11">de Oliveira et al., 2020</xref>; <xref ref-type="bibr" rid="B24">Kattenberg et al., 2024</xref>). In contrast, <italic>P. falciparum</italic> exhibited lower genetic diversity and stronger temporal clustering, indicating localized and time-limited transmission (<xref ref-type="bibr" rid="B4">Cabrera-Sosa et al., 2024</xref>).</p>
<p>Despite these heterogeneities, malaria prevalence in Mancio Lima declined significantly from 2018 to 2021, likely due to extensive control and treatment efforts, including widespread indoor residual spraying, distribution of insecticide-treated bed nets, active case testing, and free treatment programs. Sustaining and advancing this progress requires improved identification of high-risk groups for optimizing resource distribution and implementing tailored interventions. A key challenge is understanding why some individuals repeatedly contract <italic>P. vivax</italic> while others remain uninfected. Clinically, such recurrences can lead to severe complications, including anemia, particularly among vulnerable groups, such as children and pregnant women (<xref ref-type="bibr" rid="B34">Pincelli et al., 2021</xref>). Economically, this heterogeneity complicates policy design. The 20/80 rule suggests that targeting high-risk individuals could maximize impact (<xref ref-type="bibr" rid="B7">Corder et al., 2023</xref>). Additionally, malaria has emerged as a zoonotic threat. <italic>P. simium</italic>, a parasite of non-human primates, has caused infections in humans in southeastern Brazil, where <italic>P. vivax</italic> is rare (<xref ref-type="bibr" rid="B12">de Oliveira et al., 2021a</xref>; <xref ref-type="bibr" rid="B13">b</xref>). Distinguishing between human and zoonotic parasites is critical for evaluating interventions and preparing for future outbreaks.</p>
<p>To elucidate the multifaceted dynamics underlying malaria risk, we propose a synergistic integration of AI, ML, and causal inference. This combination enables not only the identification of high-risk groups but also the discovery of causal mechanisms driving individual variability in malaria susceptibility. By leveraging cutting-edge methods, we can move beyond predictive modeling toward causal understanding, thereby informing the development of optimized, targeted interventions. Our approach relies on the integration of high-dimensional, multimodal datasets such as those from the Mancio Lima cohort and other regional studies &#x2013; including data on malaria episodes, clinical, behavioral, socioeconomic, environmental, and genetic factors. This rich data landscape enables the identification of structured patterns and interpretable representations that explain malaria risk and transmission dynamics. Causal inference methods that account for latent confounding and selection bias are essential to distinguish causal drivers from spurious associations, enabling robust estimation of intervention effects under real-world conditions. Ultimately, this framework will support precision public health by ensuring that prevention, control, and treatment strategies are both timely and tailored to those most at risk, maximizing impact and equity (<xref ref-type="bibr" rid="B25">Khoury et al., 2015</xref>).</p>
</sec>
<sec id="s2">
<title>Bridging AI and causality for targeted malaria interventions</title>
<p>AI and ML have driven significant advancements in medicine and public health (<xref ref-type="bibr" rid="B28">MacEachern and Forkert, 2021</xref>) due to their ability to model complex relationships and uncover subtle patterns in high-dimensional, heterogeneous datasets. These methods have been successfully applied across various medical domains (<xref ref-type="bibr" rid="B45">Theodosiou and Read, 2023</xref>), including infectious disease research, such as AMR prediction (<xref ref-type="bibr" rid="B36">Ren et al., 2022</xref>), zoonotic disease detection (<xref ref-type="bibr" rid="B37">Ren et al., 2024</xref>), and biomarker discovery in malaria (<xref ref-type="bibr" rid="B23">Jung et al., 2023</xref>).</p>
<p>In malaria research, AI and ML provide powerful tools to disentangle complex, often hidden dependency structures and enable precise individual risk stratification. The pipeline (<xref ref-type="fig" rid="F1">Figure 1</xref>) begins with data collection and preprocessing, crucial for multimodal, heterogeneous, and sensitive data such as genomic and socio-behavioral information. Ensuring data privacy and quality through anonymization, harmonization, imputation, and normalization &#x2013; while following FAIR principles (Findable, Accessible, Interoperable, Reusable) (<xref ref-type="bibr" rid="B26">Kush et al., 2020</xref>) &#x2013; is essential for robust model development. In multi-center studies, federated learning supports privacy-preserving collaboration by enabling joint analysis without exchanging raw data (<xref ref-type="bibr" rid="B29">McMahan et al., 2017</xref>; <xref ref-type="bibr" rid="B43">Tajabadi et al., 2023</xref>; <xref ref-type="bibr" rid="B44">Tajabadi et al., 2024</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>AI and Causal Inference Pipeline for Targeted Intervention Design in Malaria Research. The pipeline begins with Data Collection and Preprocessing, including anonymization, harmonization, and normalization of multimodal, multi-center data. In Data Integration, federated multi-view representation learning generates low-dimensional embeddings that capture both within- and cross-modal patterns while maintaining data privacy. Predictive Feature Selection uncovers latent risk profiles and selects interpretable features that predict malaria risk both globally and within specific subgroups. Finally, Causal Inference and Intervention Design applies causal discovery to reveal mechanisms underlying the selected features &#x2013; e.g., treatment regimens, prior infection history, genetic predispositions, bed net usage, healthcare access, urban vs. rural residence, and proximity to mosquito breeding sites. Causal effect estimation tools then quantify the (conditional) impact of specific interventions (e.g., increasing healthcare access, personalizing treatments, or implementing targeted screening) from observational data, supporting precision public health strategies for effective malaria prevention, treatment, and control.</p>
</caption>
<graphic xlink:href="fgene-16-1599826-g001.tif"/>
</fig>
<p>Multi-view representation learning approaches, such as multimodal variational autoencoders, enable data integration by generating low-dimensional latent embeddings that retain modality-specific features while capturing cross-modal dependencies (<xref ref-type="bibr" rid="B17">Guo et al., 2019</xref>). Clustering these embeddings can reveal subgroups of individuals with shared but not directly observed risk profiles, shaped by common exposures or susceptibilities (<xref ref-type="bibr" rid="B20">Jaeger et al., 2023</xref>). This step can be enriched through co-clustering, which jointly identifies groups of individuals and co-varying variables, highlighting context-specific drivers of malaria vulnerability (<xref ref-type="bibr" rid="B16">Govaert and Nadif, 2013</xref>). Moreover, federated representation learning and clustering (<xref ref-type="bibr" rid="B49">Zhang et al., 2023</xref>; <xref ref-type="bibr" rid="B32">Pedrycz, 2021</xref>) support robust and generalizable predictions across distributed, heterogeneous datasets. To enhance interpretability and inform downstream modeling, cluster-aware feature selection (<xref ref-type="bibr" rid="B47">Wang and Allen, 2021</xref>) identifies both globally predictive variables and those particularly informative within specific subgroups. These selected features and representations are then used to predict individual malaria risk, forming a cohesive and interpretable AI-driven framework for risk assessment.</p>
<p>While essential, high predictive accuracy alone is not sufficient to uncover the underlying data-generating mechanisms or support meaningful, actionable interventions. This is particularly true in biomedical and epidemiological research, where data are largely observational and vulnerable to multiple sources of bias. In malaria research, for example, unmeasured factors such as socio-economic status, mobility patterns, or environmental exposures can confound associations between risk factors and outcomes. Selection bias is also widespread due to underreporting, especially in remote regions or among asymptomatic individuals. If not properly addressed, these biases can reinforce existing health disparities and lead to interventions that are ineffective or even harmful.</p>
<p>Causal inference provides a principled framework to uncover cause-and-effect relationships and mitigate the impact of bias in observational studies (<xref ref-type="bibr" rid="B31">Pearl, 2009</xref>). It enables the estimation of the effect of interventions with a level of rigor comparable to randomized controlled trials. Several approaches exist, including the Potential Outcomes Framework (<xref ref-type="bibr" rid="B42">Rubin, 1974</xref>), Causal Machine Learning (<xref ref-type="bibr" rid="B46">van der Laan and Rubin, 2006</xref>; <xref ref-type="bibr" rid="B15">Feuerriegel et al., 2024</xref>), and Instrumental Variables (<xref ref-type="bibr" rid="B2">Angrist et al., 1996</xref>), also known in genetics as Mendelian Randomization (<xref ref-type="bibr" rid="B18">Haycock et al., 2016</xref>; <xref ref-type="bibr" rid="B40">Ribeiro et al., 2016</xref>). However, these frameworks rely on strong, sometimes unverifiable assumptions &#x2013; such as the absence of latent confounding or availability of valid instruments &#x2013; which are often violated in real-world settings.</p>
<p>In response, data-driven causal discovery methods within Pearl&#x2019;s framework have emerged as robust alternatives. Algorithms such as Fast Causal Inference (FCI) (<xref ref-type="bibr" rid="B50">Zhang, 2008</xref>) and its variants can recover causal structures directly from observational data, even in the presence of unmeasured confounding and selection bias. Notably, AnchorFCI (<xref ref-type="bibr" rid="B38">Ribeiro et al., 2024</xref>) enhances robustness and discovery power by strategically selecting and integrating reliable anchor variables &#x2013; such as genetic variants &#x2013; that are known not to be influenced by the variables of interest (e.g., clinical or sociodemographic factors). These methods infer a Partial Ancestral Graph (PAG) representing causal relationships shared across all models supported by the data, thus revealing the true data-generating processes. This enables the identification of key factors &#x2013; e.g., use of insecticide-treated bed nets, housing conditions, or access to healthcare &#x2013; that causally influence malaria risk and can be targeted by interventions. By applying causal effect identification algorithms to the resulting PAG, we can then quantify the isolated or combined impact of specific interventions, based solely on observational data (<xref ref-type="bibr" rid="B33">Perkovi&#x0107; et al., 2018</xref>; <xref ref-type="bibr" rid="B19">Jaber et al., 2022</xref>). This fully data-driven causal pipeline supports the development of more robust, transparent, and socially responsible interventions, providing a clearer pathway for addressing malaria risk in diverse settings.</p>
<p>A key strength of constraint-based causal discovery approaches such as FCI and its variants lies in their flexibility to account for mixed-type variables and complex dependency structures by adapting conditional independence tests. This is particularly important for analyzing malaria datasets, which typically comprise a mix of continuous, ordinal, categorical, and count variables, along with non-independent observations arising from genetic relatedness, repeated measures, household clustering, and spatial correlations. Conditional independence tests that account for such complexities can be constructed using generalized mixed models, which incorporate structured covariance and random effects to model known or inferred dependencies (<xref ref-type="bibr" rid="B39">Ribeiro and Soler, 2020</xref>). These tests can also be extended to federated learning settings, enabling collaborative, privacy-preserving causal discovery. Furthermore, causal discovery at the level of variable clusters &#x2013; either predefined or learned through representation learning and clustering &#x2013; can yield more interpretable insights into the interactions among biological, behavioral, and environmental risk factors for malaria (<xref ref-type="bibr" rid="B1">Anand et al., 2023</xref>).</p>
</sec>
<sec sec-type="discussion" id="s3">
<title>Discussion</title>
<p>Progress toward malaria elimination in regions such as the Amazon requires a deep understanding of the intricate factors driving infection risk and recurrence. The M&#xe2;ncio Lima cohort and regional studies offer a unique opportunity to uncover malaria dynamics by combining comprehensive data on human hosts, parasites, and their environments. However, the inherent complexity and heterogeneity of these datasets demand analytical frameworks that extend beyond traditional epidemiological or statistical approaches.</p>
<p>By integrating AI, ML, and causal inference, we move toward a more holistic strategy that not only accurately identifies high-risk individuals but also elucidates the causal mechanisms underlying malaria transmission and infection. This shift from descriptive and predictive modeling to causal reasoning enables the development of optimized, targeted interventions and lays the foundation for precision public health strategies that are not only more effective but also more equitable. Federated learning further supports this approach by enabling collaborative analysis across diverse regions without compromising data privacy. Together, these methodologies empower local health systems to respond more precisely and efficiently and contribute meaningfully to global control efforts.</p>
</sec>
</body>
<back>
<sec sec-type="author-contributions" id="s4">
<title>Author contributions</title>
<p>AR: Formal Analysis, Writing &#x2013; original draft, Methodology, Investigation, Conceptualization, Writing &#x2013; review and editing. JS: Conceptualization, Investigation, Resources, Writing &#x2013; review and editing. RC: Resources, Conceptualization, Investigation, Methodology, Writing &#x2013; review and editing, Formal Analysis, Writing &#x2013; original draft, Data curation. MF: Resources, Data curation, Supervision, Methodology, Investigation, Conceptualization, Writing &#x2013; original draft, Funding acquisition, Writing &#x2013; review and editing. DH: Writing &#x2013; review and editing, Project administration, Conceptualization, Supervision, Writing &#x2013; original draft, Funding acquisition, Investigation, Visualization.</p>
</sec>
<sec sec-type="funding-information" id="s5">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work was financially supported by the German Federal Ministry of Education and Research (BMBF) [01DN24022] (MalariAI). The M&#xe2;ncio Lima cohort study has been supported by the Funda&#xe7;&#xe3;o de Amparo &#xe0; Pesquisa do Estado de S&#xe3;o Paulo (FAPESP), Brazil (2016/18740&#x2013;9 and 2022/11963-3), the National Institutes of Health (grant U19 AI089681), and the Funda&#xe7;&#xe3;o para a Ci&#xea;ncia e Tecnologia, Portugal (institutional GHTM project UID/04413/2020 and LA-REAL LA/P/0117/2020). The Conselho Nacional de Desenvolvimento Cient&#xed;fico e Tecnol&#xf3;gico (CNPq), Brazil, provides a senior research scholarship to MF We acknowledge support from the Open Access Publication Fund of the University of M&#x00FC;nster.</p>
</sec>
<sec sec-type="COI-statement" id="s6">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
<p>The author(s) declared that they were an editorial board member of Frontiers, at the time of submission. This had no impact on the peer review process and the final decision.</p>
</sec>
<sec sec-type="ai-statement" id="s7">
<title>Generative AI statement</title>
<p>The authors declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s8">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anand</surname>
<given-names>T. V.</given-names>
</name>
<name>
<surname>Ribeiro</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bareinboim</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Causal effect identification in cluster DAGs</article-title>. <source>Proc. AAAI Conf. Artif. Intell.</source> <volume>37</volume> (<issue>10</issue>), <fpage>12172</fpage>&#x2013;<lpage>12179</lpage>. <pub-id pub-id-type="doi">10.1609/aaai.v37i10.26435</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Angrist</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Imbens</surname>
<given-names>G. W.</given-names>
</name>
<name>
<surname>Rubin</surname>
<given-names>D. B.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Identification of causal effects using instrumental variables</article-title>. <source>J. Am. Stat. Assoc.</source> <volume>91</volume> (<issue>434</issue>), <fpage>444</fpage>&#x2013;<lpage>455</lpage>. <pub-id pub-id-type="doi">10.2307/2291629</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Bareinboim</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Correa</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Ibeling</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Icard</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2022</year>). &#x201c;<article-title>On Pearl&#x2019;s hierarchy and the foundations of causal inference</article-title>,&#x201d; in <source>Probabilistic and causal inference: the works of Judea Pearl</source>, <fpage>507</fpage>&#x2013;<lpage>556</lpage>.</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cabrera-Sosa</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Nolasco</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Kattenberg</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Fernandez-Mi&#xf1;ope</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Valdivia</surname>
<given-names>H. O.</given-names>
</name>
<name>
<surname>Barazorda</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Genomic surveillance of malaria parasites in an indigenous community in the Peruvian Amazon</article-title>. <source>Sci. Rep.</source> <volume>14</volume>, <fpage>16291</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-024-66925-x</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Corder</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Arez</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>M. U.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Individual variation in <italic>Plasmodium vivax</italic> malaria risk: are repeatedly infected people just unlucky?</article-title> <source>PLOS Neglected Trop. Dis.</source> <volume>17</volume> (<issue>1</issue>), <fpage>e0011020</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pntd.0011020</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Corder</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>de Lima</surname>
<given-names>A. C. P.</given-names>
</name>
<name>
<surname>Khoury</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Docken</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Davenport</surname>
<given-names>M. P.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>M. U.</given-names>
</name>
</person-group> (<year>2020a</year>). <article-title>Quantifying and preventing <italic>Plasmodium vivax</italic> recurrences in primaquine-untreated pregnant women: an observational and modeling study in Brazil</article-title>. <source>PLOS Neglected Trop. Dis.</source> <volume>14</volume> (<issue>7</issue>), <fpage>e0008526</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pntd.0008526</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Corder</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>M. U.</given-names>
</name>
<name>
<surname>Gomes</surname>
<given-names>M. G. M.</given-names>
</name>
</person-group> (<year>2020b</year>). <article-title>Modelling the epidemiology of residual <italic>Plasmodium vivax</italic> malaria in a heterogeneous host population: a case study in the Amazon Basin</article-title>. <source>PLOS Comput. Biol.</source> <volume>16</volume> (<issue>3</issue>), <fpage>e1007377</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1007377</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Corder</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Paula</surname>
<given-names>G. A.</given-names>
</name>
<name>
<surname>Pincelli</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>M. U.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Statistical modeling of surveillance data to identify correlates of urban malaria risk: a population-based study in the Amazon Basin</article-title>. <source>PLOS ONE</source> <volume>14</volume> (<issue>8</issue>), <fpage>e0220980</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0220980</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>de Oliveira</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Corder</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Early</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Rodrigues</surname>
<given-names>P. T.</given-names>
</name>
<name>
<surname>Ladeia-Andrade</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Alves</surname>
<given-names>J. M. P.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Population genomics reveals the expansion of highly inbred <italic>Plasmodium vivax</italic> lineages in the main malaria hotspot of Brazil</article-title>. <source>PLOS Neglected Trop. Dis.</source> <volume>14</volume> (<issue>10</issue>), <fpage>e0008808</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pntd.0008808</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>de Oliveira</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Rodrigues</surname>
<given-names>P. T.</given-names>
</name>
<name>
<surname>Duarte</surname>
<given-names>A. M. R. C.</given-names>
</name>
<name>
<surname>Rona</surname>
<given-names>L. D. P.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>M. U.</given-names>
</name>
</person-group> (<year>2021a</year>). <article-title>Ongoing host-shift speciation in <italic>Plasmodium simium</italic>
</article-title>. <source>Trends Parasitol.</source> <volume>37</volume> (<issue>11</issue>), <fpage>940</fpage>&#x2013;<lpage>942</lpage>. <pub-id pub-id-type="doi">10.1016/j.pt.2021.08.005</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>de Oliveira</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Rodrigues</surname>
<given-names>P. T.</given-names>
</name>
<name>
<surname>Early</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Duarte</surname>
<given-names>A. M. R. C.</given-names>
</name>
<name>
<surname>Buery</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Bueno</surname>
<given-names>M. G.</given-names>
</name>
<etal/>
</person-group> (<year>2021b</year>). <article-title>
<italic>Plasmodium simium</italic>: population genomics reveals the origin of a reverse zoonosis</article-title>. <source>J. Infect. Dis.</source> <volume>224</volume> (<issue>11</issue>), <fpage>1950</fpage>&#x2013;<lpage>1961</lpage>. <pub-id pub-id-type="doi">10.1093/infdis/jiab214</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feuerriegel</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Frauen</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Melnychuk</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Schweisthal</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hess</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Curth</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Causal machine learning for predicting treatment outcomes</article-title>. <source>Nat. Med.</source> <volume>30</volume>, <fpage>958</fpage>&#x2013;<lpage>968</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-024-02902-1</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Govaert</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Nadif</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2013</year>). <source>Co-clustering: models, algorithms and applications</source>. <publisher-name>John Wiley and Sons</publisher-name>.</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Deep multimodal representation learning: a survey</article-title>. <source>IEEE Access</source> <volume>7</volume>, <fpage>63373</fpage>&#x2013;<lpage>63394</lpage>. <pub-id pub-id-type="doi">10.1109/access.2019.2916887</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Haycock</surname>
<given-names>P. C.</given-names>
</name>
<name>
<surname>Burgess</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wade</surname>
<given-names>K. H.</given-names>
</name>
<name>
<surname>Bowden</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Relton</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Davey Smith</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Best (but oft-forgotten) practices: the design, analysis, and interpretation of Mendelian randomization studies</article-title>. <source>Am. J. Clin. Nutr.</source> <volume>103</volume> (<issue>4</issue>), <fpage>965</fpage>&#x2013;<lpage>978</lpage>. <pub-id pub-id-type="doi">10.3945/ajcn.115.118216</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jaber</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ribeiro</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bareinboim</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Causal identification under Markov equivalence: calculus, algorithm, and completeness</article-title>. <source>Adv. Neural Inf. Process. Syst.</source> <volume>35</volume>, <fpage>3679</fpage>&#x2013;<lpage>3690</lpage>.</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jaeger</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Banks</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Cluster analysis: a modern statistical review</article-title>. <source>Wiley Interdiscip. Rev. Comput. Stat.</source> <volume>15</volume> (<issue>3</issue>), <fpage>e1597</fpage>. <pub-id pub-id-type="doi">10.1002/wics.1597</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johansen</surname>
<given-names>I. C.</given-names>
</name>
<name>
<surname>Rodrigues</surname>
<given-names>P. T.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>M. U.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Human mobility and urban malaria risk in the main transmission hotspot of Amazonian Brazil</article-title>. <source>PLOS ONE</source> <volume>15</volume> (<issue>11</issue>), <fpage>e0242357</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0242357</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johansen</surname>
<given-names>I. C.</given-names>
</name>
<name>
<surname>Rodrigues</surname>
<given-names>P. T.</given-names>
</name>
<name>
<surname>Tonini</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Vinetz</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Castro</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>M. U.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Cohort profile: the M&#xe2;ncio Lima cohort study of urban malaria in Amazonian Brazil</article-title>. <source>BMJ Open</source> <volume>11</volume> (<issue>11</issue>), <fpage>e048073</fpage>. <pub-id pub-id-type="doi">10.1136/bmjopen-2020-048073</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jung</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>M&#xf8;ller J&#xf8;rgensen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>B&#xe6;k</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Artho</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Griss</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Surface proteome of plasma extracellular vesicles as mechanistic and clinical biomarkers for malaria</article-title>. <source>Infection</source> <volume>51</volume> (<issue>5</issue>), <fpage>1491</fpage>&#x2013;<lpage>1501</lpage>. <pub-id pub-id-type="doi">10.1007/s15010-023-02022-x</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kattenberg</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Monsieurs</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>De Meyer</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>De Meulenaere</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Sauve</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>de Oliveira</surname>
<given-names>T. C.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Population genomic evidence of structured and connected <italic>Plasmodium vivax</italic> populations under host selection in Latin America</article-title>. <source>Ecol. Evol.</source> <volume>14</volume>, <fpage>e11103</fpage>. <pub-id pub-id-type="doi">10.1002/ece3.11103</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khoury</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Iademarco</surname>
<given-names>M. F.</given-names>
</name>
<name>
<surname>Riley</surname>
<given-names>W. T.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Precision public health for the era of precision medicine</article-title>. <source>Am. J. Prev. Med.</source> <volume>50</volume> (<issue>3</issue>), <fpage>398</fpage>&#x2013;<lpage>401</lpage>. <pub-id pub-id-type="doi">10.1016/j.amepre.2015.08.031</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kush</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Warzel</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Kush</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Sherman</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Navarro</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Fitzmartin</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>FAIR data sharing: the roles of common data elements and harmonization</article-title>. <source>J. Biomed. Inf.</source> <volume>107</volume>, <fpage>103421</fpage>. <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103421</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>MacEachern</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Forkert</surname>
<given-names>N. D.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Machine learning for precision medicine</article-title>. <source>Genome</source> <volume>64</volume> (<issue>4</issue>), <fpage>416</fpage>&#x2013;<lpage>425</lpage>. <pub-id pub-id-type="doi">10.1139/gen-2020-0131</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>McMahan</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Moore</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ramage</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hampson</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Arcas</surname>
<given-names>B. A. y.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>Communication-efficient learning of deep networks from decentralized data</article-title>,&#x201d; in <source>Proceedings of the 20th International Conference on Artificial Intelligence and Statistics</source> (<publisher-name>Proceedings of Machine Learning Research</publisher-name>), <fpage>1273</fpage>&#x2013;<lpage>1282</lpage>. Available online at: <ext-link ext-link-type="uri" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="https://proceedings.mlr.press/v54/mcmahan17a.html">https://proceedings.mlr.press/v54/mcmahan17a.html</ext-link>.</citation>
</ref>
<ref id="B31">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Pearl</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2009</year>). <source>Causality: models, reasoning, and inference</source>. <edition>2nd ed.</edition> <publisher-name>Cambridge University Press</publisher-name>.</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pedrycz</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Federated FCM: clustering under privacy requirements</article-title>. <source>IEEE Trans. Fuzzy Syst.</source> <volume>30</volume> (<issue>8</issue>), <fpage>3384</fpage>&#x2013;<lpage>3388</lpage>. <pub-id pub-id-type="doi">10.1109/tfuzz.2021.3105193</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perkovi&#x107;</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Textor</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kalisch</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Maathuis</surname>
<given-names>M. H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Complete graphical characterization and construction of adjustment sets in Markov equivalence classes of ancestral graphs</article-title>. <source>J. Mach. Learn. Res.</source> <volume>18</volume>, <fpage>1</fpage>&#x2013;<lpage>62</lpage>.</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pincelli</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cardoso</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Malta</surname>
<given-names>M. B.</given-names>
</name>
<name>
<surname>Johansen</surname>
<given-names>I. C.</given-names>
</name>
<name>
<surname>Corder</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Nicolete</surname>
<given-names>V. C.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Low-level <italic>Plasmodium vivax</italic> exposure, maternal antibodies, and anemia in early childhood: population-based birth cohort study in Amazonian Brazil</article-title>. <source>PLOS Neglected Trop. Dis.</source> <volume>15</volume> (<issue>7</issue>), <fpage>e0009568</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pntd.0009568</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Poespoprodjo</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Douglas</surname>
<given-names>N. M.</given-names>
</name>
<name>
<surname>Ansong</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Kho</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Anstey</surname>
<given-names>N. M.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Malaria</article-title>. <source>Lancet</source> <volume>402</volume> (<issue>10419</issue>), <fpage>2328</fpage>&#x2013;<lpage>2345</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(23)01249-7</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ren</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chakraborty</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Doijad</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Falgenhauer</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Falgenhauer</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Goesmann</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Prediction of antimicrobial resistance based on whole-genome sequencing and machine learning</article-title>. <source>Bioinformatics</source> <volume>38</volume> (<issue>2</issue>), <fpage>325</fpage>&#x2013;<lpage>334</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btab681</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ren</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Nanayakkara Sapugahawatte</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Sp&#xe4;nig</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jamrozy</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Predicting hosts and cross-species transmission of <italic>Streptococcus agalactiae</italic> by interpretable machine learning</article-title>. <source>Comput. Biol. Med.</source> <volume>171</volume>, <fpage>108185</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2024.108185</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ribeiro</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Crnkovic</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pereira</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Fisberg</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Sarti</surname>
<given-names>F. M.</given-names>
</name>
<name>
<surname>Rogero</surname>
<given-names>M. M.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>AnchorFCI: harnessing genetic anchors for enhanced causal discovery of cardiometabolic disease pathways</article-title>. <source>Front. Genet.</source> <volume>15</volume>, <fpage>1436947</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2024.1436947</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ribeiro</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Soler</surname>
<given-names>J. M. P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Learning genetic and environmental graphical models from family data</article-title>. <source>Statistics Med.</source> <volume>39</volume> (<issue>15</issue>), <fpage>2403</fpage>&#x2013;<lpage>2422</lpage>. <pub-id pub-id-type="doi">10.1002/sim.8545</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ribeiro</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Soler</surname>
<given-names>J. M. P.</given-names>
</name>
<name>
<surname>Neto</surname>
<given-names>E. C.</given-names>
</name>
<name>
<surname>Fujita</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). &#x201c;<article-title>Causal inference and structure learning of genotype&#x2013;phenotype networks using genetic variation</article-title>,&#x201d; in <source>Big data analytics in genomics</source> (<publisher-name>Springer</publisher-name>), <fpage>89</fpage>&#x2013;<lpage>143</lpage>.</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rodrigues</surname>
<given-names>P. T.</given-names>
</name>
<name>
<surname>Johansen</surname>
<given-names>I. C.</given-names>
</name>
<name>
<surname>Ladeia</surname>
<given-names>W. A.</given-names>
</name>
<name>
<surname>Esquivel</surname>
<given-names>F. D.</given-names>
</name>
<name>
<surname>Corder</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Tonini</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Lower microscopy sensitivity with decreasing malaria prevalence in the urban Amazon region, Brazil, 2018&#x2013;2021</article-title>. <source>Emerg. Infect. Dis.</source> <volume>30</volume> (<issue>9</issue>), <fpage>1884</fpage>&#x2013;<lpage>1894</lpage>. <pub-id pub-id-type="doi">10.3201/eid3009.240378</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rubin</surname>
<given-names>D. B.</given-names>
</name>
</person-group> (<year>1974</year>). <article-title>Estimating causal effects of treatments in randomized and nonrandomized studies</article-title>. <source>J. Educ. Psychol.</source> <volume>66</volume> (<issue>5</issue>), <fpage>688</fpage>&#x2013;<lpage>701</lpage>. <pub-id pub-id-type="doi">10.1037/h0037350</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tajabadi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Grabenhenrich</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ribeiro</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Leyer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Heider</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Sharing data with shared benefits: Artificial intelligence perspective</article-title>. <source>J. Med. Internet Res.</source> <volume>25</volume>, <fpage>e47540</fpage>. <pub-id pub-id-type="doi">10.2196/47540</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tajabadi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Martin</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Heider</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Privacy-preserving decentralized learning methods for biomedical applications</article-title>. <source>Comput. Struct. Biotechnol. J.</source> <volume>23</volume>, <fpage>3281</fpage>&#x2013;<lpage>3287</lpage>. <pub-id pub-id-type="doi">10.1016/j.csbj.2024.08.024</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Theodosiou</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Read</surname>
<given-names>R. C.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Artificial intelligence, machine learning and deep learning: potential resources for the infection clinician</article-title>. <source>J. Infect.</source> <volume>87</volume> (<issue>4</issue>), <fpage>287</fpage>&#x2013;<lpage>294</lpage>. <pub-id pub-id-type="doi">10.1016/j.jinf.2023.07.006</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>van der Laan</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Rubin</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Targeted maximum likelihood learning</article-title>. <source>Int. J. Biostat.</source> <volume>2</volume> (<issue>1</issue>). <comment>Article 11</comment>. <pub-id pub-id-type="doi">10.2202/1557-4679.1043</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Allen</surname>
<given-names>G. I.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Integrative generalized convex clustering optimization and feature selection for mixed multi-view data</article-title>. <source>J. Mach. Learn. Res.</source> <volume>22</volume> (<issue>55</issue>), <fpage>55</fpage>&#x2013;<lpage>73</lpage>.</citation>
</ref>
<ref id="B48">
<citation citation-type="book">
<collab>World Health Organization</collab> (<year>2024</year>). <source>World malaria report 2024. World Health Organization. Available online at: https://www.who.int/teams/global-malaria-programme/reports/world-malaria-report-2024</source>.</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Kuang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>You</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Federated unsupervised representation learning</article-title>. <source>Front. Inf. Technol. and Electron. Eng.</source> <volume>24</volume> (<issue>8</issue>), <fpage>1181</fpage>&#x2013;<lpage>1193</lpage>. <pub-id pub-id-type="doi">10.1631/FITEE.2200268</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>On the completeness of orientation rules for causal discovery in the presence of latent confounders and selection bias</article-title>. <source>Artif. Intell.</source> <volume>172</volume> (<issue>16&#x2013;17</issue>), <fpage>1873</fpage>&#x2013;<lpage>1896</lpage>. <pub-id pub-id-type="doi">10.1016/j.artint.2008.08.001</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>