<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="brief-report" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Public Health</journal-id>
<journal-title>Frontiers in Public Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Public Health</abbrev-journal-title>
<issn pub-type="epub">2296-2565</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpubh.2025.1663373</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Public Health</subject>
<subj-group>
<subject>Brief Research Report</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>RISE: a novel unified framework for feature relevance in malnutrition analytics integrating statistical and expert insights</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Shruthi</surname>
<given-names>S.</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3062980/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Govindarajan</surname>
<given-names>Priya</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3128178/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Shalini</surname>
<given-names>S. R.</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Antony</surname>
<given-names>Pavan John</given-names>
</name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Uma</surname>
<given-names>A. N.</given-names>
</name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Rangarajan</surname>
<given-names>Lalith</given-names>
</name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Computer Science, School of Computing, Amrita Vishwa Vidyapeetham</institution>, <addr-line>Mysuru</addr-line>, <country>India</country></aff>
<aff id="aff2"><sup>2</sup><institution>Pediatric Department, Mysore Medical College and Research Institute</institution>, <addr-line>Mysuru</addr-line>, <country>India</country></aff>
<aff id="aff3"><sup>3</sup><institution>School of Education, Adelphi University</institution>, <addr-line>Garden City, NY</addr-line>, <country>United States</country></aff>
<aff id="aff4"><sup>4</sup><institution>Genetic Unit, Anatomy Department, Mahatma Gandhi Medical College and RI, Sri Balaji Vidyapeeth (Deemed to be University)</institution>, <addr-line>Puducherry</addr-line>, <country>India</country></aff>
<aff id="aff5"><sup>5</sup><institution>Department of Studies in Computer Science, University of Mysore</institution>, <addr-line>Mysuru</addr-line>, <country>India</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3094508/overview">Marta Esgalhado</ext-link>, Lus&#x00F3;fona University Research Centre for Biosciences &#x0026; Health Technologies, Portugal</p>
</fn>
<fn fn-type="edited-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1736572/overview">Leandro Oliveira</ext-link>, Universidade Lus&#x00F3;fona Research Center for Biosciences &#x0026; Health Technologies, Portugal</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2344095/overview">Luis Javier S&#x00E1;nchez Mart&#x00ED;nez</ext-link>, Complutense University of Madrid, Spain</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Priya Govindarajan, <email>priyagovindarajan@my.amrita.edu</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>16</day>
<month>10</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1663373</elocation-id>
<history>
<date date-type="received">
<day>10</day>
<month>07</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>22</day>
<month>09</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Shruthi, Govindarajan, Shalini, Antony, Uma and Rangarajan.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Shruthi, Govindarajan, Shalini, Antony, Uma and Rangarajan</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Addressing child malnutrition remains a critical global health priority, directly contributing to Sustainable Development Goals (SDG 2 &#x2013; Zero Hunger and SDG 3 &#x2013; Good Health and Well-being). This study aims to identify and prioritize the most influential determinants of acute forms of malnutrition among children aged 0&#x2013;23&#x202F;months by developing a novel feature scoring framework, RISE (Relevance-based Integration of Statistics and Expertise). The objective is to bridge the gap between data-driven modeling and context-specific insights by integrating model-based scores (from XGBoost), statistical filter methods for frequency boosting, and domain-informed adjustments. Using real-world data from the Nutrition Rehabilitation Centre (NRC) at K.R. District Hospital, Mysuru, the RISE framework enhances the interpretability and contextual relevance of predictors often underweighted in traditional models. Domain-relevant features such as Mother Height, Breastfeeding Status, Caste, Maternal Working Status, and Ration card emerged as critical factors when adjusted through the RISE Framework. The top-ranked features, including Child Weight, maternal anthropometry, and Child order, remained consistently influential determinants, reflecting maternal dependency and the double burden of malnutrition. By adjusting feature scores to recognize both empirical strength and domain importance, RISE uncovers hidden yet meaningful contributors that often go underrepresented in purely model-driven analyses. By aligning analytical rigor with public health relevance, this study contributes a scalable, context-sensitive approach to feature prioritization in malnutrition research, supporting more informed, targeted interventions and policy actions toward achieving global nutrition goals.</p>
</abstract>
<kwd-group>
<kwd>child malnutrition</kwd>
<kwd>maternal malnutrition</kwd>
<kwd>feature scoring</kwd>
<kwd>model-based scoring</kwd>
<kwd>domain-based scoring</kwd>
<kwd>filter-based feature scoring</kwd>
<kwd>frequency boosting</kwd>
<kwd>XGBoost</kwd>
</kwd-group>
<counts>
<fig-count count="4"/>
<table-count count="4"/>
<equation-count count="5"/>
<ref-count count="38"/>
<page-count count="12"/>
<word-count count="8527"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Public Health and Nutrition</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Malnutrition remains one of the most persistent global health challenges, with every country striving to control, manage, and ultimately eradicate it. Malnutrition of any form, such as wasting, stunting, or underweight (<xref ref-type="bibr" rid="ref1">1</xref>), can occur at various stages of life; its occurrence during childhood is considered the most alarming. Globally, stunting affected an estimated 23.2 percent or 150.2 million children, and wasting threatened the lives of an estimated 6.6 percent or 42.8 million children under 5 in 2024 (<xref ref-type="bibr" rid="ref2">2</xref>). The outcome of the &#x201C;Fifth National Family Health Survey (NFHS-5)&#x201D; discloses a prevalence of malnutrition in India, children under 5&#x202F;years who are &#x201C;stunted (height-for-age) 35.5, &#x2018;wasted (weight-for-height)&#x2019; 19.3, &#x2018;severely wasted (weight-for-height)&#x2019; 7.7, &#x2018;underweight (weight-for-age)&#x2019; by the &#x2018;World Health Organization&#x2019; (WHO) standards (<xref ref-type="bibr" rid="ref3">3</xref>)&#x201D;. Both national governments and international organizations have recognized its critical impact and continue introducing policies, programs, and guidelines to address this multifaceted issue. Addressing malnutrition during the formative years is a healthcare imperative and a socioeconomic priority. Malnutrition is influenced by region-specific, environmental, cultural, and socioeconomic factors (<xref ref-type="bibr" rid="ref2 ref3 ref4 ref5">2&#x2013;5</xref>). What contributes to malnutrition in one setting may not hold the same relevance in another, making context-sensitive analysis crucial (<xref ref-type="bibr" rid="ref5">5</xref>). Policymakers prioritize the identification of malnutrition determinants before formulating or revising any policies or guidelines (<xref ref-type="bibr" rid="ref4">4</xref>). 
Understanding these underlying factors is essential for effective intervention design, resource allocation, and impact measurement. As a result, the study of determinants of malnutrition has emerged as a critical area of research.</p>
<p>In recent years, machine learning (ML) has emerged as a powerful tool for identifying malnutrition determinants. Conventional feature selection methods, such as statistically based filter methods, have been widely used in ML to identify relevant features by evaluating statistical relationships between features and the outcome. These techniques are computationally efficient and easy to interpret, making them valuable tools in the early stages of exploratory data analysis (<xref ref-type="bibr" rid="ref6 ref7 ref8 ref9">6&#x2013;9</xref>). However, they often evaluate features independently, ignoring potential interactions among variables. These methods are sensitive to data distribution, scale, and noise, and may overlook contextually important features that do not exhibit strong statistical signals. This limitation becomes critical in complex public health problems like malnutrition, where domain knowledge and latent factors play a significant role. Hence, relying solely on conventional techniques may lead to the exclusion of key features that are crucial from a policy or intervention perspective (<xref ref-type="bibr" rid="ref10 ref11 ref12 ref13 ref14">10&#x2013;14</xref>). The research objective is to develop and implement the RISE (Relevance-based Integration of Statistics and Expertise) framework to enhance the identification of key determinants of acute forms of child malnutrition. By integrating model-based feature importance, domain knowledge, and frequency boost based on statistical relevance, the study aims to capture both dominant factors and those that traditional statistical and machine learning models overlook. RISE balances predictive power with contextual significance. Computationally, it introduces frequency boosting using a filter-based ensemble model, normalization across scales, and implementation of nested grid search for hyperparameter tuning. 
Together, these features position RISE as both a technically rigorous and domain-sensitive framework, filling a critical gap in malnutrition-related ML research.</p>
<sec id="sec2">
<label>1.1</label>
<title>Literature review</title>
<p>The application of machine learning (ML) to malnutrition prediction has evolved significantly over the past few years. Early work by Anku et al. (<xref ref-type="bibr" rid="ref7">7</xref>) demonstrated the superiority of XGBoost (98% accuracy, 100% AUC) in predicting wasting, stunting, and underweight in Ghana. Talukder et al. (<xref ref-type="bibr" rid="ref8">8</xref>) demonstrated the potential of ML algorithms such as random forest (RF), logistic regression, and k-nearest neighbors (k-NN) in identifying malnutrition among children, with RF achieving the highest sensitivity (94.66%) and specificity (69.76%). In 2021, Fenta et al. (<xref ref-type="bibr" rid="ref9">9</xref>) conducted a comparative evaluation of six ML models&#x2014;including logistic regression, LASSO, ridge regression, elastic net, neural networks, and RF across Ethiopian zones and established RF as the top-performing algorithm based on sensitivity, specificity, accuracy, and AUC. That same year, Bitew et al. (<xref ref-type="bibr" rid="ref10">10</xref>) employed five ML methods, including XGBoost, RF, neural networks, and k-NN to predict socio-demographic risk factors of undernutrition, with XGBoost showing the highest accuracy (88.0%). Khan et al. (<xref ref-type="bibr" rid="ref11">11</xref>) further validated the utility of ensemble methods by identifying gradient boosting as the most accurate model for predicting stunting among children under five years old. Additionally, Vasu et al. (<xref ref-type="bibr" rid="ref12">12</xref>) employed the Boruta algorithm in conjunction with RF and PCA for dimensionality reduction to identify the most impactful features in malnutrition prediction. In 2022, Mohammad et al. (<xref ref-type="bibr" rid="ref13">13</xref>) proposed an optimized hybrid approach combining Harris Hawk Optimization (HHO) with ADASYN for defect prediction, achieving classification accuracies exceeding 99%, with clear implications for imbalanced malnutrition datasets. 
In 2023, Ndagijimana et al. (<xref ref-type="bibr" rid="ref14">14</xref>) used ensemble methods including gradient boosting and RF in Rwanda, where gradient boosting achieved the best performance (AUC 89%). The year 2024 has seen even broader adoption: Turjo et al. (<xref ref-type="bibr" rid="ref15">15</xref>) used six classifiers, including RF and gradient boosting, to assess women&#x2019;s malnutrition in Bangladesh, where RF showed the highest accuracy and AUC (0.604); Mkungudza et al. (<xref ref-type="bibr" rid="ref16">16</xref>) applied seven variable selection techniques to logistic regression models to predict undernutrition with modest AUC performance (64%); and, in another study, Boruta feature selection and variable importance scores were used to identify determinants of malnutrition (<xref ref-type="bibr" rid="ref17">17</xref>). Yal&#x00E7;&#x0131;n et al. (<xref ref-type="bibr" rid="ref18">18</xref>) applied elastic net and RF models in neonatal intensive care settings, showing the models&#x2019; capacity to accelerate early malnutrition risk identification. A meta-analysis indicated that ML models had moderate to good performance metrics in predicting malnutrition using DHS data among children under five years (<xref ref-type="bibr" rid="ref19">19</xref>). Collectively, these studies reflect a growing confidence in machine learning models such as SVM, k-NN, and ensemble methods, particularly RF, Gradient Boost, and XGBoost, for accurate and scalable malnutrition prediction (<xref ref-type="bibr" rid="ref20 ref21 ref22 ref23">20&#x2013;23</xref>), though they also reveal ongoing challenges in feature selection, interpretability, and standardization of methodologies.</p>
</sec>
<sec id="sec3">
<label>1.2</label>
<title>Research gap</title>
<p>Although machine learning techniques have significantly advanced the identification of malnutrition determinants, they are not without limitations, particularly in how they handle feature importance and inherent model bias. One critical challenge is that statistical variance, feature distribution, and model architecture heavily influence most model-driven feature importance scores (<xref ref-type="bibr" rid="ref7">7</xref>, <xref ref-type="bibr" rid="ref8">8</xref>). As a result, features that may hold substantial contextual or domain relevance can be assigned low importance because they exhibit weak correlations or appear less frequently in the training data. Furthermore, tree-based models like Random Forests or boosting algorithms may exhibit bias towards features with more unique values or features that dominate the data (<xref ref-type="bibr" rid="ref9 ref10 ref11 ref12">9&#x2013;12</xref>). This can lead to the underrepresentation of subtle but crucial socio-cultural or environmental factors. When models are trained on imbalanced or non-representative datasets, they may generalize poorly across regions or demographic groups, further skewing the feature rankings. While multiple studies apply ML algorithms, there is no uniform approach to feature selection, preprocessing, or handling of imbalanced data. Techniques like Boruta, PCA, and ADASYN are used in isolation (<xref ref-type="bibr" rid="ref12 ref13 ref14 ref15 ref16 ref17 ref18">12&#x2013;18</xref>), without comparative evaluations or integration into a common pipeline. Most models rely on statistical or wrapper-based feature selection methods (e.g., LASSO, Boruta), but very few studies integrate public health expertise or contextual domain relevance into feature importance ranking (<xref ref-type="bibr" rid="ref19 ref20 ref21">19&#x2013;21</xref>). This leads to the potential exclusion of socioculturally significant predictors that are weakly correlated in raw data but crucial in practice. 
These challenges make it difficult for policymakers to rely solely on raw model outputs, highlighting the need for more balanced frameworks that integrate statistical learning with human expertise to capture both machine-relevant and domain-important features. To address the limitations of traditional machine learning models in identifying determinants of malnutrition (<xref ref-type="bibr" rid="ref22">22</xref>, <xref ref-type="bibr" rid="ref23">23</xref>), this study proposes the RISE (Relevance-based Integration of Statistics and Expertise) framework. RISE integrates statistical scores, model-based importance, and domain knowledge to uncover both dominant and overlooked features influencing acute forms of child malnutrition.</p>
</sec>
</sec>
<sec sec-type="methods" id="sec4">
<label>2</label>
<title>Methods</title>
<sec id="sec5">
<label>2.1</label>
<title>Study design, setting, and population</title>
<p>A cross-sectional study was conducted at Mysore Medical College and Research Institute, in collaboration with the Nutrition Rehabilitation Centre (NRC), from March 2024 to January 2025. The sample included 208 children aged 1&#x2013;23&#x202F;months admitted to the NRC who were identified with Moderate Acute Malnutrition (MAM) or Severe Acute Malnutrition (SAM). Data on maternal and child anthropometry and socio&#x2013;demographic information were extracted from hospital records.</p>
</sec>
<sec id="sec6">
<label>2.2</label>
<title>Characteristics of the study population</title>
<p>The study population included child, maternal, and socio&#x2013;demographic information. Among the children, 56.8% were male and 43.2% were female. Children were categorized into four age groups: Group 1 (0&#x2013;5&#x202F;months) comprised 16.0% of children, Group 2 (6&#x2013;11&#x202F;months) 40.8%, Group 3 (12&#x2013;17&#x202F;months) 27.7%, and Group 4 (18&#x2013;23&#x202F;months) 15.5%. Regarding birth weight, 60.7% of children had a normal birth weight. Anthropometric measurements showed that the mean Mid-Upper Arm Circumference (MUAC) was 11.57&#x202F;cm (&#x00B1; 2.10&#x202F;cm), the average weight was 6.32&#x202F;kg (&#x00B1; 1.25&#x202F;kg), and the mean height was 69.51&#x202F;cm (&#x00B1; 6.71&#x202F;cm). Among the 206 children included in the study, 51.5% were identified with MAM and 48.5% with SAM, reflecting considerable variability in physical growth indicators across the sample. During admission to the NRC, child feeding practices were recorded. The data revealed overlapping patterns; 88.35% of children received breastfeeding, and 73.79% received bottle feeding. Specifically, 66.02% of children were fed both, 22.33% were exclusively breastfed, 7.77% were exclusively bottle-fed, and 3.88% received neither. These overlaps reflect concurrent feeding practices reported by caregivers and were retained to preserve the full behavioral context in the analysis.</p>
<p>Regarding maternal characteristics, the majority of mothers in the study (56.31%) were aged 20&#x2013;25 years. In addition, 52.91% of the mothers were classified as having an inadequate BMI, highlighting a significant burden of undernutrition among caregivers. In terms of educational attainment, 65.05% had secondary education, though 4.85% remained illiterate. Regarding employment status, a substantial 91.26% were housewives, reflecting low workforce participation. In terms of reproductive profile, 60.19% of mothers had two or more children, and 56.31% of index children were of second or higher birth order, suggesting high family responsibility. Moreover, 72.82% of mothers had not adopted any family planning methods, indicating a gap in reproductive health awareness and access.</p>
<p>The socio-demographic analysis reveals that 87.86% families reported a non-vegetarian diet. 50.97% of the mothers belonged to Other Backward Classes (OBC), followed by 36.41% from Scheduled Castes and Scheduled Tribes (SC/ST), and 12.62% from the General category. 66.5% of the children were from rural areas. The Ration Card feature in the dataset comprises two categories: Above Poverty Line (APL) and Below Poverty Line (BPL), with BPL accounting for approximately 99.51% of the records. Given this near-constant distribution, a sensitivity analysis was conducted by executing the model both with and without this feature. The results showed no change in model performance metrics or feature rankings. For reference, the model maintained an overall accuracy of 82.54%, as shown in <xref ref-type="fig" rid="fig1">Figure 1</xref>, indicating that the inclusion of this low-variance variable did not influence predictive accuracy. This reinforces the robustness of the model and confirms that its outputs are not dependent on statistically redundant features.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Comparative unified performance metrics with 95% confidence intervals across filter-based feature selection methods combined with XGBoost. Comparison of performance metrics with 95% confidence intervals across different filter-based feature selection methods combined with XGBoost. The plot shows Accuracy, Precision, Recall, and F1-score for five methods: ReliefF&#x202F;+&#x202F;XGB, ANOVA&#x202F;+&#x202F;XGB, Chi<sup>2</sup>&#x202F;+&#x202F;XGB, MI&#x202F;+&#x202F;XGB, and XGBoost. Bars represent the 95% confidence intervals for each metric.</p>
</caption>
<graphic xlink:href="fpubh-13-1663373-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Line graph showing performance metrics with 95% confidence intervals across five methods: ReliefF+XGB, ANOVA+XGB, Chi&#x00B2;+XGB, MI+XGB, and XGBoost. Metrics include accuracy, precision, recall, and F1-score, represented by different colored lines. Scores range from 0.5 to 0.9. All methods show similar trends, with variance in confidence intervals.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec7">
<label>2.3</label>
<title>Variables, definitions, and encoding</title>
<p>WHO Anthro software was used to compute Height for Age (HAZ), Weight for Age (WAZ), and Weight for Height (WHZ) scores based on each child&#x2019;s age, height, and weight from NRC records. Nutritional status was classified as SAM (WHZ&#x202F;&#x003C;&#x202F;&#x2212;3 SD) and MAM (WHZ between &#x2212;3 and &#x2212;2 SD) (<xref ref-type="bibr" rid="ref24">24</xref>).</p>
<p>Categorical variables in the dataset were numerically encoded to facilitate model training. Binary categorical features such as Breastfeeding Status, Bottle Feeding Status, Family Planning Status, Mother Working Status, Food Type, Child Gender, and Ration card were encoded using label encoding, with values assigned as 1 or 2 to represent distinct categories (e.g., yes/no or male/female). Ordinal variables such as Maternal BMI, Mother MUAC, Child Birth Weight, Maternal Education, and Child Age were label-encoded to preserve their rank structure. Nominal categorical variables like Caste and Residence were similarly encoded using integer labels. All remaining features, including anthropometric and demographic measures such as Child Weight, Child Height, Mother Weight, Mother Height, Child MUAC, and Total Child, were treated as either discrete or continuous numeric variables and used without transformation. This encoding strategy ensured compatibility with the modeling pipeline while preserving the interpretability of categorical distinctions.</p>
</sec>
<sec id="sec8">
<label>2.4</label>
<title>RISE framework for feature scoring and selection</title>
<p>The traditional machine learning models rely on feature selection driven primarily by model-based importance scores or a single statistical method such as Mutual Information (MI), Chi-Square (Chi<sup>2</sup>), or ANOVA for feature scoring. While these approaches can be effective in identifying statistically significant variables, they often place little to no emphasis on domain-driven feature scoring, which can capture contextually important variables that statistical methods may overlook (<xref ref-type="bibr" rid="ref25 ref26 ref27 ref28 ref29 ref30">25&#x2013;30</xref>).</p>
<p>The proposed methodology introduces a novel approach to feature selection through the RISE framework, which is designed to uncover important features that are underrepresented or overlooked by traditional ML models. Conventional model-based scoring methods tend to favor features with strong statistical patterns, frequently ignoring variables that are contextually significant in real-world scenarios. RISE addresses this imbalance by combining four modules:</p>
<list list-type="simple">
<list-item>
<p>(1)&#x00A0;&#x00A0;A statistical scoring module&#x2014;captures relevance based on statistical filter methods</p>
</list-item>
<list-item>
<p>(2)&#x00A0;&#x00A0;A frequency boost module&#x2014;provides the boosting scores based on its top priority</p>
</list-item>
<list-item>
<p>(3)&#x00A0;&#x00A0;A domain knowledge scoring module&#x2014;incorporates expert insight and contextual importance</p>
</list-item>
<list-item>
<p>(4)&#x00A0;&#x00A0;A model scoring module&#x2014;reflects importance as assigned by the machine learning model.</p>
</list-item>
</list>
<p>This integrated strategy ensures a more balanced and inclusive selection of features in the domain of acute child malnutrition.</p>
<sec id="sec9">
<label>2.4.1</label>
<title>Statistical scoring module</title>
<p>The statistical scoring module in this study leverages filter-based feature selection techniques to evaluate the importance of features based on their statistical relationship with the target variable. The four key methods used are MI, Chi<sup>2</sup> test, ANOVA F-test, and ReliefF. Each method has its unique way of assessing relevance, which collectively contributes to a more robust feature evaluation.</p>
<sec id="sec10">
<label>2.4.1.1</label>
<title>Mutual information (MI)</title>
<p>Mutual Information measures the dependency between a feature and the target variable. It quantifies how much knowing the value of a feature reduces uncertainty about the target. It captures both linear and non-linear relationships. Features with higher MI scores are considered more informative (<xref ref-type="bibr" rid="ref26">26</xref>, <xref ref-type="bibr" rid="ref28">28</xref>).</p>
<disp-formula id="E1">
<mml:math id="M1">
<mml:mi>MI</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">X</mml:mi>
<mml:mo>;</mml:mo>
<mml:mi mathvariant="normal">Y</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mi>&#x03A3;</mml:mi>
<mml:mspace width="0.33em"/>
<mml:mi mathvariant="normal">P</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">y</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2217;</mml:mo>
<mml:mspace width="0.33em"/>
<mml:mo>log</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">P</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">y</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>/</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">P</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2217;</mml:mo>
<mml:mspace width="0.33em"/>
<mml:mi mathvariant="normal">P</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">y</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
</sec>
<sec id="sec11">
<label>2.4.1.2</label>
<title>Chi-square (Chi<sup>2</sup>) test</title>
<p>The Chi-Square test assesses whether there is a significant association between a categorical feature and the target class. It compares the observed frequencies of feature values with the expected frequencies under the assumption of independence. A higher Chi<sup>2</sup> score indicates a stronger dependency between the feature and the target (<xref ref-type="bibr" rid="ref28">28</xref>, <xref ref-type="bibr" rid="ref29">29</xref>).</p>
<disp-formula id="E2">
<mml:math id="M2">
<mml:msup>
<mml:mi>&#x03C7;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:munder>
<mml:mfrac>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">O</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">E</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:msub>
<mml:mi mathvariant="normal">E</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
</mml:mfrac>
</mml:math>
</disp-formula>
</sec>
<sec id="sec12">
<label>2.4.1.3</label>
<title>ANOVA F-test</title>
<p>ANOVA (Analysis of Variance) is used when the feature is continuous and the target is categorical. It evaluates whether the mean of the feature differs significantly across different classes of the target. A high <italic>F</italic>-value suggests that the feature contributes significantly to class separation (<xref ref-type="bibr" rid="ref27">27</xref>, <xref ref-type="bibr" rid="ref28">28</xref>).</p>
<disp-formula id="E3">
<mml:math id="M3">
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:msub>
<mml:mi>MS</mml:mi>
<mml:mi mathvariant="normal">B</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>MS</mml:mi>
<mml:mi mathvariant="normal">W</mml:mi>
</mml:msub>
</mml:mfrac>
<mml:mspace width="0.33em"/>
<mml:mtext>where</mml:mtext>
<mml:mspace width="0.25em"/>
<mml:msub>
<mml:mi>MS</mml:mi>
<mml:mi mathvariant="normal">B</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:msub>
<mml:mi>SS</mml:mi>
<mml:mi mathvariant="normal">B</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mi mathvariant="normal">k</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfrac>
<mml:mspace width="0.25em"/>
<mml:mtext>and</mml:mtext>
<mml:mspace width="0.25em"/>
<mml:msub>
<mml:mi>MS</mml:mi>
<mml:mi mathvariant="normal">W</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:msub>
<mml:mi>SS</mml:mi>
<mml:mi mathvariant="normal">W</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mi mathvariant="normal">N</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="normal">k</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:math>
</disp-formula>
</sec>
<sec id="sec13">
<label>2.4.1.4</label>
<title>ReliefF algorithm</title>
<p>ReliefF is an instance-based feature selection method that considers feature value differences between neighboring instances. It evaluates how well each feature distinguishes between instances of different classes while considering feature interactions and redundancy. It is particularly useful for noisy and complex datasets (<xref ref-type="bibr" rid="ref30">30</xref>).</p>
<disp-formula id="E4">
<mml:math id="M4">
<mml:mi mathvariant="normal">W</mml:mi>
<mml:mo stretchy="true">[</mml:mo>
<mml:mi mathvariant="normal">A</mml:mi>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo>=</mml:mo>
<mml:mi mathvariant="normal">W</mml:mi>
<mml:mo stretchy="true">[</mml:mo>
<mml:mi mathvariant="normal">A</mml:mi>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi mathvariant="normal">m</mml:mi>
</mml:mfrac>
<mml:mspace width="0.25em"/>
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:munder>
<mml:mo stretchy="true">(</mml:mo>
<mml:mtext>diff</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">A</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mtext>nearHit</mml:mtext>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext>diff</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="normal">A</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mtext>nearMiss</mml:mtext>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<p>These feature scores are derived before any model training. The selected features based on these scores are then used to train the ensemble boosting model separately for each filter method. The model&#x2019;s internal feature importance scores are subsequently extracted to evaluate how the model prioritizes features that were pre-selected using different statistical criteria. This approach ensures that the model&#x2019;s learning is influenced by features deemed relevant purely through statistical assessment, thereby linking filter-based selection with model-driven evaluation.</p>
</sec>
</sec>
<sec id="sec14">
<label>2.4.2</label>
<title>Frequency boosting module</title>
<p>The Frequency Boosting Module enhances the weight of features that consistently appear as important across multiple independent selection methods. This approach recognizes when a feature is repeatedly identified across the statistical filter-based ensemble models. Each time a feature is selected or ranked within the top tier by a model, it earns a frequency point. These counts are then normalized and converted into a frequency boosting score, reflecting the stability and consensus around a feature&#x2019;s importance. By incorporating this module into the RISE framework, features with cross-method agreement are justifiably promoted. This mechanism ensures that consistent signals are amplified, increasing the reliability of the final feature selection.</p>
</sec>
<sec id="sec15">
<label>2.4.3</label>
<title>Domain knowledge scoring module</title>
<p>This module is designed to integrate expert-driven insights and contextual relevance into the feature scoring process, leveraging both subject matter expertise and established literature. First, the features were grouped based on thematic relevance, guided by insights from domain experts and collaborators. These groups represent contextual domains that are well-established in influencing the severity of child malnutrition. Next, each feature was assigned an importance score using XGBoost. The scores were then aggregated within their respective groups to calculate a group-wise cumulative score. Based on these cumulative scores, ranks were assigned to each group. Group 1, Child Anthropometry, includes variables such as gender, age, MUAC, weight, and height of the child (<xref ref-type="bibr" rid="ref29">29</xref>). Group 2 covers Early Feeding Practices, including birth weight, breastfeeding, and bottle feeding (<xref ref-type="bibr" rid="ref31">31</xref>, <xref ref-type="bibr" rid="ref32">32</xref>). Group 3, Maternal Anthropometry, includes the mother&#x2019;s weight, height, age, BMI, and MUAC (<xref ref-type="bibr" rid="ref29">29</xref>). Group 4 focuses on Family Structure, including the total number of children and the child&#x2019;s birth order (<xref ref-type="bibr" rid="ref33">33</xref>). Group 5 includes Socio-Economic Factors such as residence type, ration card status, caste, and food type. Finally, Group 6 represents Maternal Empowerment, including education, working status, and family planning (<xref ref-type="bibr" rid="ref34">34</xref>). A numerical rank ranging from 6 (highest relevance) to 1 (lowest) was applied at the group level, and each feature within a group inherited the corresponding rank as presented in <xref ref-type="table" rid="tab1">Table 1</xref>. Finally, domain ranks of all features were normalized between 0 and 1. These normalized scores serve as the final domain importance values in the RISE framework.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Domain-based feature grouping and prioritization for acute forms of child malnutrition.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Group priority</th>
<th align="left" valign="top">Group name</th>
<th align="left" valign="top">Group feature</th>
<th align="center" valign="top">Group score</th>
<th align="center" valign="top">Domain rank</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">1</td>
<td align="left" valign="top">Child anthropometry</td>
<td align="left" valign="top">Child gender, age, MUAC, weight, and height</td>
<td align="center" valign="top">0.275254</td>
<td align="center" valign="top">6</td>
</tr>
<tr>
<td align="left" valign="top">2</td>
<td align="left" valign="top">Early feeding practices</td>
<td align="left" valign="top">Birth weight, breastfeeding, and bottle-feeding practice</td>
<td align="center" valign="top">0.246018</td>
<td align="center" valign="top">5</td>
</tr>
<tr>
<td align="left" valign="top">3</td>
<td align="left" valign="top">Maternal anthropometry</td>
<td align="left" valign="top">Mother&#x2019;s weight, height, age, BMI, and MUAC</td>
<td align="center" valign="top">0.147003</td>
<td align="center" valign="top">4</td>
</tr>
<tr>
<td align="left" valign="top">4</td>
<td align="left" valign="top">Family structure</td>
<td align="left" valign="top">Total number of children and the child&#x2019;s birth order</td>
<td align="center" valign="top">0.127140</td>
<td align="center" valign="top">3</td>
</tr>
<tr>
<td align="left" valign="top">5</td>
<td align="left" valign="top">Socio-economic</td>
<td align="left" valign="top">Residence type, ration card, caste, and food type</td>
<td align="center" valign="top">0.110287</td>
<td align="center" valign="top">2</td>
</tr>
<tr>
<td align="left" valign="top">6</td>
<td align="left" valign="top">Maternal empowerment</td>
<td align="left" valign="top">Maternal education, working status, and family planning</td>
<td align="center" valign="top">0.094298</td>
<td align="center" valign="top">1</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Domain-wise grouping and ranking of features influencing acute forms of child malnutrition. Each group consists of thematically related variables aggregated to calculate a Group Score, which indicates the combined influence of that domain. Domain Rank shows the relative priority based on these scores, with higher values indicating greater importance.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec16">
<label>2.4.4</label>
<title>Model scoring module</title>
<p>The model scoring module independently generates feature importance scores directly from a boosting model without relying on any prior feature selection or pre-training. In this module, the full set of input features is used to train an ensemble boosting algorithm where the model itself learns which features contribute most to predictive performance.</p>
</sec>
<sec id="sec17">
<label>2.4.5</label>
<title>Final feature scores</title>
<p>The RISE framework computes a final feature score by integrating model-based performance, methodological consistency, and domain relevance. This scoring strategy ensures that selected features are not only powerful predictors but also consistently recognized across methods and grounded in expert knowledge.</p>
<p>The Model Score reflects the feature&#x2019;s contribution to prediction accuracy, derived directly from a boosting model without any prior filtering. The Frequency Boost captures how often a feature is selected as important across the filter-based ensemble models, indicating its robustness and consistency. The Domain Importance represents the contextual and theoretical significance of a feature as determined by thematic grouping guided by subject matter experts.</p>
<p>RISE Final Score Formula:</p>
<disp-formula id="E5">
<mml:math id="M5">
<mml:msub>
<mml:mtext>RISE</mml:mtext>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mi>&#x03B1;</mml:mi>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mtext>Model Score</mml:mtext>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>&#x03B2;</mml:mi>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mtext>Domain Importance</mml:mtext>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>&#x03B3;</mml:mi>
<mml:mo>&#x00B7;</mml:mo>
<mml:msub>
<mml:mtext>Frequency Boost</mml:mtext>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
</mml:math>
</disp-formula>
<p><italic>i</italic>: feature index. <italic>&#x03B1;</italic>, <italic>&#x03B2;</italic>, <italic>&#x03B3;</italic>: weighting hyperparameters that adjust the contribution of each component. In the RISE framework, these hyperparameters were selected using nested cross-validation. The final RISE score is defined as a weighted sum of Model Score, Domain Importance, and Frequency Boost. The optimal configuration was determined to be <italic>&#x03B1;</italic>&#x202F;=&#x202F;<italic>&#x03B2;</italic>&#x202F;=&#x202F;<italic>&#x03B3;</italic>&#x202F;=&#x202F;0.1. The overall architecture of the RISE framework is presented in <xref ref-type="fig" rid="fig2">Figure 2</xref>.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Architecture of RISE framework.</p>
</caption>
<graphic xlink:href="fpubh-13-1663373-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Flowchart depicting a feature scoring process for NRC data, utilizing model-based, filter-based, and domain-based methods. Key techniques include MI, Chi-squared, ANOVA, and ReliefF. An ensemble model is trained, and scores are computed using a formula: RISE equals alpha times Model Score plus beta times Frequency Boost plus gamma times Domain Importance. The process extracts top features of child malnutrition.</alt-text>
</graphic>
</fig>
</sec>
</sec>
</sec>
<sec sec-type="results" id="sec18">
<label>3</label>
<title>Results</title>
<p>The dataset used in this study comprises exclusively malnourished children, with the target variable categorically divided into SAM and MAM. The primary objective of this research is to identify the determinants of acute forms of child malnutrition. The analysis focuses on extracting and ranking features through a combination of model-based importance, domain knowledge insights, and frequency-based boosting grounded in a filter-based method. <italic>A priori</italic> power analysis using G&#x002A;Power (two-tailed, effect size d&#x202F;=&#x202F;0.5, <italic>&#x03B1;</italic>&#x202F;=&#x202F;0.05, power&#x202F;=&#x202F;0.90) indicated that a minimum of 172 participants (86 per group) would be required. This study includes real-time data of 206 children (100 SAM and 106 MAM), ensuring adequate statistical power as well as indicating a balanced distribution between the two groups. The dataset was obtained from the NRC register. All available features were taken for analysis to ensure a comprehensive evaluation and to support the development of a framework for identifying determinants of acute forms of child malnutrition. The study did not apply any confounder analysis, pre-filtering, or exclusion based on correlation thresholds. It retained the full spectrum of variables that may contribute to nutritional outcomes of the child, whether directly or indirectly. This inclusive approach allows the model to assess the relative importance of each feature in context, which ensures completeness and eliminates concerns regarding missing values.</p>
<p>The implementation was done in Python version 3.11.11 (Anaconda distribution). The dataset was first partitioned into training and testing subsets to evaluate generalization performance. Feature selection was guided by XGBoost classifier, statistical importance based on filter-based XGBoost, and domain ranking with XGBoost. To ensure robustness and reduce overfitting, Stratified K-Fold Cross-Validation (with <italic>k</italic>&#x202F;=&#x202F;5) was employed on the training set. This approach preserved the class distribution across folds and allowed for consistent performance estimation. A nested cross-validation framework was employed for hyperparameter tuning. The outer loop used 5-fold cross-validation to evaluate generalization performance, while the inner loop applied 3-fold cross-validation within a grid search. The optimal values obtained were <italic>&#x03B1;</italic>&#x202F;=&#x202F;<italic>&#x03B2;</italic>&#x202F;=&#x202F;<italic>&#x03B3;</italic>&#x202F;=&#x202F;0.1, resulting in a Nested CV mean F1 score of 0.824. For the XGBoost classifier, parameters specified were the number of estimators (n_estimators&#x202F;=&#x202F;100), evaluation metric (eval_metric&#x202F;=&#x202F;logloss), and random seed (random_state&#x202F;=&#x202F;42). All other hyperparameters were retained at their default values (learning_rate&#x202F;=&#x202F;0.1, max_depth&#x202F;=&#x202F;6, subsample&#x202F;=&#x202F;1.0).</p>
<p>XGBoost, a high-performance gradient boosting algorithm, is widely used for its accuracy, speed, and ability to handle complex, structured data (<xref ref-type="bibr" rid="ref35 ref36 ref37 ref38">35&#x2013;38</xref>). This section presents the experimental implementation of the RISE framework using the XGBoost model. However, the proposed approach is flexible and can be generalized to other machine learning ensemble methods for enhanced applicability. The results of model-based and domain-based feature scoring are summarized in <xref ref-type="table" rid="tab2">Table 2</xref>. The model-based scores were derived by training an XGBoost classifier independently on a curated set of input features and extracting importance, which reflects each feature&#x2019;s contribution to child malnutrition. In parallel, domain ranks were obtained based on thematic relevance, guided by insights from domain experts and group scores, and were further normalized to ensure symmetry in the RISE score components, as presented in <xref ref-type="table" rid="tab1">Table 1</xref>.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Feature importance from XGBoost model and normalized domain scores.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Feature</th>
<th align="center" valign="top">Model importance</th>
<th align="center" valign="top">Domain rank (normalized)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Child weight</td>
<td align="center" valign="top">0.1304</td>
<td align="center" valign="top">1.0</td>
</tr>
<tr>
<td align="left" valign="top">Child MUAC</td>
<td align="center" valign="top">0.0989</td>
<td align="center" valign="top">1.0</td>
</tr>
<tr>
<td align="left" valign="top">Breastfeeding status</td>
<td align="center" valign="top">0.0969</td>
<td align="center" valign="top">0.8</td>
</tr>
<tr>
<td align="left" valign="top">Child height</td>
<td align="center" valign="top">0.0820</td>
<td align="center" valign="top">1.0</td>
</tr>
<tr>
<td align="left" valign="top">Child order</td>
<td align="center" valign="top">0.0669</td>
<td align="center" valign="top">0.4</td>
</tr>
<tr>
<td align="left" valign="top">Mother age</td>
<td align="center" valign="top">0.0550</td>
<td align="center" valign="top">0.6</td>
</tr>
<tr>
<td align="left" valign="top">Food type</td>
<td align="center" valign="top">0.0539</td>
<td align="center" valign="top">0.2</td>
</tr>
<tr>
<td align="left" valign="top">Mother weight</td>
<td align="center" valign="top">0.0485</td>
<td align="center" valign="top">0.6</td>
</tr>
<tr>
<td align="left" valign="top">Child gender</td>
<td align="center" valign="top">0.0453</td>
<td align="center" valign="top">1.0</td>
</tr>
<tr>
<td align="left" valign="top">Maternal BMI</td>
<td align="center" valign="top">0.0443</td>
<td align="center" valign="top">0.6</td>
</tr>
<tr>
<td align="left" valign="top">Mother height</td>
<td align="center" valign="top">0.0443</td>
<td align="center" valign="top">0.6</td>
</tr>
<tr>
<td align="left" valign="top">Mother MUAC</td>
<td align="center" valign="top">0.0411</td>
<td align="center" valign="top">0.6</td>
</tr>
<tr>
<td align="left" valign="top">Residence</td>
<td align="center" valign="top">0.0340</td>
<td align="center" valign="top">0.2</td>
</tr>
<tr>
<td align="left" valign="top">Maternal education</td>
<td align="center" valign="top">0.0336</td>
<td align="center" valign="top">0.1</td>
</tr>
<tr>
<td align="left" valign="top">Child birth weight</td>
<td align="center" valign="top">0.0279</td>
<td align="center" valign="top">0.8</td>
</tr>
<tr>
<td align="left" valign="top">Total child</td>
<td align="center" valign="top">0.0252</td>
<td align="center" valign="top">0.4</td>
</tr>
<tr>
<td align="left" valign="top">Child age</td>
<td align="center" valign="top">0.0248</td>
<td align="center" valign="top">1.0</td>
</tr>
<tr>
<td align="left" valign="top">Bottle feeding status</td>
<td align="center" valign="top">0.0220</td>
<td align="center" valign="top">0.8</td>
</tr>
<tr>
<td align="left" valign="top">Caste</td>
<td align="center" valign="top">0.0139</td>
<td align="center" valign="top">0.2</td>
</tr>
<tr>
<td align="left" valign="top">Family planning status</td>
<td align="center" valign="top">0.0112</td>
<td align="center" valign="top">0.1</td>
</tr>
<tr>
<td align="left" valign="top">Maternal working status</td>
<td align="center" valign="top">0.0000</td>
<td align="center" valign="top">0.1</td>
</tr>
<tr>
<td align="left" valign="top">Ration card</td>
<td align="center" valign="top">0.0000</td>
<td align="center" valign="top">0.2</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>The table presents XGBoost model importance and normalized domain scores. The domain scores are adapted from domain-derived weightings as shown in <xref ref-type="table" rid="tab1">Table 1</xref> and further normalized between 0 and 1.</p>
</table-wrap-foot>
</table-wrap>
<p>To identify the most influential factors associated with acute forms of child malnutrition, filter-based feature selection methods were employed. Each method prioritized the top 15 features based on their statistical relevance to the target outcome. These selected features were used independently to train XGBoost models. This approach allowed us to assess how feature selection strategies influence model performance and feature importance scoring. Further, each feature earns its frequency boost score based on the number of times it appears in the top 10 ranked features across four different filter-based feature selection methods. If a feature appears in the top 10 of all four methods, it is assigned a boost value of 4. If it appears in three methods, the boost value is 3; in two methods, it is 2, and in one method, it is 1. If the feature does not appear in the top 10 of any method, the frequency boost is 0. This scoring mechanism reflects the consistency and recurrence of feature importance across multiple selection methods. The results of filter-based XGBoost, along with frequency boost, are presented in <xref ref-type="table" rid="tab3">Table 3</xref>. The performance of the XGBoost model across various feature training configurations, its accuracy, recall, precision, and F1-scores are presented as a unified performance report in <xref ref-type="fig" rid="fig1">Figure 1</xref>.</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Consolidated feature importance scores from XGBoost models using multiple filter methods and associated frequency boosting.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">SL. no</th>
<th align="center" valign="top">Feature</th>
<th align="center" valign="top">MI + XGB</th>
<th align="center" valign="top">CHI2 + XGB</th>
<th align="center" valign="top">ANOVA + XGB</th>
<th align="center" valign="top">ReliefF + XGB</th>
<th align="center" valign="top">Frequency boost</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">1</td>
<td align="left" valign="top">Child weight</td>
<td align="center" valign="top">0.17623</td>
<td align="center" valign="top">0.07254</td>
<td align="center" valign="top">0.07823</td>
<td align="center" valign="top">0.08677</td>
<td align="center" valign="top">4</td>
</tr>
<tr>
<td align="left" valign="top">2</td>
<td align="left" valign="top">Mother weight</td>
<td align="center" valign="top">0.07228</td>
<td align="center" valign="top">0.06940</td>
<td align="center" valign="top">0.06450</td>
<td align="center" valign="top">0.08097</td>
<td align="center" valign="top">4</td>
</tr>
<tr>
<td align="left" valign="top">3</td>
<td align="left" valign="top">Child age</td>
<td align="center" valign="top">0.05977</td>
<td align="center" valign="top">0.05965</td>
<td align="center" valign="top">0.04656</td>
<td align="center" valign="top">0.07366</td>
<td align="center" valign="top">4</td>
</tr>
<tr>
<td align="left" valign="top">4</td>
<td align="left" valign="top">Child order</td>
<td align="center" valign="top">0.11333</td>
<td align="center" valign="top">0.08627</td>
<td align="center" valign="top">0.07579</td>
<td align="center" valign="top">0.09466</td>
<td align="center" valign="top">4</td>
</tr>
<tr>
<td align="left" valign="top">5</td>
<td align="left" valign="top">Mother MUAC</td>
<td align="center" valign="top">0.03908</td>
<td align="center" valign="top">0.08464</td>
<td align="center" valign="top">0.06795</td>
<td align="center" valign="top">0.10448</td>
<td align="center" valign="top">3</td>
</tr>
<tr>
<td align="left" valign="top">6</td>
<td align="left" valign="top">Maternal BMI</td>
<td align="center" valign="top">0.07584</td>
<td align="center" valign="top">0.03560</td>
<td align="center" valign="top">0.04508</td>
<td align="center" valign="top">0.07273</td>
<td align="center" valign="top">3</td>
</tr>
<tr>
<td align="left" valign="top">7</td>
<td align="left" valign="top">Maternal education</td>
<td align="center" valign="top">0.02548</td>
<td align="center" valign="top">0.07033</td>
<td align="center" valign="top">0.10025</td>
<td align="center" valign="top">0.13661</td>
<td align="center" valign="top">3</td>
</tr>
<tr>
<td align="left" valign="top">8</td>
<td align="left" valign="top">Food type</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">0.22474</td>
<td align="center" valign="top">0.30430</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">2</td>
</tr>
<tr>
<td align="left" valign="top">9</td>
<td align="left" valign="top">Child MUAC</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">0.05691</td>
<td align="center" valign="top">0.08130</td>
<td align="center" valign="top">2</td>
</tr>
<tr>
<td align="left" valign="top">10</td>
<td align="left" valign="top">Child gender</td>
<td align="center" valign="top">0.09670</td>
<td align="center" valign="top">0.06540</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">2</td>
</tr>
<tr>
<td align="left" valign="top">11</td>
<td align="left" valign="top">Family planning status</td>
<td align="center" valign="top">0.06051</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">0.05844</td>
<td align="center" valign="top">2</td>
</tr>
<tr>
<td align="left" valign="top">12</td>
<td align="left" valign="top">Child birth weight</td>
<td align="center" valign="top">0.04554</td>
<td align="center" valign="top">0.05052</td>
<td align="center" valign="top">0.04102</td>
<td align="center" valign="top">0.04506</td>
<td align="center" valign="top">2</td>
</tr>
<tr>
<td align="left" valign="top">13</td>
<td align="left" valign="top">Residence</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">0.05299</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">1</td>
</tr>
<tr>
<td align="left" valign="top">14</td>
<td align="left" valign="top">Bottle feeding status</td>
<td align="center" valign="top">0.07320</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">1</td>
</tr>
<tr>
<td align="left" valign="top">15</td>
<td align="left" valign="top">Total child</td>
<td align="center" valign="top">0.01176</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">0.06862</td>
<td align="center" valign="top">1</td>
</tr>
<tr>
<td align="left" valign="top">16</td>
<td align="left" valign="top">Mother age</td>
<td align="center" valign="top">0.01176</td>
<td align="center" valign="top">0.05808</td>
<td align="center" valign="top">0.02073</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">1</td>
</tr>
<tr>
<td align="left" valign="top">17</td>
<td align="left" valign="top">Child height</td>
<td align="center" valign="top">0.13852</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">1</td>
</tr>
<tr>
<td align="left" valign="top">18</td>
<td align="left" valign="top">Mother height</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">0.03518</td>
<td align="center" valign="top">0.04935</td>
<td align="center" valign="top">0</td>
</tr>
<tr>
<td align="left" valign="top">19</td>
<td align="left" valign="top">Breastfeeding status</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">0.04736</td>
<td align="center" valign="top">0</td>
</tr>
<tr>
<td align="left" valign="top">20</td>
<td align="left" valign="top">Caste</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">0.04637</td>
<td align="center" valign="top">0.04038</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">0</td>
</tr>
<tr>
<td align="left" valign="top">21</td>
<td align="left" valign="top">Maternal working status</td>
<td align="center" valign="top">-</td>
<td align="center" valign="top">0.02346</td>
<td align="center" valign="top">0.02313</td>
<td align="center" valign="top">0.000000</td>
<td align="center" valign="top">0</td>
</tr>
<tr>
<td align="left" valign="top">22</td>
<td align="left" valign="top">Ration card</td>
<td align="center" valign="top">0.000000</td>
<td align="center" valign="top">0.000000</td>
<td align="center" valign="top">0.000000</td>
<td align="center" valign="top">0.000000</td>
<td align="center" valign="top">0</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>The table presents consolidated feature importance scores for acute forms of child malnutrition. The importance scores are obtained from XGBoost models trained using various filter methods: MI, CHI2, ANOVA, and ReliefF. Only features that appear in the top 10 of at least one configuration were given a frequency boost score. The Frequency Boost Score indicates the feature&#x2019;s presence across top-10 lists: 4 &#x2013; feature appears in the top 10 of all 4 methods. 3 &#x2013; feature appears in the top 10 of any 3 methods. 2 &#x2013; feature appears in the top 10 of any 2 methods. 1 &#x2013; feature appears in the top 10 of any 1 method. 0 &#x2013; feature does not appear in the top 10 of any method.</p>
</table-wrap-foot>
</table-wrap>
<p>Now, the RISE framework is employed by integrating three key components: domain importance scoring, model-based feature scoring, and frequency-based boosting. Each feature&#x2019;s final score is computed by combining these elements using a weighted formula, enabling a balanced representation of statistical relevance, expert knowledge, and selection consistency, as presented in <xref ref-type="table" rid="tab4">Table 4</xref>. This comprehensive scoring strategy ensures that both high-performing and domain-relevant but underrepresented features are prioritized appropriately in the final analysis, as visualized in <xref ref-type="fig" rid="fig3">Figure 3</xref>.</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Final RISE scores with normalized domain score, model score, and frequency boost, computed with the corresponding tuned hyperparameter values.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Feature</th>
<th align="center" valign="top">Domain score</th>
<th align="center" valign="top">Model score</th>
<th align="center" valign="top">Frequency boost</th>
<th align="center" valign="top">RISE score</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Child weight</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.1304</td>
<td align="center" valign="top">1.00</td>
<td align="center" valign="top">0.2130</td>
</tr>
<tr>
<td align="left" valign="top">Child age</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.0248</td>
<td align="center" valign="top">1.00</td>
<td align="center" valign="top">0.2025</td>
</tr>
<tr>
<td align="left" valign="top">Mother weight</td>
<td align="center" valign="top">0.6</td>
<td align="center" valign="top">0.0485</td>
<td align="center" valign="top">1.00</td>
<td align="center" valign="top">0.1648</td>
</tr>
<tr>
<td align="left" valign="top">Child MUAC</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.0989</td>
<td align="center" valign="top">0.50</td>
<td align="center" valign="top">0.1599</td>
</tr>
<tr>
<td align="left" valign="top">Child gender</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.0453</td>
<td align="center" valign="top">0.50</td>
<td align="center" valign="top">0.1545</td>
</tr>
<tr>
<td align="left" valign="top">Child order</td>
<td align="center" valign="top">0.4</td>
<td align="center" valign="top">0.0669</td>
<td align="center" valign="top">1.00</td>
<td align="center" valign="top">0.1467</td>
</tr>
<tr>
<td align="left" valign="top">Maternal BMI</td>
<td align="center" valign="top">0.6</td>
<td align="center" valign="top">0.0443</td>
<td align="center" valign="top">0.75</td>
<td align="center" valign="top">0.1394</td>
</tr>
<tr>
<td align="left" valign="top">Mother MUAC</td>
<td align="center" valign="top">0.6</td>
<td align="center" valign="top">0.0411</td>
<td align="center" valign="top">0.75</td>
<td align="center" valign="top">0.1391</td>
</tr>
<tr>
<td align="left" valign="top">Child height</td>
<td align="center" valign="top">1.0</td>
<td align="center" valign="top">0.0820</td>
<td align="center" valign="top">0.25</td>
<td align="center" valign="top">0.1332</td>
</tr>
<tr>
<td align="left" valign="top">Child birth weight</td>
<td align="center" valign="top">0.8</td>
<td align="center" valign="top">0.0279</td>
<td align="center" valign="top">0.50</td>
<td align="center" valign="top">0.1328</td>
</tr>
<tr>
<td align="left" valign="top">Bottle feeding status</td>
<td align="center" valign="top">0.8</td>
<td align="center" valign="top">0.0220</td>
<td align="center" valign="top">0.25</td>
<td align="center" valign="top">0.1072</td>
</tr>
<tr>
<td align="left" valign="top">Mother age</td>
<td align="center" valign="top">0.6</td>
<td align="center" valign="top">0.0550</td>
<td align="center" valign="top">0.25</td>
<td align="center" valign="top">0.0905</td>
</tr>
<tr>
<td align="left" valign="top">Breastfeeding status</td>
<td align="center" valign="top">0.8</td>
<td align="center" valign="top">0.0969</td>
<td align="center" valign="top">0.00</td>
<td align="center" valign="top">0.0897</td>
</tr>
<tr>
<td align="left" valign="top">Maternal education</td>
<td align="center" valign="top">0.1</td>
<td align="center" valign="top">0.0336</td>
<td align="center" valign="top">0.75</td>
<td align="center" valign="top">0.0884</td>
</tr>
<tr>
<td align="left" valign="top">Food type</td>
<td align="center" valign="top">0.2</td>
<td align="center" valign="top">0.0539</td>
<td align="center" valign="top">0.50</td>
<td align="center" valign="top">0.0754</td>
</tr>
<tr>
<td align="left" valign="top">Total child</td>
<td align="center" valign="top">0.4</td>
<td align="center" valign="top">0.0252</td>
<td align="center" valign="top">0.25</td>
<td align="center" valign="top">0.0675</td>
</tr>
<tr>
<td align="left" valign="top">Mother height</td>
<td align="center" valign="top">0.6</td>
<td align="center" valign="top">0.0443</td>
<td align="center" valign="top">0.00</td>
<td align="center" valign="top">0.0644</td>
</tr>
<tr>
<td align="left" valign="top">Family planning status</td>
<td align="center" valign="top">0.1</td>
<td align="center" valign="top">0.0112</td>
<td align="center" valign="top">0.50</td>
<td align="center" valign="top">0.0611</td>
</tr>
<tr>
<td align="left" valign="top">Residence</td>
<td align="center" valign="top">0.2</td>
<td align="center" valign="top">0.0340</td>
<td align="center" valign="top">0.25</td>
<td align="center" valign="top">0.0484</td>
</tr>
<tr>
<td align="left" valign="top">Caste</td>
<td align="center" valign="top">0.2</td>
<td align="center" valign="top">0.0139</td>
<td align="center" valign="top">0.00</td>
<td align="center" valign="top">0.0214</td>
</tr>
<tr>
<td align="left" valign="top">Ration card</td>
<td align="center" valign="top">0.2</td>
<td align="center" valign="top">0.0000</td>
<td align="center" valign="top">0.00</td>
<td align="center" valign="top">0.0200</td>
</tr>
<tr>
<td align="left" valign="top">Working code</td>
<td align="center" valign="top">0.1</td>
<td align="center" valign="top">0.0000</td>
<td align="center" valign="top">0.00</td>
<td align="center" valign="top">0.0100</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>The table presents consolidated feature scores for malnutrition-related data. The RISE score represents the final integrated score for each feature, calculated by combining: 1. Domain score &#x2013; assigned based on thematic grouping and expert ranking and then normalized to the range 0&#x2013;1. 2. Model score &#x2013; the feature importance obtained from the XGBoost classifier. 3. Frequency boost &#x2013; awarded to features that are repeatedly identified by the statistical filter-based ensemble models. The combination is controlled by hyperparameters &#x03B1;, &#x03B2;, and &#x03B3;, which were optimized using nested cross-validation (nested CV). The optimal values obtained were &#x03B1;&#x202F;=&#x202F;&#x03B2;&#x202F;=&#x202F;&#x03B3;&#x202F;=&#x202F;0.1, resulting in a nested CV mean F1 score of 0.824.</p>
</table-wrap-foot>
</table-wrap>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Feature importance and RISE score visualization. This figure presents a comparative analysis of feature importance using four scoring metrics. Model score: quantifies each feature&#x2019;s predictive contribution based on XGBoost. Domain score: reflects relevance based on thematic grouping and domain knowledge. Frequency boost: reflects how consistently a feature appears among the top 10 features of the filter-based XGBoost models. RISE score: a composite metric integrating the above three scores to represent overall feature relevance.</p>
</caption>
<graphic xlink:href="fpubh-13-1663373-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Bar chart titled "Feature Importance and RISE Score Visualization" showing various features on the x-axis and their corresponding scores on the y-axis. Bars represent Model Score (green), Domain Score (cyan), and Frequency Boost (red). A line graph overlays the bars depicting the RISE Score (brown line with dots), which decreases across features.</alt-text>
</graphic>
</fig>
</sec>
<sec sec-type="discussion" id="sec19">
<label>4</label>
<title>Discussion</title>
<p>The analysis of top-ranked features using the RISE framework reveals critical insights into the multifaceted nature of acute forms of child malnutrition. Among the various determinants, child anthropometric indicators emerged as the most influential, followed by maternal anthropometry and child order. Data from the NRC reinforce these findings: over 88% of malnourished children were being breastfed, including 58.51% of MAM cases and 44.32% of SAM cases. Furthermore, 49.0% of mothers of children diagnosed with SAM had an inadequate BMI, indicating undernutrition. Similarly, a higher proportion, 56.6% of mothers of children with MAM, also exhibited inadequate BMI levels (<xref ref-type="bibr" rid="ref8">8</xref>). This strongly suggests an interlinked pattern in which mothers with poor nutritional status may be breastfeeding children who consequently face an increased risk of malnutrition, emphasizing the dual burden of maternal and child undernutrition. The study also implements SHAP (SHapley Additive Explanations), which indicates how each feature contributes to the model&#x2019;s predictions. The SHAP results further validate that maternal anthropometry, such as the mother&#x2019;s weight, plays a significant role in acute forms of child malnutrition, as presented in <xref ref-type="fig" rid="fig4">Figure 4</xref>. Child order reflects the burden of familial resource allocation, with 56.31% of malnourished children being of second birth order or higher, indicating that increasing family size may dilute maternal attention and care (<xref ref-type="bibr" rid="ref9">9</xref>, <xref ref-type="bibr" rid="ref10">10</xref>), as further confirmed by the SHAP analysis presented in <xref ref-type="fig" rid="fig4">Figure 4</xref>. Together, the integrated model insights and contextual statistics highlight critical intervention points. 
The evidence highlights the importance of policy strategies that enhance maternal nutrition, target vulnerable groups, and support young mothers, particularly those breastfeeding, in effectively breaking the intergenerational cycle of malnutrition (<xref ref-type="bibr" rid="ref29">29</xref>, <xref ref-type="bibr" rid="ref30">30</xref>).</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>SHAP summary plot showing feature contributions for acute forms of child malnutrition.</p>
</caption>
<graphic xlink:href="fpubh-13-1663373-g004.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">A SHAP summary plot displaying the impact of different features on model output. Features such as Weight, Height, and Mother_Weight show varying degrees of influence. Data points are colored on a spectrum from high (red) to low (blue) feature values, indicating their positive or negative impact on predictions. The x-axis represents SHAP values ranging from negative six to positive six, showing how each feature pushes the prediction higher or lower.</alt-text>
</graphic>
</fig>
<p>This research offers a novel contribution to the fields of child malnutrition and machine learning. Firstly, in the child malnutrition domain, a multi-dimensional and data-driven exploration of the complex determinants of acute forms of child undernutrition is achieved through integrated analysis of maternal and child factors, emphasizing the mother&#x2013;child nutritional dyad as a central axis of malnutrition (<xref ref-type="bibr" rid="ref29">29</xref>). This integrated approach moves beyond child-focused indicators and reflects a life-cycle and intergenerational perspective on malnutrition. Secondly, this research introduces a novel and comprehensive feature prioritization framework, RISE (Relevance-based Integration of Statistics and Expertise), that represents a significant advancement in the field of child malnutrition analytics. Unlike conventional studies that depend on machine learning feature importance or subjective domain prioritization (<xref ref-type="bibr" rid="ref7 ref8 ref9 ref10 ref11 ref12 ref13 ref14 ref15 ref16 ref17">7&#x2013;17</xref>), this study uniquely integrates multi-dimensional evidence by combining four robust statistical filter methods (Mutual Information, Chi-square, ANOVA-F, ReliefF) with an ensemble model, domain-based scoring, and a newly proposed frequency boosting technique that captures the cross-method consensus of feature relevance. This multi-branch integration ensures that underrepresented yet contextually vital variables are not bypassed by purely statistical weightings (<xref ref-type="bibr" rid="ref27">27</xref>). The RISE framework thus reflects a paradigm shift from purely model-driven selection to an interpretable, explainable, and policy-relevant decision layer. Its adaptable scoring logic and modular design make it suitable for extension to other health and development research areas, establishing both scientific novelty and practical utility.</p>
<p>Some features, such as Mother Height, Breastfeeding Status, Caste, Maternal Working Status, and Ration Card, obtained a frequency boost score of zero. This indicates that none of the statistical feature selection methods consistently identified these variables as important predictors. The likely reasons include weak or indirect associations with acute forms of malnutrition and underrepresentation of certain subgroups in the dataset. Nevertheless, these features remain highly relevant from a public health and domain perspective, as they capture socioeconomic and behavioral dimensions of child nutrition that purely statistical methods may overlook. Therefore, the RISE framework incorporates domain-based correction to ensure such features are not disregarded solely based on low statistical detectability. Limitations of this study include the potential lack of generalizability due to the region-specific and institutionalized nature of the dataset. Such data may reflect only children accessing a particular facility, thereby excluding those without access to the facility or in different regional contexts. Additionally, while the RISE framework offers an advantage by incorporating domain knowledge along with statistical and model-driven methods, it introduces a level of subjectivity, particularly in assigning domain-based weights. Expert input for feature grouping and ranking was not derived through a formal elicitation process. External and temporal validation are essential to ensure the model&#x2019;s reliability across different populations, settings, and time periods. Although the model demonstrates strong performance within the current dataset, its generalizability remains untested.</p>
</sec>
<sec sec-type="conclusions" id="sec20">
<label>5</label>
<title>Conclusion</title>
<p>Among the top features ranked by the RISE score, child anthropometry emerged as the most influential, followed by maternal anthropometry and child order. This hierarchy underscores a double burden of malnutrition. It also reflects the importance of physical growth parameters in assessing nutritional status. Further down, features like maternal anthropometry and child order underscore their influence on child health outcomes. The presence of these variables at the top reinforces the understanding that maternal nutritional status and physical attributes play a key role in shaping a child&#x2019;s growth and development, further highlighting the multifactorial nature of malnutrition.</p>
<p>The RISE framework demonstrates its strength by effectively identifying and assigning importance to features that were under-prioritized by conventional filter-based or model-based feature selection methods. For instance, features such as Ration card&#x202F;=&#x202F;0.0200, Working status&#x202F;=&#x202F;0.0100, Caste&#x202F;=&#x202F;0.0214, Mother height&#x202F;=&#x202F;0.0644, and Breastfeeding status&#x202F;=&#x202F;0.0897 lacked frequency boost contributions but were still given significant weight by the RISE framework. This reflects the inclusive nature of RISE, which integrates domain relevance, statistical contribution, and contextual importance, allowing it to highlight features that might be overlooked by purely data-driven models but are crucial in real-world health and nutritional contexts.</p>
<p>Addressing child malnutrition is a crucial step toward achieving the Sustainable Development Goals, particularly SDG 2 (Zero Hunger) and SDG 3 (Good Health and Well-being). The development and implementation of the RISE framework advances malnutrition analytics by bridging the gap between data-driven methodologies and domain expertise. Unlike traditional feature selection methods that may overlook critical variables due to statistical bias, RISE facilitates a more equitable, context-aware, and interpretable feature evaluation. By elevating the significance of factors like maternal education, breastfeeding practices, and socioeconomic conditions, the RISE approach ensures that key public health insights are retained and highlighted in machine learning models. Finally, this framework strengthens the translation of empirical data into actionable knowledge, empowering targeted interventions and evidence-based policymaking in addressing child malnutrition, thus contributing directly to global health equity and the realization of the SDGs.</p>
<sec id="sec21">
<label>5.1</label>
<title>Future work</title>
<p>While the current model demonstrates strong performance within the study dataset, future research should focus strongly on external and temporal validation to ensure reliability, broader applicability, and generalizability. Validating the framework on independent datasets from different geographic regions and across varied time periods would help in identifying the key determinants of acute child malnutrition.</p>
</sec>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec22">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/Supplementary material, further inquiries can be directed to the corresponding author. The code is available at: <ext-link xlink:href="https://github.com/Shruthi-S-Scholar/ChildMalnutrition-rise-framework" ext-link-type="uri">https://github.com/Shruthi-S-Scholar/ChildMalnutrition-rise-framework</ext-link>.</p>
</sec>
<sec sec-type="ethics-statement" id="sec23">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Mysore Medical College and Research Institute, Mysore, Karnataka. The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation in this study was provided by the participants&#x2019; legal guardians/next of kin.</p>
</sec>
<sec sec-type="author-contributions" id="sec24">
<title>Author contributions</title>
<p>SShr: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. PG: Conceptualization, Supervision, Validation, Writing &#x2013; review &#x0026; editing. SSha: Data curation, Supervision, Validation, Writing &#x2013; review &#x0026; editing. PA: Supervision, Writing &#x2013; review &#x0026; editing. AU: Supervision, Writing &#x2013; review &#x0026; editing. LR: Supervision, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="funding-information" id="sec25">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research and/or publication of this article.</p>
</sec>
<sec sec-type="COI-statement" id="sec26">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec27">
<title>Generative AI statement</title>
<p>The author(s) declare that no Gen AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec28">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><label>1.</label> <citation citation-type="other"><person-group person-group-type="author"><collab id="coll1">World Health Organization</collab></person-group>. (<year>2024</year>). Malnutrition. Available online at: <ext-link xlink:href="https://www.who.int/news-room/fact-sheets/detail/malnutrition" ext-link-type="uri">https://www.who.int/news-room/fact-sheets/detail/malnutrition</ext-link>.</citation></ref>
<ref id="ref2"><label>2.</label> <citation citation-type="other"><person-group person-group-type="author"><collab id="coll2">World Health Organization, UNICEF, &#x0026; World Bank Group</collab></person-group>. (<year>2025</year>). Levels and trends in child malnutrition: UNICEF/WHO/World Bank Group joint child malnutrition estimates&#x2014;Key findings of the 2025 edition (ISBN 978-92-4-011230-8). Available online at: <ext-link xlink:href="https://www.who.int/publications/i/item/9789240112308" ext-link-type="uri">https://www.who.int/publications/i/item/9789240112308</ext-link>.</citation></ref>
<ref id="ref3"><label>3.</label> <citation citation-type="other"><person-group person-group-type="author"><collab id="coll3">IIPS &#x0026; MoHFW</collab></person-group>. (<year>2021</year>). International Institute for Population Sciences (IIPS) &#x0026; Ministry of Health and Family Welfare (MoHFW). Ministry of Health and Family Welfare, India. Available online at: <ext-link xlink:href="https://mohfw.gov.in/sites/default/files/NFHS-5_Phase-II_0.pdf" ext-link-type="uri">https://mohfw.gov.in/sites/default/files/NFHS-5_Phase-II_0.pdf</ext-link></citation></ref>
<ref id="ref4"><label>4.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Laksono</surname><given-names>AD</given-names></name> <name><surname>Izza</surname><given-names>N</given-names></name> <name><surname>Trisnani</surname><given-names>T</given-names></name> <name><surname>Paramita</surname><given-names>A</given-names></name> <name><surname>Sholikhah</surname><given-names>HH</given-names></name> <name><surname>Andarwati</surname><given-names>P</given-names></name> <etal/></person-group>. <article-title>Determination of appropriate policy targets to reduce the prevalence of stunting in children under five years of age in urban-poor communities in Indonesia: a secondary data analysis of the 2022 Indonesian national nutritional status survey</article-title>. <source>BMJ Open</source>. (<year>2024</year>) <volume>14</volume>:<fpage>e089531</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmjopen-2024-089531</pub-id>, PMID: <pub-id pub-id-type="pmid">39306355</pub-id></citation></ref>
<ref id="ref5"><label>5.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rezaee</surname><given-names>MT</given-names></name> <name><surname>Zakki</surname><given-names>SA</given-names></name> <name><surname>Haq</surname><given-names>I u</given-names></name> <name><surname>Rahimi</surname><given-names>N</given-names></name> <name><surname>Fayaz</surname><given-names>M</given-names></name></person-group>. <article-title>Cross-sectional study of determinants of undernutrition among children aged 6&#x2013;36 months in Kabul, Afghanistan</article-title>. <source>BMJ Open</source>. (<year>2024</year>) <volume>14</volume>:<fpage>e079839</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmjopen-2023-079839</pub-id>, PMID: <pub-id pub-id-type="pmid">39160103</pub-id></citation></ref>
<ref id="ref6"><label>6.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Qasrawi</surname><given-names>R</given-names></name> <name><surname>Sgahir</surname><given-names>S</given-names></name> <name><surname>Nemer</surname><given-names>M</given-names></name> <name><surname>Halaikah</surname><given-names>M</given-names></name> <name><surname>Badrasawi</surname><given-names>M</given-names></name> <name><surname>Amro</surname><given-names>M</given-names></name> <etal/></person-group>. <article-title>Machine learning approach for predicting the impact of food insecurity on nutrient consumption and malnutrition in children aged 6 months to 5 years</article-title>. <source>Children</source>. (<year>2024</year>) <volume>11</volume>:<fpage>810</fpage>. doi: <pub-id pub-id-type="doi">10.3390/children11070810</pub-id></citation></ref>
<ref id="ref7"><label>7.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Anku</surname><given-names>EK</given-names></name> <name><surname>Duah</surname><given-names>HO</given-names></name></person-group>. <article-title>Predicting and identifying factors associated with undernutrition among children under five years in Ghana using machine learning algorithms</article-title>. <source>PLoS One</source>. (<year>2024</year>) <volume>19</volume>:<fpage>e0296625</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0296625</pub-id>, PMID: <pub-id pub-id-type="pmid">38349921</pub-id></citation></ref>
<ref id="ref8"><label>8.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Talukder</surname><given-names>A</given-names></name> <name><surname>Ahammed</surname><given-names>B</given-names></name></person-group>. <article-title>Machine learning algorithms for predicting malnutrition among under-five children in Bangladesh</article-title>. <source>Nutrition</source>. (<year>2020</year>) <volume>78</volume>:<fpage>110861</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.nut.2020.110861</pub-id>, PMID: <pub-id pub-id-type="pmid">32592978</pub-id></citation></ref>
<ref id="ref9"><label>9.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fenta</surname><given-names>HM</given-names></name> <name><surname>Zewotir</surname><given-names>T</given-names></name> <name><surname>Muluneh</surname><given-names>EK</given-names></name></person-group>. <article-title>A machine learning classifier approach for identifying the determinants of under-five child undernutrition in Ethiopian administrative zones</article-title>. <source>BMC Med Inform Decis Mak</source>. (<year>2021</year>) <volume>21</volume>:<fpage>291</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12911-021-01652-1</pub-id>, PMID: <pub-id pub-id-type="pmid">34689769</pub-id></citation></ref>
<ref id="ref10"><label>10.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bitew</surname><given-names>FH</given-names></name> <name><surname>Sparks</surname><given-names>CS</given-names></name> <name><surname>Nyarko</surname><given-names>SH</given-names></name></person-group>. <article-title>Machine learning algorithms for predicting undernutrition among under-five children in Ethiopia</article-title>. <source>Public Health Nutr</source>. (<year>2022</year>) <volume>25</volume>:<fpage>269</fpage>&#x2013;<lpage>80</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S1368980021004262</pub-id>, PMID: <pub-id pub-id-type="pmid">34620263</pub-id></citation></ref>
<ref id="ref11"><label>11.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Khan</surname><given-names>JR</given-names></name> <name><surname>Tomal</surname><given-names>JH</given-names></name> <name><surname>Raheem</surname><given-names>E</given-names></name></person-group>. <article-title>Model and variable selection using machine learning methods with applications to childhood stunting in Bangladesh</article-title>. <source>Inform Health Soc Care</source>. (<year>2021</year>) <volume>46</volume>:<fpage>425</fpage>&#x2013;<lpage>42</lpage>. doi: <pub-id pub-id-type="doi">10.1080/17538157.2021.1904938</pub-id>, PMID: <pub-id pub-id-type="pmid">33851897</pub-id></citation></ref>
<ref id="ref12"><label>12.</label> <citation citation-type="book"><person-group person-group-type="author"><name><surname>Vasu</surname><given-names>SR</given-names></name> <name><surname>Khare</surname><given-names>S</given-names></name> <name><surname>Gupta</surname><given-names>D</given-names></name> <name><surname>Jyotishi</surname><given-names>A</given-names></name></person-group>. <article-title>Features explaining malnutrition in India: a machine learning approach to demographic and health survey data</article-title> In: <person-group person-group-type="editor"><name><surname>Garg</surname><given-names>D</given-names></name> <name><surname>Wong</surname><given-names>K</given-names></name> <name><surname>Sarangapani</surname><given-names>J</given-names></name> <name><surname>Gupta</surname><given-names>SK</given-names></name></person-group>, editors. <source>Advanced computing</source>. 10th International Conference, IACC 2020, Panaji, Goa, India: <publisher-name>Springer</publisher-name> (<year>2021</year>). <fpage>87</fpage>&#x2013;<lpage>99</lpage>.</citation></ref>
<ref id="ref13"><label>13.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mohammad</surname><given-names>UG</given-names></name> <name><surname>Imtiaz</surname><given-names>S</given-names></name> <name><surname>Shakya</surname><given-names>M</given-names></name> <name><surname>Almadhor</surname><given-names>A</given-names></name> <name><surname>Anwar</surname><given-names>F</given-names></name></person-group>. <article-title>An optimized feature selection method using ensemble classifiers in software defect prediction for healthcare systems</article-title>. <source>Wirel Commun Mob Comput</source>. (<year>2022</year>) <volume>2022</volume>:<fpage>1028175</fpage>. doi: <pub-id pub-id-type="doi">10.1155/2022/1028175</pub-id></citation></ref>
<ref id="ref14"><label>14.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ndagijimana</surname><given-names>S</given-names></name> <name><surname>Kabano</surname><given-names>IH</given-names></name> <name><surname>Masabo</surname><given-names>E</given-names></name> <name><surname>Ntaganda</surname><given-names>JM</given-names></name></person-group>. <article-title>Prediction of stunting among Under-5 children in Rwanda using machine learning techniques</article-title>. <source>J Prev Med Public Health</source>. (<year>2023</year>) <volume>56</volume>:<fpage>41</fpage>&#x2013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.3961/jpmph.22.388</pub-id>, PMID: <pub-id pub-id-type="pmid">36746421</pub-id></citation></ref>
<ref id="ref15"><label>15.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Turjo</surname><given-names>EA</given-names></name> <name><surname>Rahman</surname><given-names>MH</given-names></name></person-group>. <article-title>Assessing risk factors for malnutrition among women in Bangladesh and forecasting malnutrition using machine learning approaches</article-title>. <source>BMC Nutr</source>. (<year>2024</year>) <volume>10</volume>:<fpage>22</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s40795-023-00808-8</pub-id>, PMID: <pub-id pub-id-type="pmid">38303093</pub-id></citation></ref>
<ref id="ref16"><label>16.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mkungudza</surname><given-names>J</given-names></name> <name><surname>Twabi</surname><given-names>HS</given-names></name> <name><surname>Manda</surname><given-names>SOM</given-names></name></person-group>. <article-title>Development of a diagnostic predictive model for determining child stunting in Malawi: a comparative analysis of variable selection approaches</article-title>. <source>BMC Med Res Methodol</source>. (<year>2024</year>) <volume>24</volume>:<fpage>175</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12874-024-02283-6</pub-id>, PMID: <pub-id pub-id-type="pmid">39118039</pub-id></citation></ref>
<ref id="ref17"><label>17.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saleem</surname><given-names>J</given-names></name> <name><surname>Zakar</surname><given-names>R</given-names></name> <name><surname>Butt</surname><given-names>MS</given-names></name> <name><surname>Aadil</surname><given-names>RM</given-names></name> <name><surname>Ali</surname><given-names>Z</given-names></name> <name><surname>Bukhari</surname><given-names>GMJ</given-names></name> <etal/></person-group>. <article-title>Application of the Boruta algorithm to assess the multidimensional determinants of malnutrition among children under five years living in southern Punjab, Pakistan</article-title>. <source>BMC Public Health</source>. (<year>2024</year>) <volume>24</volume>:<fpage>167</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12889-024-17701-z</pub-id>, PMID: <pub-id pub-id-type="pmid">38216908</pub-id></citation></ref>
<ref id="ref18"><label>18.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yal&#x00E7;&#x0131;n</surname><given-names>N</given-names></name> <name><surname>Ka&#x015F;&#x0131;kc&#x0131;</surname><given-names>M</given-names></name> <name><surname>&#x00C7;elik</surname><given-names>HT</given-names></name> <name><surname>Demirkan</surname><given-names>K</given-names></name> <name><surname>Yi&#x011F;it</surname><given-names>&#x015E;</given-names></name> <name><surname>Yurdak&#x00F6;k</surname><given-names>M</given-names></name></person-group>. <article-title>Development and validation of machine learning-based clinical decision support tool for identifying malnutrition in NICU patients</article-title>. <source>Sci Rep</source>. (<year>2023</year>) <volume>13</volume>:<fpage>5227</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-023-32570-z</pub-id>, PMID: <pub-id pub-id-type="pmid">36997630</pub-id></citation></ref>
<ref id="ref19"><label>19.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rao</surname><given-names>B</given-names></name> <name><surname>Rashid</surname><given-names>M</given-names></name> <name><surname>Hasan</surname><given-names>MG</given-names></name> <name><surname>Thunga</surname><given-names>G</given-names></name></person-group>. <article-title>Machine learning in predicting child malnutrition: a meta-analysis of demographic and health surveys data</article-title>. <source>Int J Environ Res Public Health</source>. (<year>2025</year>) <volume>22</volume>:<fpage>449</fpage>. doi: <pub-id pub-id-type="doi">10.3390/ijerph22030449</pub-id>, PMID: <pub-id pub-id-type="pmid">40238576</pub-id></citation></ref>
<ref id="ref20"><label>20.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname><given-names>F</given-names></name> <name><surname>Chen</surname><given-names>K</given-names></name> <name><surname>Zhang</surname><given-names>X</given-names></name> <name><surname>Wang</surname><given-names>Q</given-names></name> <name><surname>Zhang</surname><given-names>Z</given-names></name> <name><surname>Niu</surname><given-names>W</given-names></name></person-group>. <article-title>Prevalence of malnutrition and associated factors in Chinese children and adolescents aged 3&#x2013;14 years using machine learning algorithms</article-title>. <source>J Glob Health</source>. (<year>2025</year>) <volume>15</volume>:<fpage>04204</fpage>. doi: <pub-id pub-id-type="doi">10.7189/jogh.15.04204</pub-id>, PMID: <pub-id pub-id-type="pmid">40689479</pub-id></citation></ref>
<ref id="ref21"><label>21.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ayele</surname><given-names>MK</given-names></name> <name><surname>Baye</surname><given-names>GA</given-names></name> <name><surname>Yesuf</surname><given-names>SH</given-names></name> <name><surname>Engda</surname><given-names>AA</given-names></name> <name><surname>Mitiku</surname><given-names>ET</given-names></name></person-group>. <article-title>Predicting stunting status among under five children in Ethiopia using ensemble machine learning algorithms</article-title>. <source>Sci Rep</source>. (<year>2025</year>) <volume>15</volume>:<fpage>27907</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-025-03206-1</pub-id>, PMID: <pub-id pub-id-type="pmid">40745172</pub-id></citation></ref>
<ref id="ref22"><label>22.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hendy</surname><given-names>A</given-names></name> <name><surname>Abdelaliem</surname><given-names>SMF</given-names></name> <name><surname>Sultan</surname><given-names>HM</given-names></name> <name><surname>Alahmedi</surname><given-names>SH</given-names></name> <name><surname>Ibrahim</surname><given-names>RK</given-names></name> <name><surname>Abdelrazek</surname><given-names>EME</given-names></name> <etal/></person-group>. <article-title>Unlocking insights: using machine learning to identify wasting and risk factors in Egyptian children under 5</article-title>. <source>Nutrition</source>. (<year>2025</year>) <volume>131</volume>:<fpage>112631</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.nut.2024.112631</pub-id>, PMID: <pub-id pub-id-type="pmid">39616982</pub-id></citation></ref>
<ref id="ref23"><label>23.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sugihartono</surname><given-names>T</given-names></name> <name><surname>Wijaya</surname><given-names>B</given-names></name> <name><surname>Marini</surname><given-names>M</given-names></name> <name><surname>Alkayess</surname><given-names>AP</given-names></name> <name><surname>Anugerah</surname><given-names>HA</given-names></name></person-group>. <article-title>Optimizing stunting detection through SMOTE and machine learning: a comparative study of XGBoost, random forest, SVM, and k-NN</article-title>. <source>J Appl Data Sci</source>. (<year>2025</year>) <volume>6</volume>:<fpage>667</fpage>&#x2013;<lpage>82</lpage>. doi: <pub-id pub-id-type="doi">10.47738/jads.v6i1.494</pub-id></citation></ref>
<ref id="ref24"><label>24.</label> <citation citation-type="other"><person-group person-group-type="author"><collab id="coll4">World Health Organization (WHO)</collab></person-group> (<year>2006</year>). Child growth standards. Available online at: <ext-link xlink:href="https://www.who.int/publications/i/item/924154693X" ext-link-type="uri">https://www.who.int/publications/i/item/924154693X</ext-link></citation></ref>
<ref id="ref25"><label>25.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Paul</surname><given-names>S</given-names></name> <name><surname>Rahman</surname><given-names>M</given-names></name> <name><surname>Dolley</surname><given-names>A</given-names></name> <name><surname>Saikia</surname><given-names>K</given-names></name> <name><surname>Singh</surname><given-names>CS</given-names></name> <name><surname>Mohammed</surname><given-names>A</given-names></name> <etal/></person-group>. <article-title>A retrospective study using machine learning to develop predictive model to identify rotavirus-associated acute gastroenteritis in children</article-title>. <source>PeerJ</source>. (<year>2025</year>) <volume>13</volume>:<fpage>e19025</fpage>. doi: <pub-id pub-id-type="doi">10.7717/peerj.19025</pub-id>, PMID: <pub-id pub-id-type="pmid">40247842</pub-id></citation></ref>
<ref id="ref26"><label>26.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tripathi</surname><given-names>A</given-names></name> <name><surname>Ragiri</surname><given-names>PR</given-names></name> <name><surname>Jain</surname><given-names>D</given-names></name> <name><surname>Yadav</surname><given-names>T</given-names></name></person-group>. <article-title>Machine learning-based predictive models for early diagnosis of liver disease</article-title>. <source>J Sci Ind Res</source>. (<year>2025</year>) <volume>84</volume>:<fpage>575</fpage>&#x2013;<lpage>83</lpage>. doi: <pub-id pub-id-type="doi">10.56042/jsir.v84i5.14828</pub-id></citation></ref>
<ref id="ref27"><label>27.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rabie</surname><given-names>AH</given-names></name> <name><surname>Aldawsari</surname><given-names>M</given-names></name> <name><surname>Saleh</surname><given-names>AI</given-names></name> <name><surname>Saraya</surname><given-names>MS</given-names></name> <name><surname>Rashad</surname><given-names>M</given-names></name></person-group>. <article-title>HFSA: hybrid feature selection approach to improve medical diagnostic system</article-title>. <source>PeerJ Comput Sci</source>. (<year>2025</year>) <volume>11</volume>:<fpage>e2764</fpage>. doi: <pub-id pub-id-type="doi">10.7717/peerj-cs.2764</pub-id>, PMID: <pub-id pub-id-type="pmid">40567630</pub-id></citation></ref>
<ref id="ref28"><label>28.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Soliman</surname><given-names>MM</given-names></name> <name><surname>Chowdhury</surname><given-names>MH</given-names></name> <name><surname>Murugappan</surname><given-names>M</given-names></name> <name><surname>Chowdhury</surname><given-names>MEH</given-names></name></person-group>. <article-title>Automated classification of post-operative gait abnormalities following hip surgery using machine learning</article-title>. <source>Eng Res Exp</source>. (<year>2025</year>) <volume>7</volume>:<fpage>035203</fpage>. doi: <pub-id pub-id-type="doi">10.1088/2631-8695/ade84d</pub-id></citation></ref>
<ref id="ref29"><label>29.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mekonnen</surname><given-names>S</given-names></name> <name><surname>Birhanu</surname><given-names>D</given-names></name> <name><surname>Menber</surname><given-names>Y</given-names></name> <name><surname>Gebreegziabher</surname><given-names>ZA</given-names></name> <name><surname>Belay</surname><given-names>MA</given-names></name></person-group>. <article-title>Double burden of malnutrition and associated factors among mother&#x2013;child pairs at household level in Bahir Dar City, Northwest Ethiopia: community based cross-sectional study design</article-title>. <source>Front Nutr</source>. (<year>2024</year>) <volume>11</volume>:<fpage>1340382</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fnut.2024.1340382</pub-id>, PMID: <pub-id pub-id-type="pmid">38445209</pub-id></citation></ref>
<ref id="ref30"><label>30.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rabiei</surname><given-names>S</given-names></name> <name><surname>Ebrahimof</surname><given-names>S</given-names></name> <name><surname>Rasekhi</surname><given-names>H</given-names></name> <name><surname>Amini</surname><given-names>M</given-names></name> <name><surname>Ghodsi</surname><given-names>D</given-names></name> <name><surname>Yari</surname><given-names>Z</given-names></name> <etal/></person-group>. <article-title>Exploring the determinants of malnutrition in 2&#x2013;5 year Iranian children using structural equation modeling: national food and nutrition surveillance</article-title>. <source>BMC Public Health</source>. (<year>2024</year>) <volume>24</volume>:<fpage>3406</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12889-024-20931-w</pub-id>, PMID: <pub-id pub-id-type="pmid">39696079</pub-id></citation></ref>
<ref id="ref31"><label>31.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kofi Amegah</surname><given-names>A</given-names></name> <name><surname>Ayinemi</surname><given-names>R</given-names></name> <name><surname>Sewor</surname><given-names>C</given-names></name> <name><surname>Fenta</surname><given-names>HM</given-names></name> <name><surname>Yeboah</surname><given-names>K</given-names></name> <name><surname>Mohammed</surname><given-names>SA</given-names></name> <etal/></person-group>. <article-title>Birth weight mediates the association of maternal undernutrition with child undernutrition prevalence in West Africa</article-title>. <source>Eur J Clin Nutr</source>. (<year>2024</year>) <volume>78</volume>:<fpage>772</fpage>&#x2013;<lpage>81</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41430-024-01453-5</pub-id>, PMID: <pub-id pub-id-type="pmid">38806645</pub-id></citation></ref>
<ref id="ref32"><label>32.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chiopris</surname><given-names>G</given-names></name> <name><surname>Chiopris</surname><given-names>C</given-names></name> <name><surname>Valenti</surname><given-names>M</given-names></name> <name><surname>Esposito</surname><given-names>S</given-names></name></person-group>. <article-title>Determinants of undernutrition among children admitted to a pediatric hospital in Port Sudan, Sudan</article-title>. <source>Nutrients</source>. (<year>2024</year>) <volume>16</volume>:<fpage>787</fpage>. doi: <pub-id pub-id-type="doi">10.3390/nu16060787</pub-id>, PMID: <pub-id pub-id-type="pmid">38542698</pub-id></citation></ref>
<ref id="ref33"><label>33.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Riwa</surname><given-names>FP</given-names></name> <name><surname>Odgers-Jewell</surname><given-names>K</given-names></name> <name><surname>Jones</surname><given-names>MA</given-names></name> <name><surname>Mushi</surname><given-names>AA</given-names></name></person-group>. <article-title>The prevalence and determinants of undernutrition among infants and children aged 6 months to 5 years in sub-Saharan African countries: a systematic scoping review</article-title>. <source>Nutr Rev</source>. (<year>2025</year>) <volume>83</volume>:<fpage>e1896</fpage>&#x2013;<lpage>916</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nutrit/nuae189</pub-id>, PMID: <pub-id pub-id-type="pmid">39760760</pub-id></citation></ref>
<ref id="ref34"><label>34.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pandey</surname><given-names>S</given-names></name> <name><surname>Rahut</surname><given-names>DB</given-names></name> <name><surname>Araki</surname><given-names>T</given-names></name></person-group>. <article-title>Ethnicity/caste and child anthropometric outcomes in India using the National Family Health Survey 2015&#x2013;16 and 2019&#x2013;21</article-title>. <source>PLoS One</source>. (<year>2024</year>) <volume>19</volume>:<fpage>e0311092</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0311092</pub-id>, PMID: <pub-id pub-id-type="pmid">39656694</pub-id></citation></ref>
<ref id="ref35"><label>35.</label> <citation citation-type="other"><person-group person-group-type="author"><name><surname>Bardia</surname><given-names>V.</given-names></name> <name><surname>Sophiya</surname><given-names>E.</given-names></name></person-group>. (<year>2024</year>). Diabetes prediction using machine learning algorithm: a comparative analysis. 2024 10th International Conference on Advanced Computing and Communication Systems (ICACCS), 1973&#x2013;1979.</citation></ref>
<ref id="ref36"><label>36.</label> <citation citation-type="journal"><person-group person-group-type="author"><name><surname>Km</surname><given-names>KR</given-names></name> <name><surname>Khan</surname><given-names>SB</given-names></name> <name><surname>Govindarajan</surname><given-names>P</given-names></name> <name><surname>TR</surname><given-names>M</given-names></name> <name><surname>Alojail</surname><given-names>M</given-names></name> <name><surname>Gadekallu</surname><given-names>TR</given-names></name></person-group>. <article-title>Machine learning-driven intelligent water quality assessment for enhanced drinking safety and real-time consumer awareness</article-title>. <source>Hydrol Res</source>. (<year>2025</year>) <volume>56</volume>:<fpage>136</fpage>&#x2013;<lpage>52</lpage>. doi: <pub-id pub-id-type="doi">10.2166/nh.2025.097</pub-id></citation></ref>
<ref id="ref37"><label>37.</label> <citation citation-type="other"><person-group person-group-type="author"><name><surname>Bonthu</surname><given-names>Y.</given-names></name> <name><surname>Mannam</surname><given-names>S.</given-names></name> <name><surname>Kandikunta</surname><given-names>G.</given-names></name> <name><surname>Keshagani</surname><given-names>V. G.</given-names></name> <name><surname>Sarath</surname><given-names>G.</given-names></name></person-group>. (<year>2024</year>). Heart attack risk prediction using advanced machine learning techniques. 2024 15th International Conference on Computing Communication and Networking Technologies (ICCCNT), 1&#x2013;6.</citation></ref>
<ref id="ref38"><label>38.</label> <citation citation-type="other"><person-group person-group-type="author"><name><surname>Reddy</surname><given-names>J. V. N. Y.</given-names></name> <name><surname>Ram</surname><given-names>G. S. S.</given-names></name> <name><surname>Varshini</surname><given-names>V.</given-names></name> <name><surname>Srinivas</surname><given-names>M.</given-names></name></person-group>. (<year>2025</year>). An empirical evaluation of machine learning models for stroke risk assessment with explainable AI. 2025 International Conference on Artificial Intelligence and Data Engineering (AIDE), 150&#x2013;157.</citation></ref>
</ref-list>
</back>
</article>