<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="systematic-review" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Public Health</journal-id>
<journal-title-group>
<journal-title>Frontiers in Public Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Public Health</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-2565</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpubh.2025.1667792</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Systematic Review</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Prediction of frailty in community older adults based on machine learning: a systematic review and meta-analysis</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Ou</surname>
<given-names>Yifan</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn0001"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3098719"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Jiang</surname>
<given-names>Dandan</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn0001"><sup>&#x2020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Pan</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Wen</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhou</surname>
<given-names>Yutong</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2768830"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Yao</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3217560"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Yin</surname>
<given-names>Xinhong</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>School of Nursing, University of South China</institution>, <city>Hengyang</city>, <state>Hunan</state>, <country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>The Second Hospital, University of South China</institution>, <city>Hengyang</city>, <state>Hunan</state>, <country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>&#x002A;</label>Correspondence: Xinhong Yin, <email xlink:href="mailto:2018000091@usc.edu.cn">2018000091@usc.edu.cn</email></corresp>
<fn fn-type="equal" id="fn0001">
<label>&#x2020;</label>
<p>These authors have contributed equally to this work and share first authorship</p>
</fn>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-01-12">
<day>12</day>
<month>01</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1667792</elocation-id>
<history>
<date date-type="received">
<day>17</day>
<month>07</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>28</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>18</day>
<month>12</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2026 Ou, Jiang, Li, Zhang, Zhou, Chen and Yin.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Ou, Jiang, Li, Zhang, Zhou, Chen and Yin</copyright-holder>
<license>
<ali:license_ref start_date="2026-01-12">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>An increasing number of predictive models for frailty in community-dwelling older adults are now being developed using machine learning methods. Differences between model performances limit their practical application. Therefore, we conducted a systematic review and meta-analysis to summarize and evaluate the performance and clinical applicability of these risk prediction models.</p>
</sec>
<sec>
<title>Methods</title>
<p>PubMed, Web of Science, Embase, Cochrane Library, Scopus, CINAHL, SinoMed, VIP, CNKI, and Wanfang were searched. The search time was from the database establishment to June 10, 2025. The PROBAST+AI assessment tool was used to assess the study quality, and a meta-analysis of the area under the curve (AUC) was performed using Stata18.0 software.</p>
</sec>
<sec>
<title>Results</title>
<p>A total of 10 studies were included, and 45 Machine Learning (ML) models were developed, of which 36 models were developed for internal validation and 9 for external validation. In the internal validation set, the pooled AUC for baseline frailty prediction studies was 0.878 (95% CI 0.799, 0.958), while the pooled AUC for longitudinal frailty prediction studies was 0.730 (0.670, 0.790). When all studies were pooled without distinguishing prediction time points, the overall pooled AUC was 0.786 (95% CI 0.697, 0.875).</p>
</sec>
<sec>
<title>Conclusion</title>
<p>Although most of the included models had good discrimination and calibration, the overall quality and applicability of the current study are still problematic. In future studies, researchers should follow the TRIPOD+AI statement and the PROBAST+AI list to construct high-quality, more applicable predictive models.</p>
</sec>
<sec>
<title>Systematic review registration</title>
<p><ext-link ext-link-type="uri" xlink:href="https://www.crd.york.ac.uk/PROSPERO/view/CRD420251071061">https://www.crd.york.ac.uk/PROSPERO/view/CRD420251071061</ext-link>, identifier CRD420251071061.</p>
</sec>
</abstract>
<kwd-group>
<kwd>aged</kwd>
<kwd>artificial intelligence</kwd>
<kwd>community</kwd>
<kwd>frailty</kwd>
<kwd>machine learning</kwd>
<kwd>prediction model</kwd>
<kwd>systematic review/meta-analysis</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. Project funded by Hunan Provincial Science and Technology Department (grant no. 2021SK51704). Funded by Natural Science Foundation of Hunan Province (grant no. 2024JJ6400). Research on the Teaching Reform of Degree and Graduate Students in Hunan Province (grant no. 024JGYB191).</funding-statement>
</funding-group>
<counts>
<fig-count count="5"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="77"/>
<page-count count="20"/>
<word-count count="11486"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Aging and Public Health</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>As people around the world are living longer, populations are aging much faster than ever before. According to United Nations data, by 2050, the number of people over the age of 60 will increase to 2.1 billion worldwide (<xref ref-type="bibr" rid="ref1">1</xref>). Frailty is primarily characterized by a decrease in physiological reserves and resistance to stressors as we age (<xref ref-type="bibr" rid="ref2">2</xref>). The global prevalence of frailty among older people in the community is 43.3% (<xref ref-type="bibr" rid="ref3">3</xref>). Not only does frailty affect the physical health and quality of life of older people, but it can also pose significant challenges to clinical practice and public health (<xref ref-type="bibr" rid="ref4">4</xref>). In addition to this, frailty increases the incidence of adverse health outcomes such as falls (<xref ref-type="bibr" rid="ref5">5</xref>), hospitalization (<xref ref-type="bibr" rid="ref6">6</xref>), and death (<xref ref-type="bibr" rid="ref7">7</xref>) among community-dwelling older adults.</p>
<p>Relevant research suggests that exercise interventions, nutritional support (<xref ref-type="bibr" rid="ref8">8</xref>), and the development of management plans through comprehensive geriatric assessments (<xref ref-type="bibr" rid="ref9">9</xref>) can prevent, delay, or reverse frailty in community-dwelling older adults (<xref ref-type="bibr" rid="ref10">10</xref>). Due to the complex pathophysiological mechanisms and diverse manifestations of frailty, it often presents with atypical symptoms clinically, making it prone to being overlooked and underdiagnosed in routine medical care (<xref ref-type="bibr" rid="ref11">11</xref>). Furthermore, frailty typically progresses insidiously, and by the time a definitive diagnosis is made in the late stages, the optimal window for intervention is often missed. Currently, commonly used frailty assessment tools, such as the Fried Frailty Phenotype and Frailty Index, are primarily employed to screen individuals already in a frail state, rather than identifying those at high risk of frailty (<xref ref-type="bibr" rid="ref12">12</xref>). The use of validated measurement tools to identify frailty and, thus, early management of frailty is considered a critical step in preventing frailty (<xref ref-type="bibr" rid="ref13">13</xref>, <xref ref-type="bibr" rid="ref14">14</xref>). Predictive models can estimate an individual&#x2019;s risk of a specific clinical outcome or event within a specific time frame based on multiple predictors (<xref ref-type="bibr" rid="ref15">15</xref>), which can help to screen at-risk populations so that early interventions can be made to prevent disease progression (<xref ref-type="bibr" rid="ref16">16</xref>).</p>
<p>In recent years, research on developing, validating, and updating predictive models in this field has increased to enable early identification of frailty-prone older adults individuals within communities (<xref ref-type="bibr" rid="ref17">17</xref>). These models assess the likelihood and risk of frailty onset among community-dwelling older adults based on multidimensional predictors including demographic characteristics, laboratory indicators, and clinical and psychological assessments. Relevant studies indicate that machine learning not only enhances predictive accuracy by leveraging big data or multidimensional datasets but also facilitates early disease detection and promotes targeted preventive interventions (<xref ref-type="bibr" rid="ref18">18</xref>, <xref ref-type="bibr" rid="ref19">19</xref>). Furthermore, machine learning efficiently processes large-scale datasets, generates hypotheses from data, and identifies underlying patterns. Advances in machine learning methodologies have made developing predictive models using these techniques faster and more accessible (<xref ref-type="bibr" rid="ref20">20</xref>). In summary, machine learning algorithms hold potential value in identifying frailty risk among community-dwelling older adults. However, due to the diversity of ML algorithms, variations in sample sizes and datasets, differences exist in the predictive performance of different models. The risk of bias in predictive models and their applicability in clinical practice requires further evaluation.</p>
<p>With the widespread application of machine learning in the health sector, research on frailty prediction models for older adults has been increasing. Existing systematic reviews have primarily focused on traditional statistical models such as logistic regression and Cox proportional hazards models (<xref ref-type="bibr" rid="ref17">17</xref>). While one study most closely aligned with this topic systematically reviewed machine learning-based frailty prediction models for community-dwelling older adults, revealing widespread deficiencies in reporting standards and methodological quality within the field, it did not conduct correlation analyses on model performance (<xref ref-type="bibr" rid="ref21">21</xref>). Although researchers are employing reporting guidelines and quality assessment tools to address modeling deficiencies and reduce bias, model predictive performance remains inconsistent, casting uncertainty over their clinical applicability. Therefore, in this study, the latest risk prediction model evaluation tool, PROBAST+AI (<xref ref-type="bibr" rid="ref22">22</xref>), was used to evaluate frailty prediction models constructed for community-dwelling older adults using machine-learning methods, and a meta-analysis was performed to analyze the AUC of the prediction models. It is expected to provide valuable guidance and reference for clinical practitioners in the development of frailty risk prediction models for community-dwelling older adults.</p>
</sec>
<sec sec-type="methods" id="sec2">
<label>2</label>
<title>Methods</title>
<p>This department&#x2019;s research adheres to the Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis or Diagnosis-Systematic Reviews and Meta-Analysis (TRIPOD-SRMA) (<xref ref-type="bibr" rid="ref23">23</xref>) and the Preferred Reporting Items for Systematic Reviews and Meta-Analyses (PRISMA) 2020 guidelines (<xref ref-type="bibr" rid="ref24">24</xref>). This study has been registered with PROSPERO (CRD420251071061).</p>
<sec id="sec3">
<label>2.1</label>
<title>Search strategy</title>
<p>We conducted a comprehensive search of multiple databases, including PubMed, Web of Science, Embase, Cochrane Library, Scopus, SinoMed, China National Knowledge Infrastructure (CNKI), Wanfang Database, China Science and Technology Journal Database (VIP), Cumulative Index to Nursing and Allied Health Literature (CINAHL). The search was conducted from the time of database construction to June 10, 2025. The objective was to identify studies that used machine learning methods to predict the onset of frailty in community-dwelling older adults. The search strategy used a combination of keywords and subject terms such as &#x201C;machine learning,&#x201D; &#x201C;artificial intelligence,&#x201D; &#x201C;predictive models,&#x201D; &#x201C;risk prediction modelling,&#x201D; &#x201C;frailty,&#x201D; &#x201C;aged&#x201D;, &#x201C;community&#x201D;, etc. The detailed search strategy is shown in <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref>, and the reference lists of the included literature were carefully reviewed to ensure comprehensiveness.</p>
<p>For systematic evaluation, we used the PICOTS system recommended by the CHARMS (Critical Appraisal and Data Extraction for Systematic Reviews of Prediction Modeling Studies) list (<xref ref-type="bibr" rid="ref25">25</xref>). The system helps frame the purpose of the review, the search strategy, and the inclusion and exclusion criteria for the studies. The key items of PICOTS are described as <xref ref-type="table" rid="tab1">Table 1</xref>.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Key projects of PICOTS.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">PICOTS</th>
<th align="left" valign="top">Description</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">P (population)</td>
<td align="left" valign="top">Community-dwelling older adults aged &#x2265;60&#x2009;years</td>
</tr>
<tr>
<td align="left" valign="top">I (Index prediction model)</td>
<td align="left" valign="top">Predictive models developed and/or validated using machine learning algorithms</td>
</tr>
<tr>
<td align="left" valign="top">C (Comparative)</td>
<td align="left" valign="top">A comparative study of machine learning algorithms versus other machine learning algorithms, traditional statistical analysis, and clinical scoring tools</td>
</tr>
<tr>
<td align="left" valign="top">O (Outcomes)</td>
<td align="left" valign="top">The predicted outcome is frailty</td>
</tr>
<tr>
<td align="left" valign="top">T (Timing)</td>
<td align="left" valign="top">Studies on cross-sectional and/or longitudinal prediction</td>
</tr>
<tr>
<td align="left" valign="top">S (Setting)</td>
<td align="left" valign="top">Research conducted in community settings</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec4">
<label>2.2</label>
<title>Inclusion and exclusion criteria</title>
<p>Based on the aforementioned research framework, we established the following inclusion and exclusion criteria:</p>
<p>Inclusion criteria: (1) Population: Community-dwelling older adults aged &#x2265;60&#x2009;years; (2) Predictive Model Type: Studies must develop or validate at least one machine learning-based predictive model, or compare machine learning algorithms with other machine learning algorithms, traditional statistical analyses, or clinical scoring tools, and must report at least one model performance metric (discrimination and/or calibration); (3) Study design: cohort studies, cross-sectional studies, and case&#x2013;control studies; (4) Study outcome: predicted outcome of frailty (comprehensive physical frailty), with frailty defined based on recognized standards or tools.</p>
<p>Exclusion criteria: (1) Studies not reporting the predictive model development process; (2) Studies limited to cognitive frailty or social frailty; (3) Literature not in English or Chinese; (4) Studies where full text was unavailable; (5) Case reports, reviews, conference abstracts, or guidelines; (6) Studies employing only traditional statistical models without machine learning algorithms, or studies conducted in non-community settings such as hospitals, clinics, or long-term care facilities; (7) Studies failing to report model performance metrics.</p>
</sec>
<sec id="sec5">
<label>2.3</label>
<title>Screening of articles</title>
<p>First, all literature retrieved from various databases was imported into EndNote X9 software for management, with duplicate records automatically removed. Subsequently, two independent researchers conducted an initial screening of the remaining literature&#x2019;s titles and abstracts to exclude obviously irrelevant studies. Finally, the same two researchers reviewed the full texts of the initially screened articles against predefined inclusion and exclusion criteria to determine the final list of included studies. Any disagreements were resolved through discussion or adjudication by a third researcher. Additionally, we carefully examined the reference lists of all eligible studies to ensure the completeness of the included literature.</p>
</sec>
<sec id="sec6">
<label>2.4</label>
<title>Data extraction</title>
<p>The search results were screened independently by two authors according to the CHARMS list. In case of disagreement, it was decided through discussion or by the third author. The information extracted from the selected articles included: (1) Basic information of the study: including information on the data source, country, year of publication, authors, sample size, outcome, outcome assessment tool, and candidate predictors. (2) Model information: including the extraction of information such as predictor screening methods, model construction methods, missing data handling methods, continuous variable handling methods, evaluation model indicators, and predictors finally included in the model.</p>
</sec>
<sec id="sec7">
<label>2.5</label>
<title>Quality assessment</title>
<p>Quality, potential risk of bias, and study applicability of the included literature were assessed using the PROBAST+AI evaluation tool (<xref ref-type="bibr" rid="ref22">22</xref>), a newly developed assessment tool for evaluating the quality, risk of bias, and applicability of regression- or artificial intelligence-based predictive models. It includes four domains: participants and data sources, predictors, outcomes, and analyses; a total of 34 signaling questions (16 for model development and 18 for model evaluation) and 6 applicability items (3 each for model development and model evaluation) were addressed. Signaling questions are answered as yes, probably yes, no, probably no, no information, or, when appropriate, not applicable. Quality concerns (for model development) are judged as low, high, or unclear, and risk of bias (for model evaluation) is judged as low, high, or unclear.</p>
</sec>
<sec id="sec8">
<label>2.6</label>
<title>Statistical analysis</title>
<p>First, we summarized the AUC values and their 95% confidence intervals (95% CI) for each study. Due to the inconsistent time windows for frailty prediction across the included studies&#x2014;three studies assessed baseline prediction, six studies assessed longitudinal prediction, and one study assessed both baseline and longitudinal prediction&#x2014;we conducted meta-analyses based on the prediction window (baseline vs. longitudinal) and stratified analyses based on the model construction method. For studies that did not report the standard error (SE) or 95% CI of AUC, the Hanley and McNeil formula was used to estimate the SE and 95% CI (<xref ref-type="bibr" rid="ref26">26</xref>, <xref ref-type="bibr" rid="ref27">27</xref>). Considering that the included studies may have heterogeneity among study designs, ML models, and predictors. Therefore, the AUC of each study was combined in the meta-analysis using the Der Simonian and Laird random effects model (<xref ref-type="bibr" rid="ref28">28</xref>). Heterogeneity between studies was assessed using the Cochrane <italic>Q</italic>-test and the <italic>I</italic><sup>2</sup> statistic (<italic>I</italic><sup>2</sup>&#x2009;&#x2265;&#x2009;50% or <italic>p</italic>&#x2009;&#x2264;&#x2009;0.10) to determine whether to use a fixed-effects model or a random-effects model (<xref ref-type="bibr" rid="ref29">29</xref>). All statistical analyses were performed using Stata18.0 software and results were considered statistically significant at <italic>p</italic>&#x2009;&#x003C;&#x2009;0.05.</p>
</sec>
</sec>
<sec sec-type="results" id="sec9">
<label>3</label>
<title>Results</title>
<sec id="sec10">
<label>3.1</label>
<title>Search results</title>
<p>Through systematic searching, we retrieved 8,210 articles from 10 databases. We also identified 4 studies by reviewing reference lists. After deduplication using EndNote X9 literature management software, 4,836 articles remained. Initial screening based on titles and abstracts led to the exclusion of 4,812 articles, leaving 24 articles for full-text eligibility assessment. After reviewing the full texts, we excluded 14 articles (reasons for exclusion detailed in <xref ref-type="fig" rid="fig1">Figure 1</xref>). Ultimately, 10 articles were included in this study (<xref ref-type="bibr" rid="ref30">30</xref>&#x2013;<xref ref-type="bibr" rid="ref39">39</xref>). <xref ref-type="fig" rid="fig1">Figure 1</xref> shows the Preferred Reporting Items for Systematic reviews and Meta-Analyses (PRISMA) 2020 flowchart depicting the comprehensive search process and results.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Shows the Preferred Reporting Items for Systematic reviews and Meta-Analyses (PRISMA) 2020 flowchart depicting the comprehensive search process and results.</p>
</caption>
<graphic xlink:href="fpubh-13-1667792-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Flowchart illustrating the identification of studies through databases and registers for a meta-analysis. Initial records (n=8214) were identified from sources like PubMed, Web of Science, and others. Duplicates removed were 3378. After screening 4836 records, 4812 were excluded based on title and abstract. Full-text articles assessed were 24, with 14 excluded for reasons such as pre-frailty outcomes or traditional models. Ten studies were included in the review, with nine in the meta-analysis. One report was excluded due to incomplete data.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec11">
<label>3.2</label>
<title>Basic characteristics of the included literature</title>
<p>Ten studies were included in this study with publication dates of 2022&#x2013;2025, all of which were in English. Most studies were cohort-based, including six prospective cohort studies, one retrospective cohort study, one cross-sectional cohort study, and two cross-sectional studies. Data for seven studies originated from single-center databases, while the remaining three studies utilized data collected by researchers from community sources. Among studies developing models using databases, data were sourced from China (<italic>n</italic> =&#x2009;5), Japan (<italic>n</italic> =&#x2009;1), and South Korea (<italic>n</italic> =&#x2009;1). Study sample sizes ranged from 214 to 14,540 participants, with 28&#x2013;4,883 outcome events recorded. Prevalence rates varied between 5.33% and 64.77%.</p>
<p>Candidate predictors numbered between 16 and 56, most commonly comprising demographic characteristics, clinical laboratory data, and lifestyle factors. Regarding frailty assessment, the most frequently used tools were the Fried Phenotype (<italic>n</italic> =&#x2009;4) and Frailty Index (<italic>n</italic> =&#x2009;3), with others including Kihon (<italic>n</italic> =&#x2009;1), Study of Osteoporotic Fractures (SOF) Index (<italic>n</italic> =&#x2009;1), and Tilburg Frailty Indicator (TFI) (<italic>n</italic> =&#x2009;1). Among these, five studies employed a binary classification of &#x201C;frail&#x201D; and &#x201C;non-frail&#x201D; to define outcomes, while the remaining five studies included a &#x201C;pre-frail&#x201D; state in their outcome definitions. The detailed characteristics of the included models are shown in <xref ref-type="table" rid="tab2">Table 2</xref>.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Overview of basic data of the included studies.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Author (year)</th>
<th align="left" valign="top">Country</th>
<th align="left" valign="top">Study design</th>
<th align="left" valign="top">Participants</th>
<th align="left" valign="top">Data source</th>
<th align="left" valign="top">Time windows</th>
<th align="left" valign="top">Main outcome</th>
<th align="left" valign="top">Frailty cases/sample size (%)</th>
<th align="left" valign="top">Candidate predictors</th>
<th align="left" valign="top">Outcome measures</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Mengjiao Yang 2024 (<xref ref-type="bibr" rid="ref37">37</xref>)</td>
<td align="left" valign="top">Japanese</td>
<td align="left" valign="top">Cross-sectional and longitudinal study</td>
<td align="left" valign="top">Aged &#x2265;65&#x2009;years<break/>Mean age 73.7<break/>Female 49.7%</td>
<td align="left" valign="top">Community Empowerment and Care for Wellbeing and Healthy Longevity: Evidence from a Cohort Study</td>
<td align="left" valign="top">Baseline and Longitudinal</td>
<td align="left" valign="top">Frailty</td>
<td align="left" valign="top">Cross-sectional: 95/673 (14.1%)<break/>Longitudinal: 90/373 (24.1%)</td>
<td align="left" valign="top">34 (Socio-demographic characteristics, Lifestyle characteristics, Disease characteristics, Physical condition, Psychological condition, Social relationships)</td>
<td align="left" valign="top">Kihon</td>
</tr>
<tr>
<td align="left" valign="top">Qinqin Liu 2023 (<xref ref-type="bibr" rid="ref34">34</xref>)</td>
<td align="left" valign="top">China</td>
<td align="left" valign="top">Prospective cohort study</td>
<td align="left" valign="top">Aged &#x2265;60&#x2009;years<break/>Mean age 66.7<break/>Female 47.3%</td>
<td align="left" valign="top">China Health and Retirement Longitudinal Study</td>
<td align="left" valign="top">Longitudinal</td>
<td align="left" valign="top">Frailty</td>
<td align="left" valign="top">Derivation cohort:<break/>766/2,241 (34.2%)<break/>Internal validation cohort:<break/>195/561 (34.8%)<break/>External validation cohort:<break/>557/1,721 (32.4%)</td>
<td align="left" valign="top">37 (Sociodemographic, Clinical, lifestyle-related and Cognitive psychological factors)</td>
<td align="left" valign="top">Fried frailty Phenotype</td>
</tr>
<tr>
<td align="left" valign="top">Shaoyi Fan 2023 (<xref ref-type="bibr" rid="ref31">31</xref>)</td>
<td align="left" valign="top">China</td>
<td align="left" valign="top">Prospective cohort study</td>
<td align="left" valign="top">Aged 60&#x2013;95&#x2009;years<break/>Mean age 68.9<break/>Female 72.9%</td>
<td align="left" valign="top">Four community centers in Guangzhou</td>
<td align="left" valign="top">Baseline</td>
<td align="left" valign="top">Frailty</td>
<td align="left" valign="top">28/214 (13.1%)</td>
<td align="left" valign="top">16 (GCA, Walking test)</td>
<td align="left" valign="top">Fried frailty Phenotype</td>
</tr>
<tr>
<td align="left" valign="top">Yafei Wu 2022 (<xref ref-type="bibr" rid="ref36">36</xref>)</td>
<td align="left" valign="top">China</td>
<td align="left" valign="top">Retrospective cohort</td>
<td align="left" valign="top">Aged &#x2265;65&#x2009;years<break/>Mean age 77.0<break/>Female 52.0%</td>
<td align="left" valign="top">Chinese Longitudinal Healthy Longevity and Happy Family Study</td>
<td align="left" valign="top">Longitudinal</td>
<td align="left" valign="top">Frailty</td>
<td align="left" valign="top">713/4,083 (17.4%)</td>
<td align="left" valign="top">56 (Socio-demographic characteristics, Lifestyles, self-reported health and Objective examination)</td>
<td align="left" valign="top">Frailty Index</td>
</tr>
<tr>
<td align="left" valign="top">Heeeun Jung 2023 (<xref ref-type="bibr" rid="ref33">33</xref>)</td>
<td align="left" valign="top">Korea</td>
<td align="left" valign="top">Cross-sectional</td>
<td align="left" valign="top">Aged 70&#x2013;84</td>
<td align="left" valign="top">Korea frailty and aging cohort study</td>
<td align="left" valign="top">Baseline</td>
<td align="left" valign="top">Frailty</td>
<td align="left" valign="top">216/1,482 (25.0%)</td>
<td align="left" valign="top">32 (Socio-demographic domain, Physical domain, Biological domain, Lifestyle domain, Health condition domain, Medical domain, Psychological domain, Social domain)</td>
<td align="left" valign="top">Fried frailty Phenotype</td>
</tr>
<tr>
<td align="left" valign="top">Yin Yuan 2022 (<xref ref-type="bibr" rid="ref38">38</xref>)</td>
<td align="left" valign="top">China</td>
<td align="left" valign="top">Prospective cohort study</td>
<td align="left" valign="top">Aged &#x2265; 60&#x2009;years<break/>Mean age 72.5<break/>Female 60.0%</td>
<td align="left" valign="top">The residents from community and nursing homes in Fujian Province</td>
<td align="left" valign="top">Longitudinal</td>
<td align="left" valign="top">Frailty</td>
<td align="left" valign="top">711/1,981 (35.8%)</td>
<td align="left" valign="top">32 (Demographic characteristic, Lifestyle factors, Physical function, Psychophysiological, Social support, Social environment, Physical examination, Laboratory indicators)</td>
<td align="left" valign="top">Fried frailty Phenotype</td>
</tr>
<tr>
<td align="left" valign="top">Yongfei Dong 2025 (<xref ref-type="bibr" rid="ref30">30</xref>)</td>
<td align="left" valign="top">China</td>
<td align="left" valign="top">Prospective cohort</td>
<td align="left" valign="top">Aged &#x2265;65&#x2009;years</td>
<td align="left" valign="top">Chinese Longitudinal Healthy Longevity Survey</td>
<td align="left" valign="top">Longitudinal</td>
<td align="left" valign="top">Frailty</td>
<td align="left" valign="top">Training:<break/>1,493/4,878 (30.6%)<break/>External Validation 1:<break/>968/3,840 (25.2%)<break/>External Validation 2:<break/>1,531/5,822 (26.3%)</td>
<td align="left" valign="top">22 (Socio-demographic, Socio behavioral, Medical measures factors)</td>
<td align="left" valign="top">Frailty Index</td>
</tr>
<tr>
<td align="left" valign="top">Lin Qi 2025 (<xref ref-type="bibr" rid="ref35">35</xref>)</td>
<td align="left" valign="top">China</td>
<td align="left" valign="top">Cross-sectional</td>
<td align="left" valign="top">Aged &#x2265;60&#x2009;years<break/>Female 52.5%</td>
<td align="left" valign="top">Communities in eastern China</td>
<td align="left" valign="top">Baseline</td>
<td align="left" valign="top">Frailty</td>
<td align="left" valign="top">818/1,263 (64.7%)</td>
<td align="left" valign="top">17 (Demographic characteristic, Frailty indicators)</td>
<td align="left" valign="top">Tilburg Frailty Indicator</td>
</tr>
<tr>
<td align="left" valign="top">Wei Zhang 2024 (<xref ref-type="bibr" rid="ref39">39</xref>)</td>
<td align="left" valign="top">China</td>
<td align="left" valign="top">Prospective cohort</td>
<td align="left" valign="top">Aged &#x2265;65&#x2009;years</td>
<td align="left" valign="top">Chinese Longitudinal Healthy Longevity Survey</td>
<td align="left" valign="top">Longitudinal</td>
<td align="left" valign="top">Frailty</td>
<td align="left" valign="top">912/6,997 (13.0%)</td>
<td align="left" valign="top">46 (Demographic data, Health-related risk factors, Risk factors for chronic diseases)</td>
<td align="left" valign="top">SOF index</td>
</tr>
<tr>
<td align="left" valign="top">Li Huang 2024 (<xref ref-type="bibr" rid="ref32">32</xref>)</td>
<td align="left" valign="top">China</td>
<td align="left" valign="top">Prospective cohort</td>
<td align="left" valign="top">Aged &#x2265;65&#x2009;years<break/>Mean age 85.3/85.3/89.5<break/>Female 54.1%/54.8%/49.6%</td>
<td align="left" valign="top">Chinese Longitudinal Healthy Longevity Survey</td>
<td align="left" valign="top">Baseline</td>
<td align="left" valign="top">Frailty</td>
<td align="left" valign="top">4,883/14,925 (29.3%)</td>
<td align="left" valign="top">54 (Demographic characteristics)</td>
<td align="left" valign="top">Frailty Index</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec12">
<label>3.3</label>
<title>Characteristics of the model development</title>
<p><xref ref-type="table" rid="tab3">Table 3</xref> summarizes detailed information on model development characteristics. In terms of variable treatment, four studies converted continuous variables to categorical variables (<xref ref-type="bibr" rid="ref32">32</xref>, <xref ref-type="bibr" rid="ref35">35</xref>, <xref ref-type="bibr" rid="ref37">37</xref>, <xref ref-type="bibr" rid="ref38">38</xref>). In terms of missing data treatment, four studies used multiple imputation (<xref ref-type="bibr" rid="ref31">31</xref>, <xref ref-type="bibr" rid="ref34">34</xref>, <xref ref-type="bibr" rid="ref37">37</xref>, <xref ref-type="bibr" rid="ref39">39</xref>), two studies excluded missing data (<xref ref-type="bibr" rid="ref33">33</xref>, <xref ref-type="bibr" rid="ref35">35</xref>), three studies did not report information about missing data (<xref ref-type="bibr" rid="ref30">30</xref>, <xref ref-type="bibr" rid="ref32">32</xref>, <xref ref-type="bibr" rid="ref38">38</xref>), and one study used the miss Forest method for missing data (<xref ref-type="bibr" rid="ref36">36</xref>). Among the methods for predictor screening, commonly used approaches include Lasso regression (<xref ref-type="bibr" rid="ref37">37</xref>, <xref ref-type="bibr" rid="ref38">38</xref>), random forest method (<xref ref-type="bibr" rid="ref33">33</xref>, <xref ref-type="bibr" rid="ref36">36</xref>), and univariable analysis (<xref ref-type="bibr" rid="ref31">31</xref>, <xref ref-type="bibr" rid="ref35">35</xref>). The number of predictors included in the final model ranged from 5 to 16, covering a total of 61 predictors. The most common predictor was age (<italic>n</italic> =&#x2009;8), followed by cognitive function (<italic>n</italic> =&#x2009;5) and depression (<italic>n</italic> =&#x2009;3).</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Overview of the information of the included prediction models.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Author (year)</th>
<th align="left" valign="top">Missing data handling</th>
<th align="left" valign="top">Continuous variable processing method</th>
<th align="left" valign="top">Variable selection</th>
<th align="left" valign="top">Model development method</th>
<th align="left" valign="top">Validation method</th>
<th align="left" valign="top">Calibration method</th>
<th align="left" valign="top">Model performance (AUC)</th>
<th align="left" valign="top">Final predictors</th>
<th align="left" valign="top">Model presentation</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Mengjiao Yang 2024 (<xref ref-type="bibr" rid="ref37">37</xref>)</td>
<td align="left" valign="top">Multiple imputation</td>
<td align="left" valign="top">Categorical variable</td>
<td align="left" valign="top">LASSO regression</td>
<td align="left" valign="top">Bayesian networks</td>
<td align="left" valign="top">Internal validation (tenfold cross-validation)</td>
<td align="left" valign="top">B: Hosmer-Lemeshow <italic>p</italic>&#x2009;=&#x2009;0.395</td>
<td align="left" valign="top">B:<break/>Cross-section:<break/>0.943 (0.913, 0.974)<break/>Longitudinal:<break/>0.722 (0.656, 0.788)</td>
<td align="left" valign="top">7:&#x2265;75&#x2009;years<break/>Having physical dysfunction<break/>Polypharmacy<break/>Dementia<break/>Musculoskeletal disorders<break/>Depression<break/>Social relationships</td>
<td align="left" valign="top">Graphical score char</td>
</tr>
<tr>
<td align="left" valign="top">Qinqin Liu 2023 (<xref ref-type="bibr" rid="ref34">34</xref>)</td>
<td align="left" valign="top">Multiple imputations</td>
<td align="left" valign="top">Continuous variable</td>
<td align="left" valign="top">LASSO regression and Expert opinion</td>
<td align="left" valign="top">LR<break/>SVM<break/>RF<break/>XGBoost</td>
<td align="left" valign="top">Internal validation (random split) and External validation</td>
<td align="left" valign="top">Hosmer-Lemeshow test<break/>LR: 0.614/0.919/0.008<break/>SVM: 0.134/0.138/0.039<break/>RF: &#x003C;0.001/0.249/0.107<break/>XGBoost: 0.600/0.120/&#x003C;0.001<break/>Brier score:<break/>LR: 0.207/0.206/0.214<break/>SVM: 0.209/0.207/0.217<break/>RF: 0.193/0.205/0.213<break/>XGBoost: 0.200/0.200/0.216</td>
<td align="left" valign="top">A:<break/>LR: 0.669 (0.645, 0.692)<break/>SVM: 0.665 (0.641, 0.688)<break/>RF: 0.748 (0.727, 0.769)<break/>XGBoost: 0.700 (0.628, 0.723)<break/>B:<break/>LR: 0.676 (0.628, 0.723)<break/>SVM: 0.676 (0.629, 0.722)<break/>RF: 0.687 (0.641, 0.733)<break/>XGBoost: 0.701 (0.655, 0.746)<break/>C:<break/>LR: 0.614 (0.586, 0.642)<break/>SVM: 0.611 (0.583, 0.640)<break/>RF: 0.621 (0.584, 0.640)<break/>XGBoost: 0.612 (0.584, 0.640)</td>
<td align="left" valign="top">14: Waist circumference<break/>Age<break/>Cognitive function<break/>SRH<break/>Material health<break/>Medical insurance<break/>Current residence location<break/>Pension insurance<break/>Housing tenure<break/>Afternoon napping,<break/>Eating habit<break/>Depression<break/>Hearing impairment<break/>Lung diseases</td>
<td align="left" valign="top">Online clinical support, Nomogram</td>
</tr>
<tr>
<td align="left" valign="top">Shaoyi Fan 2023 (<xref ref-type="bibr" rid="ref31">31</xref>)</td>
<td align="left" valign="top">Multiple imputations</td>
<td align="left" valign="top">Continuous variable</td>
<td align="left" valign="top">Univariable analysis</td>
<td align="left" valign="top">RF<break/>DT<break/>NN<break/>SGD<break/>NB</td>
<td align="left" valign="top">Internal validation<break/>(random split)</td>
<td align="left" valign="top">&#x2013;</td>
<td align="left" valign="top">B:<break/>RF: 0.926<break/>DT: 0.850<break/>NN: 0.761<break/>SGD: 0.834<break/>NB: 0.761</td>
<td align="left" valign="top">5: Large-step walking speed<break/>Average step size<break/>Age<break/>Total step walking distance<break/>MMSE</td>
<td align="left" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">Yafei Wu 2022 (<xref ref-type="bibr" rid="ref36">36</xref>)</td>
<td align="left" valign="top">Miss Forest</td>
<td align="left" valign="top">Continuous variable</td>
<td align="left" valign="top">Recursive feature elimination (RFE) and 10-fold cross-validation based on random forest</td>
<td align="left" valign="top">NB<break/>LR<break/>DT<break/>SVM<break/>ANN,<break/>RF<break/>XGB</td>
<td align="left" valign="top">Bootstrap internal validation</td>
<td align="left" valign="top">B:<break/>Brier score:<break/>LR: 0.205<break/>NB: 0.161<break/>DT: 0.208<break/>SVM: 0.181<break/>RF: 0.143<break/>XGB: 0.134<break/>ANN: 0.193</td>
<td align="left" valign="top">B:<break/>LR: 0.728 (0.687, 0.769)<break/>NB: 0.722 (0.687, 0.769)<break/>DT: 0.612 (0.580, 0.643)<break/>SVM: 0.661 (0.619, 0.703)<break/>RF: 0.702 (0.659, 0.745)<break/>XGB: 0.677 (0.659, 0.745)<break/>ANN: 0.640 (0.595, 0.685)</td>
<td align="left" valign="top">11: Marital status<break/>ADL; IADL; MMSE<break/>Hypertension<break/>Childhood starvation<break/>Heart disease<break/>Weight<break/>Stroke<break/>Cerebrovascular disease<break/>Medical costs payer</td>
<td align="left" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">Heeeun Jung 2023 (<xref ref-type="bibr" rid="ref33">33</xref>)</td>
<td align="left" valign="top">Remove</td>
<td align="left" valign="top">Continuous variable</td>
<td align="left" valign="top">Random forest model analysis</td>
<td align="left" valign="top">LR<break/>KNN<break/>SVM<break/>Gaussian NB<break/>RF</td>
<td align="left" valign="top">Internal validation (random split)</td>
<td align="left" valign="top">&#x2013;</td>
<td align="left" valign="top">F1score:<break/>LR: 0.920<break/>KNN: 0.820<break/>SVM: 0.870<break/>Gaussian NB: 0.880<break/>RF: 0.910</td>
<td align="left" valign="top">16: Age<break/>Low education level<break/>Residence<break/>Low calf circumference<break/>TUG duration<break/>SPPB; Hs-CRP; eGFR<break/>Serum creatinine<break/>Triglyceride<break/>RBC<break/>25-hydroxy vitamin D<break/>Number of medications<break/>Risk of malnutrition<break/>EQ-5D index<break/>Depressive symptoms</td>
<td align="left" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">Yin Yuan 2022 (<xref ref-type="bibr" rid="ref38">38</xref>)</td>
<td align="left" valign="top">&#x2013;</td>
<td align="left" valign="top">Categorical Variable</td>
<td align="left" valign="top">LASSO regression</td>
<td align="left" valign="top">Bayesian networks</td>
<td align="left" valign="top">Internal validation (random split)</td>
<td align="left" valign="top">Calibration plots and Hosmer-Lemeshow (<italic>p</italic>&#x2009;=&#x2009;0.160/0.341)</td>
<td align="left" valign="top">B:<break/>0.701</td>
<td align="left" valign="top">6: Age<break/>Nutritional status<break/>IADL<break/>Balance capacity<break/>Social support</td>
<td align="left" valign="top">Graphical score char</td>
</tr>
<tr>
<td align="left" valign="top">Yongfei Dong 2025 (<xref ref-type="bibr" rid="ref30">30</xref>)</td>
<td align="left" valign="top">&#x2013;</td>
<td align="left" valign="top">Continuous variable</td>
<td align="left" valign="top">Stepwise-multivariate and Cox model</td>
<td align="left" valign="top">XG Boost<break/>GBM<break/>Cox Boost.</td>
<td align="left" valign="top">Bootstrap Internal validation and external validation</td>
<td align="left" valign="top">Brier score: &#x003C;0.25</td>
<td align="left" valign="top">B:<break/>XG Boost:<break/>0.830 (0.810, 0.840)<break/>GBM:<break/>0.820 (0.800, 0.830)<break/>CoxBoost:<break/>0.800 (0.780, 0.820)<break/>Cox model:<break/>0.800 (0.780, 0.820)<break/>C:<break/>XG Boost:<break/>0.850 (0.830, 0.870)<break/>GBM:<break/>0.850 (0.830, 0.870)<break/>CoxBoost.:<break/>0.850 (0.830, 0.870)<break/>Cox model:<break/>0.850 (0.830, 0.870)</td>
<td align="left" valign="top">9: Age<break/>BMI<break/>Cognitive function,<break/>Gender<break/>Ethnicity<break/>Education<break/>Natural teeth status<break/>Smoking status<break/>Occupation</td>
<td align="left" valign="top">Nomogram</td>
</tr>
<tr>
<td align="left" valign="top">Lin Qi 2025 (<xref ref-type="bibr" rid="ref35">35</xref>)</td>
<td align="left" valign="top">Remove</td>
<td align="left" valign="top">Categorical Variable</td>
<td align="left" valign="top">Univariable analysis</td>
<td align="left" valign="top">RF<break/>XG Boost<break/>DT</td>
<td align="left" valign="top">Internal validation (random split)</td>
<td align="left" valign="top">&#x2013;</td>
<td align="left" valign="top">A:<break/>RF: 0.990<break/>XGBoost: 0.810<break/>DT: 0.780<break/>B:<break/>RF: 0.750<break/>XGBoost: 0.720<break/>DT: 0.660</td>
<td align="left" valign="top">9: Age<break/>BMI<break/>Monthly income<break/>Living arrangement<break/>Visit frequency<break/>Pension insurance<break/>Smoking status<break/>Number of chronic diseases<break/>Type of medication</td>
<td align="left" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">Wei Zhang 2024 (<xref ref-type="bibr" rid="ref39">39</xref>)</td>
<td align="left" valign="top">Multiple imputation</td>
<td align="left" valign="top">Continuous variable</td>
<td align="left" valign="top">Stepwise regression</td>
<td align="left" valign="top">RF<break/>LR</td>
<td align="left" valign="top">Internal validation<break/>(random split)</td>
<td align="left" valign="top">&#x2013;</td>
<td align="left" valign="top">A:<break/>RF: 0.970<break/>LR: 0.780<break/>B:<break/>RF: 0.770<break/>LR: 0.760</td>
<td align="left" valign="top">10: Age<break/>Household status<break/>Marital status<break/>Self-reported health status<break/>MMSE<break/>Exercise<break/>ADL<break/>Sleep duration<break/>Hypertension<break/>Pulmonary disease</td>
<td align="left" valign="top">Nomogram</td>
</tr>
<tr>
<td align="left" valign="top">Li Huang 2024 (<xref ref-type="bibr" rid="ref32">32</xref>)</td>
<td align="left" valign="top">&#x2013;</td>
<td align="left" valign="top">Categorical Variable</td>
<td align="left" valign="top">Lasso regression and<break/>Boruta algorithm<break/>Random forest and classifier score</td>
<td align="left" valign="top">LR<break/>RF<break/>SVM<break/>XG Boost<break/>SHLNN</td>
<td align="left" valign="top">Internal validation (random split) and external validation</td>
<td align="left" valign="top">&#x2013;</td>
<td align="left" valign="top">B:<break/>LR: 0.974<break/>RF: 0.967<break/>SVM: 0.974<break/>XGBoost: 0.974<break/>SHLNN: 0.974 C:<break/>LR (2,011): 0.963 (0.946, 0.979)<break/>LR (2,014): 0.977 (0.968, 0.987)<break/>AUC (Women): 0.971<break/>AUC (Man): 0.975</td>
<td align="left" valign="top">10 key features:<break/>Able to go shopping by yourself?<break/>Able to walk one kilometer?<break/>Able to carry 5&#x2009;kg weight?<break/>Able to make food by yourself?<break/>Able to crouch and stand for three times?<break/>Able to wash clothes by yourself?<break/>Able to take public transport?<break/>Able to pick up a book from the floor?<break/>Able to stand up from sitting in a chair?<break/>Visual function</td>
<td align="left" valign="top">Website</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>&#x2013;, No information; A, Training set; B, Internal validation; C, External validation. RF, Random forest; LR, Logistic regression: SVM, Support vector machine; XGBoost, eXtreme Gradient Boosting; NN, Neural network; SGD, Stochastic gradient descent; NB, Na&#x00EF;ve Bayes; ANN, Artificial neural network; KNN, K-nearest neighbors; Gaussian NB, Gaussian Na&#x00EF;ve Bayes; GBM, Gradient Boosting Machine; SHLNN, Single-hidden-layer Neural Net; DT, Decision tree; MMSE, Mini Mental State Examination score; IADL, Instrumental activities of daily living.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec13">
<label>3.4</label>
<title>Characteristics of model validation</title>
<p>Internal validation was performed in all 10 included studies, with three studies performing both internal and external validation (<xref ref-type="bibr" rid="ref30">30</xref>, <xref ref-type="bibr" rid="ref32">32</xref>, <xref ref-type="bibr" rid="ref34">34</xref>) and two studies performing two external validations. The methods used in internal validation were random split (<italic>n</italic> =&#x2009;7), bootstrap (<italic>n</italic> =&#x2009;2), and 10-Fold Cross-Validation (<italic>n</italic> =&#x2009;1). The three studies that conducted external validation used the time validation method. Specific information about modeling is shown in <xref ref-type="table" rid="tab3">Table 3</xref>.</p>
</sec>
<sec id="sec14">
<label>3.5</label>
<title>Performance of the models</title>
<p><xref ref-type="table" rid="tab3">Table 3</xref> summarizes detailed information on model performance. A total of 45 models were constructed using 16 methods across the 10 studies. The most used methods were Random Forest (RF, <italic>n</italic> = 8), Logistic Regression (LR, <italic>n</italic> = 7), Extreme Gradient Boosting (XGB, <italic>n</italic> = 7), and Support vector machine (<italic>n</italic> = 5). In the included studies, the performance of the models was assessed mainly through differentiation and calibration methods. Nine of the studies measured model discrimination by AUC, and one study did not report model discrimination and used the F1 score to measure model performance.</p>
<p>Five studies reported model calibration methods. In the model construction phase, two studies assessed calibration using the Brier score and their constructed models all scored &#x003C;0.25, and 2 studies assessed calibration using the Hosmer-Lemeshow (H-L) test, with the majority of the models demonstrating good calibration performance (<italic>p</italic>&#x2009;&#x003E;&#x2009;0.05). In internal validation, studies using the H-L test and Brier score also showed good calibration performance (<italic>p</italic>&#x2009;&#x003E;&#x2009;0.05, Brier score &#x003C; 0.25). In external validation, two studies assessed predictive model calibration using the Brier score (<italic>n</italic> = 2) and H-L test (<italic>n</italic> = 1), respectively.</p>
</sec>
<sec id="sec15">
<label>3.6</label>
<title>Form of model presentation</title>
<p>Six studies reported on the presentation form of the model. Of these, one study presented the model in Nomogram and Online clinical supports, and another presented it in Nomogram and Prognostic index, respectively. The models of the remaining four studies were presented as graphs (<italic>n</italic> = 2), websites (<italic>n</italic> = 1), and column line graphs (<italic>n</italic> = 1), respectively.</p>
</sec>
<sec id="sec16">
<label>3.7</label>
<title>Interpretability of predictive models</title>
<p>Among the 10 included studies, two employed the SHAP method to quantify feature contributions, two conducted interpretable model inference based on Bayesian networks, four presented primary predictors through feature importance ranking, one visualized predictor weights using a column chart, and one study utilized both feature importance ranking and column charts. To further summarize interpretive findings across models, we compiled the top five key predictors reported in the included studies. Results indicated that age (<italic>n</italic> =&#x2009;7), cognitive function (<italic>n</italic> =&#x2009;5), and ADL (<italic>n</italic> =&#x2009;3) were the most frequently occurring predictors. <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 3</xref> summarizes the interpretability analysis methods used in the study and the top five key predictors identified by each method.</p>
</sec>
<sec id="sec17">
<label>3.8</label>
<title>Evaluation of the quality of the literature</title>
<p>Two personnel used the PROBAST+AI assessment tool to evaluate the quality and applicability of the model development process and the risk of bias and applicability of the model performance assessment. After careful evaluation, in the model development and assessment section, seven studies had low-quality issues and high risk of bias concerns (<xref ref-type="bibr" rid="ref31">31</xref>, <xref ref-type="bibr" rid="ref33">33</xref>, <xref ref-type="bibr" rid="ref34">34</xref>, <xref ref-type="bibr" rid="ref36">36</xref>&#x2013;<xref ref-type="bibr" rid="ref39">39</xref>) and the quality of the remaining three studies was rated as unclear (<xref ref-type="bibr" rid="ref30">30</xref>, <xref ref-type="bibr" rid="ref32">32</xref>, <xref ref-type="bibr" rid="ref34">34</xref>). The results of applicability in the model development and assessment sections were the same, with low applicability of models in four studies (<xref ref-type="bibr" rid="ref31">31</xref>, <xref ref-type="bibr" rid="ref33">33</xref>&#x2013;<xref ref-type="bibr" rid="ref35">35</xref>), high applicability of models in five studies (<xref ref-type="bibr" rid="ref30">30</xref>, <xref ref-type="bibr" rid="ref32">32</xref>, <xref ref-type="bibr" rid="ref37">37</xref>&#x2013;<xref ref-type="bibr" rid="ref39">39</xref>), and unclear applicability of models in one study (<xref ref-type="bibr" rid="ref36">36</xref>). The final results of bias and applicability of the included models are shown in <xref ref-type="table" rid="tab4">Table 4</xref>. Bar charts showing the PROBAST+AI quality and risk of bias assessment results included in the study are presented in <xref ref-type="fig" rid="fig2">Figures 2</xref>, <xref ref-type="fig" rid="fig3">3</xref>.</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Assess the overall concerns regarding quality, risk of bias and applicability of the prediction model.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Study</th>
<th align="center" valign="top" colspan="2">Model development</th>
<th align="center" valign="top" colspan="2">Model evaluation</th>
</tr>
<tr>
<th align="center" valign="top">Quality</th>
<th align="center" valign="top">Application</th>
<th align="center" valign="top">Risk of bias</th>
<th align="center" valign="top">Application</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Mengjiao Yang 2024 (<xref ref-type="bibr" rid="ref37">37</xref>)</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">&#x2212;</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">&#x2212;</td>
</tr>
<tr>
<td align="left" valign="top">Qinqin Liu 2023 (<xref ref-type="bibr" rid="ref34">34</xref>)</td>
<td align="center" valign="top">?</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">?</td>
<td align="center" valign="top">+</td>
</tr>
<tr>
<td align="left" valign="top">Shaoyi Fan 2023 (<xref ref-type="bibr" rid="ref31">31</xref>)</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">+</td>
</tr>
<tr>
<td align="left" valign="top">Yafei Wu 2022 (<xref ref-type="bibr" rid="ref36">36</xref>)</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">?</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">?</td>
</tr>
<tr>
<td align="left" valign="top">Heeeun Jung 2023 (<xref ref-type="bibr" rid="ref33">33</xref>)</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">+</td>
</tr>
<tr>
<td align="left" valign="top">Yin Yuan 2022 (<xref ref-type="bibr" rid="ref38">38</xref>)</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">&#x2212;</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">&#x2212;</td>
</tr>
<tr>
<td align="left" valign="top">Yongfei Dong 2025 (<xref ref-type="bibr" rid="ref30">30</xref>)</td>
<td align="center" valign="top">?</td>
<td align="center" valign="top">&#x2212;</td>
<td align="center" valign="top">?</td>
<td align="center" valign="top">&#x2212;</td>
</tr>
<tr>
<td align="left" valign="top">Lin Qi 2025 (<xref ref-type="bibr" rid="ref35">35</xref>)</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">+</td>
</tr>
<tr>
<td align="left" valign="top">Wei Zhang 2024 (<xref ref-type="bibr" rid="ref39">39</xref>)</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">&#x2212;</td>
<td align="center" valign="top">+</td>
<td align="center" valign="top">&#x2212;</td>
</tr>
<tr>
<td align="left" valign="top">Li Huang 2024 (<xref ref-type="bibr" rid="ref32">32</xref>)</td>
<td align="center" valign="top">?</td>
<td align="center" valign="top">&#x2212;</td>
<td align="center" valign="top">?</td>
<td align="center" valign="top">&#x2212;</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>&#x2212;, Low bias risk/high quality/high applicability; +, High bias risk/low quality/low applicability; ?, Unclear bias risk/unclear quality/unclear applicability.</p>
</table-wrap-foot>
</table-wrap>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Bar chart of PROBAST+AI quality assessment results included in the study.</p>
</caption>
<graphic xlink:href="fpubh-13-1667792-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Bar chart titled "Model development" showing five categories: Quality, Analysis, Outcome, Predictors, and Participants. Each bar is divided into blue (low), orange (high), and gray (unclear) segments. Participants have the highest proportion of high, while Analysis and Outcome have noticeable unclear segments. Quality and Predictors have substantial low segments.</alt-text>
</graphic>
</fig>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Bar chart of PROBAST+AI bias risk assessment results included in the study.</p>
</caption>
<graphic xlink:href="fpubh-13-1667792-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Bar chart titled "Model Evaluation" comparing five categories of bias: Risk of bias, Analysis, Outcome, Predictors, and Participants. Categories are rated as low (blue), high (orange), or unclear (gray). Predictors and Participants have larger low ratings, while Risk of bias and Analysis have larger high ratings. Outcome shows a mix of all ratings.</alt-text>
</graphic>
</fig>
<p>In the model development and assessment section, the reasons for being rated as low quality and high bias were mainly attributed to (1) retrospective cohort studies raising low-quality concerns and high risk of bias among participants and data sources; (2) not reporting whether the measurements of the predictors were affected by outcomes that had already occurred; (3) the number of events per variable (EVP) was less than 20; (4) categorization of the continuous predictors; (5) missing data were directly excluded or information on missing data was not reported; (6) there was no information on methods to address category imbalance; and (7) there may be concerns about data leakage. Detailed assessment information is provided in <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 4</xref>.</p>
</sec>
<sec id="sec18">
<label>3.9</label>
<title>Statistical analysis</title>
<p>A total of 45 models were developed in the 10 included studies: 36 models were developed for internal validation, and nine models were developed for external validation. Since only three studies performed external validation and one study evaluated the performance of the model with the F1 score, the meta-analysis only included data from the internal validation set of 9 studies. Because most of the included studies used multiple ML models, we first summarized the AUC for each study, as shown in <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 5</xref>. Given the variation in prediction time points across studies, we further conducted a stratified meta-analysis based on prediction windows (baseline prediction vs. longitudinal prediction). Results showed that the pooled AUC for baseline frailty prediction studies was 0.878 (95% CI 0.799, 0.958; <italic>I</italic><sup>2</sup> =&#x2009;94.9%; heterogeneity <italic>p</italic> &#x003C;&#x2009;0.001), while the pooled AUC for longitudinal frailty prediction studies was 0.730 (0.670, 0.790; <italic>I</italic><sup>2</sup> =&#x2009;96.6%; heterogeneity <italic>p</italic> &#x003C;&#x2009;0.001). The overall pooled AUC for all studies, regardless of prediction time point, was 0.786 (0.697, 0.875; <italic>I</italic><sup>2</sup> =&#x2009;99.4%; heterogeneity <italic>p</italic> &#x003C;&#x2009;0.001). These findings indicate that frailty prediction models based on baseline data demonstrate superior discriminatory performance, with a significantly higher pooled AUC compared to longitudinal prediction studies. The results of the meta-analysis are shown in <xref ref-type="fig" rid="fig4">Figure 4</xref>.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Random forest plot of area under the curve (AUC) values stratified by prediction window.</p>
</caption>
<graphic xlink:href="fpubh-13-1667792-g004.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Forest plot showing the Area Under the Curve (AUC) with 95% Confidence Intervals for various studies, categorized by cohort and cross-sectional studies. Each study is plotted with its respective AUC value, confidence interval, and percentage weight. Subgroup analysis shows significant heterogeneity with p-values below 0.001. Overall AUC is 0.786 with substantial heterogeneity indicated by I-squared values. The note highlights the use of a random-effects model.</alt-text>
</graphic>
</fig>
<p>Based on the different algorithms of model, we categorize them into traditional regression models (<italic>n</italic> = 4) as well as ML models (<italic>n</italic> = 28). Among them, the traditional regression models include LR, and the ML models include RF, SVM, XGB, etc. After summarizing the AUC of these models, we found that the combined AUC of the traditional regression model was 0.785 (95% CI 0.615, 0.955; <italic>I</italic><sup>2</sup> = 99.2%; heterogeneity <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001), and the combined AUC of the ML model was 0.784 (95% CI 0.747, 0.822; <italic>I</italic><sup>2</sup> = 99.1%; heterogeneity <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001). The results showed that the combined AUC values of the two models were similar. However, due to the smaller sample size of the traditional regression model, its CI was wider, suggesting higher uncertainty in the results. The results of the meta-analysis are shown in <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure 1</xref>.</p>
<p>To determine which ML model in the set of 9 internal validations had the better performance ability, we pooled and compared the AUCs of the models that were used three or more times. The results of the combined AUCs of the different ML models were as follows: 0.785 (95% CI 0.615, 0.955; <italic>I</italic><sup>2</sup> = 99.2%; heterogeneity <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001); SVM, 0.711 (95% CI 0.527, 1; <italic>I</italic><sup>2</sup> = 99.4%; heterogeneity <italic>p</italic> &#x003C; 0.001); DT, 0.696 (95% CI 0.591, 0.801; <italic>I</italic><sup>2</sup> = 90.2%; heterogeneity <italic>p</italic> &#x003C; 0.001); RF, 0.802 (95% CI 0.677, 0.927; <italic>I</italic><sup>2</sup> = 98.8%; heterogeneity <italic>p</italic> &#x003C; 0.001); XGB. 0.782 (95% CI 0.668, 0.896; <italic>I</italic><sup>2</sup> = 99.3%; heterogeneity <italic>p</italic> &#x003C; 0.001). Among these models, RF had the best performance, while DT had a lower performance. However, these differences were not statistically significant. The results of the meta-analysis are shown in <xref ref-type="fig" rid="fig5">Figure 5</xref>.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Random-effects forest plot of the area under the curve (AUC) values with 95% confidence intervals (CIs) for machine learning (ML) types.</p>
</caption>
<graphic xlink:href="fpubh-13-1667792-g005.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Forest plot depicting the Area Under the Curve (AUC) with 95% Confidence Intervals (CI) for different studies and machine learning models: LR, SVM, DT, RF, and XGB. Each study has associated weight percentages. Subgroup analysis includes heterogeneity indicators. Overall AUC is 0.776 (CI: 0.735, 0.818), with weights and heterogeneity tests sourced from the random-effects model.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec19">
<label>3.10</label>
<title>Sensitivity analysis</title>
<p>This study included a total of 9 research projects. Sensitivity analysis indicated that the pooled results demonstrated good robustness. Forest plot results showed that the point estimates for all individual studies, after exclusion, clustered closely around the overall pooled effect size (between 0.72 and 0.74), with high overlap in confidence intervals. The results of the sensitivity analysis are shown in <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure 2</xref>.</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec20">
<label>4</label>
<title>Discussion</title>
<p>This study reviewed machine-learning-based methods for constructing risk prediction models for the occurrence of frailty in community-dwelling older adults. The aim was to assess the quality of these studies and the performance of the machine learning predictive models to assist in the development of frailty screening tools and interventions for community-dwelling older adults.</p>
<sec id="sec21">
<label>4.1</label>
<title>Comparison of baseline prediction and longitudinal prediction</title>
<p>This study revealed through stratified meta-analysis that the performance of frailty prediction models based on baseline data (AUC&#x2009;=&#x2009;0.878; 95% CI 0.799, 0.958) exceeded that of longitudinal prediction models (AUC&#x2009;=&#x2009;0.730; 95% CI 0.670, 0.790). This performance difference stems not from inherent model superiority but from the fundamental distinction between the two predictive tasks.</p>
<p>In baseline prediction models, all predictors and frailty status are measured at the same point in time. While this feature helps the model identify individuals who are frail at baseline, it also leads to construct overlap between some predictors and the frailty phenotype itself, thereby introducing endogeneity issues (<xref ref-type="bibr" rid="ref22">22</xref>). When predictors conceptually overlap with frailty or exhibit reverse causality due to simultaneous measurement, non-independence between predictors and frailty outcomes may occur, leading to overestimation of model performance (<xref ref-type="bibr" rid="ref40">40</xref>). Consequently, baseline prediction models are better suited for screening and case identification, enabling the rapid detection of individuals who are currently in a frail state.</p>
<p>In contrast, the longitudinal prediction model seeks to forecast future events. During follow-up, subjects may experience competing risk events such as death, other illnesses, or lifestyle changes that influence frailty development. These events introduce random variability that is not accounted for by the model, objectively limiting its performance (<xref ref-type="bibr" rid="ref41">41</xref>). Consequently, longitudinal predictive models perform below baseline models; yet, their clinical value lies primarily in their risk assessment and primary prevention capabilities. However, longitudinal prediction allows tracking and evaluation over time, yielding more accurate assessments of a model&#x2019;s performance and effectiveness on a long-term timescale (<xref ref-type="bibr" rid="ref32">32</xref>, <xref ref-type="bibr" rid="ref42">42</xref>). This enables the identification of currently healthy individuals at high risk of developing frailty in the future, facilitating early interventions to prevent or delay the onset of frailty.</p>
<p>In summary, the two models address distinct clinical questions, and their performance differences stem not only from randomness in follow-up processes but also from underlying endogeneity mechanisms within the data structure. Therefore, a model&#x2019;s value should not be measured solely by AUC scores but interpreted based on its specific design objectives and application scenarios. Future research may utilize variables from non-frailty performance components as predictors, or consider methods such as mediation analysis and joint modeling to generate inputs with greater causal significance. This approach could reduce bias arising from endogeneity, thereby enhancing the conceptual rigor and technical validity of predictive models.</p>
</sec>
<sec id="sec22">
<label>4.2</label>
<title>Research on the application of machine learning for predicting frailty in community-dwelling older adults remains in its exploratory phase</title>
<p>Without distinguishing prediction time points, the pooled AUC across all studies was 0.786 (95% CI 0.697, 0.875). This suggests that machine learning shows promising performance in predicting frailty onset among community-dwelling older adults, although the pooled AUC exhibits substantial heterogeneity. PROBAST+AI results suggest that most current studies raise concerns about low quality and high risk of bias. These issues may lead to potential overestimation of model performance metrics in this meta-analysis, while reducing the robustness and generalizability of the findings. Therefore, future research requires further standardization and improvement in study populations, data sources, predictive factors, and data analysis methodologies.</p>
<sec id="sec23">
<label>4.2.1</label>
<title>Study population and data sources</title>
<p>In the included studies, most data originated from single-center databases with relatively limited sample sources, which may restrict the applicability of the model to other populations. In predictive modeling, prospective cohort studies are considered to be more advantageous due to their ability to provide the best measure of predictors and outcomes. In addition, the use of registered datasets as a source for modeling is thought to reduce bias (<xref ref-type="bibr" rid="ref22">22</xref>). In contrast, using existing data and retrospective studies to construct models is not only susceptible to confounding factors. However, it may also cause recall bias, information bias, and selection bias, thus affecting the application of models in practice (<xref ref-type="bibr" rid="ref43">43</xref>). In subsequent studies, it is recommended to prioritize multicenter, prospective samples for model development and validation to assess model performance across different settings and enhance model generalizability. When data originates from databases, details of data collection and measurement procedures should be reported. Additionally, researchers should clearly define the intended use of predictive models and establish appropriate inclusion and exclusion criteria.</p>
</sec>
<sec id="sec24">
<label>4.2.2</label>
<title>Differences in frailty assessment tools</title>
<p>Consistent with previous studies, the literature reviewed in this study revealed that the prevalence of frailty among the older adults in the community varied significantly (<xref ref-type="bibr" rid="ref44">44</xref>), ranging from 13.00 to 64.77%. This difference may be due to the use of different assessment tools. Currently, although a variety of frailty assessment tools have been developed both domestically and abroad, there is no unified standard (<xref ref-type="bibr" rid="ref45">45</xref>). Previous studies have shown that the reported prevalence of frailty is generally low due to the relatively strict criteria of tools such as SOF, FRAIL scale, Fried phenotype, and EFS; Scales such as CFS, VES-13, TFI, GFI, and FI tend to report a higher prevalence of frailty (<xref ref-type="bibr" rid="ref46">46</xref>, <xref ref-type="bibr" rid="ref47">47</xref>). In community settings, the FRAIL scale is considered the most effective screening tool for distinguishing between frail and non-frail individuals, particularly in larger populations (<xref ref-type="bibr" rid="ref48">48</xref>, <xref ref-type="bibr" rid="ref49">49</xref>). In this paper, a total of five frailty assessment tools is involved, although they are widely used in clinical research; however, the results may be inconsistent due to differences in assessment content.</p>
<p>Additionally, the definition of the debilitating outcome is a key factor influencing prevalence. Studies have shown that binary classifications that distinguish only between &#x201C;frailty&#x201D; and &#x201C;non-frailty&#x201D; tend to produce a higher prevalence of frailty than a trichotomy that includes &#x201C;pre-frailty&#x201D; states (<xref ref-type="bibr" rid="ref50">50</xref>). Of the included studies, only five used binary classification to define outcomes. Additionally, one study combined &#x2018;pre-frailty&#x2019; with &#x2018;frailty&#x2019; as a predictive outcome, both of which may have influenced the results. Therefore, when developing a risk prediction model for frailty in the future, researchers should adopt more accurate methods for assessing and classifying frailty.</p>
</sec>
<sec id="sec25">
<label>4.2.3</label>
<title>Data analysis</title>
<p>First, among the included studies, three were deemed to have insufficient sample size due to an EPV&#x2009;&#x003C;&#x2009;20. PROBAST+AI indicates that in predictive model development, an EPV&#x2009;&#x003C;&#x2009;20 may increase the risk of model overfitting, thereby leading to an overestimation of the predictive model&#x2019;s performance. Relevant studies have shown that when using machine learning methods to develop risk prediction models, a larger sample size is needed so that a small amount of overfitting can be achieved to ensure the stability of the developed model. When developing and validating predictive models, researchers are advised to calculate the required sample size based on the prevalence of the overall event, the number of candidate predictors, the model&#x2019;s anticipated overall performance, and the target maximum level of overfitting. This approach helps reduce model overfitting and enhances model robustness (<xref ref-type="bibr" rid="ref51">51</xref>). Second, the continuum predictors in the four studies were inappropriately converted to categorical variables, which may lead to missing information as well as spurious exchange effects that weaken the discriminatory power and calibration of the models (<xref ref-type="bibr" rid="ref52">52</xref>, <xref ref-type="bibr" rid="ref53">53</xref>). During the development of predictive models, unnecessary grouping of continuous variables should be avoided whenever possible. Continuous variables should be incorporated into the model in their original form or converted into ordinal variables with clearly defined classification criteria.</p>
<p>In terms of the treatment of missing data, seven studies reported methods for handling missing data, while two studies deleted missing data. But even a small amount of missing or deleted data may introduce selective bias, reduce the representativeness of the sample, and may affect the judgment of model validity (<xref ref-type="bibr" rid="ref54">54</xref>). PROBAST+AI noted that multiple interpolation was considered the preferred method of dealing with missing data, in addition to pattern-mixing models, proxy splitting, and other alternative strategies to avoid the need for interpolation, which can prevent biased results by dealing with missing data directly during the construction and validation of the predictive model (<xref ref-type="bibr" rid="ref55">55</xref>). In one study, miss Forest was employed to address missing data, and this method, although highly predictive, may yield severely biased regression coefficient estimates and downwardly biased confidence interval coverage (<xref ref-type="bibr" rid="ref56">56</xref>). Future researchers developing frailty prediction models should employ reasonable methods to handle missing data based on professional expertise, clearly reporting the proportion of missing data and the processing strategy to enhance model performance.</p>
<p>This study reveals that data leakage represents a prevalent yet underappreciated methodological flaw in this field, undermining the reliability of model performance evaluation. It frequently leads to overestimation of generalization capabilities, resulting in outcomes that cannot be accurately replicated in real-world scenarios (<xref ref-type="bibr" rid="ref57">57</xref>, <xref ref-type="bibr" rid="ref58">58</xref>). Applying SMOTE (Synthetic Minority Over-sampling Technique) to the entire dataset before splitting it into training and test sets will cause overlapping leakage, thereby distorting model evaluation metrics. Among the included studies, two explicitly reported applying SMOTE oversampling only within the training set, effectively avoiding this type of information leakage (<xref ref-type="bibr" rid="ref58">58</xref>). On the other hand, preprocessing operations (such as missing value imputation or feature selection) performed on the entire dataset before splitting it into training and test sets can introduce preprocessing leakage (<xref ref-type="bibr" rid="ref59">59</xref>). Specifically, while all six included studies reported handling missing data, they failed to clarify the sequence of randomization versus data processing or disclose the imputation strategy. This methodological ambiguity elevates the risk of preprocessing leakage in their analyses. Therefore, future studies should prioritize data workflow standardization by adhering to the &#x201C;split first, preprocess later&#x201D; principle. Detailed data processing steps must be clearly documented in publications, particularly the methods for isolating training and test sets. This approach effectively prevents data leakage, enhances model reproducibility, and improves generalization performance.</p>
<p>Calibration and discrimination are two key metrics for evaluating predictive model performance. In the included studies, most models employed AUC to assess model discrimination, yielding favorable performance results. However, even with good discrimination, estimated risks may remain unreliable (<xref ref-type="bibr" rid="ref60">60</xref>). Model calibration, which assesses the consistency between predicted risks and observed outcomes (<xref ref-type="bibr" rid="ref61">61</xref>), is crucial for the validity and safety of clinical prediction models (<xref ref-type="bibr" rid="ref62">62</xref>). Yet in practice, model calibration is often overlooked. Similarly, among the studies we included, only five reported model calibration. Furthermore, research suggests using decision curve analysis to evaluate model performance (e.g., net benefit). Decision curves comprehensively consider sensitivity, specificity, and the risk&#x2013;benefit balance at different thresholds, providing crucial evidence for assessing a model&#x2019;s value in real-world clinical settings (<xref ref-type="bibr" rid="ref63">63</xref>). However, even when a model demonstrates strong discriminatory performance, its net benefit may diminish due to poor calibration (<xref ref-type="bibr" rid="ref61">61</xref>). Therefore, future research should comprehensively evaluate model performance using multiple metrics&#x2014;including discriminatory ability, calibration, and net benefit&#x2014;to enhance reliability and practicality in real-world applications.</p>
<p>In predictive modeling research, external validation is often considered a critical step for predictive models to be applied in real-world practice. However, external validation using completely independent datasets is often overlooked (<xref ref-type="bibr" rid="ref64">64</xref>). Of the 10 studies we included, only 3 performed external validation, while the rest performed only internal validation. The lack of external validation may have implications for model generalizability and robustness assessment (<xref ref-type="bibr" rid="ref65">65</xref>). External validation, unlike model development, not only evaluates the model performance on a new dataset but also tests its adaptability to different environments or different datasets, thus demonstrating the generalizability and portability of the model (<xref ref-type="bibr" rid="ref20">20</xref>). In addition, external validation can reveal whether the models in the training set are overfitted or not, as well as selectivity bias in the internal validation set. Models performing well in internal validation but with significant performance degradation in external validation (&#x2018;performance decay&#x2019;) is a common phenomenon in predictive modeling studies (<xref ref-type="bibr" rid="ref66">66</xref>). Therefore, the direct application of unvalidated models to clinical practice or public health screening is hazardous. Future research can evaluate model performance across diverse geographic regions, social contexts, and healthcare systems through time-geographic validation and multi-center validation at the institutional level, thereby enhancing the model&#x2019;s fairness, generalizability, and external applicability. Furthermore, external validation of existing predictive models can reduce research waste and help bridge the gap between model development and implementation (<xref ref-type="bibr" rid="ref67">67</xref>).</p>
</sec>
</sec>
<sec id="sec26">
<label>4.3</label>
<title>Interpretability of predictive models and key predictors</title>
<p>The studies we included employed various methods to enhance interpretability. Feature importance, the most common approach, enables researchers to identify key predictors influencing the model rapidly (<xref ref-type="bibr" rid="ref68">68</xref>). However, it struggles to explain complex interactions between features, thereby limiting the depth of model interpretation and clinical applicability (<xref ref-type="bibr" rid="ref69">69</xref>, <xref ref-type="bibr" rid="ref70">70</xref>). In contrast, Bayesian networks, as inherently interpretable models, reveal conditional dependencies between variables. They can identify potential causal relationships based on conditional dependencies and independence among variables (<xref ref-type="bibr" rid="ref71">71</xref>). However, their construction accuracy relies on prior knowledge and data quality, which limits their practical application (<xref ref-type="bibr" rid="ref72">72</xref>). Furthermore, SHapley Additive exPlanations (SHAP) stands as one of the most widely adopted explainable AI methods today. Its strength lies in simultaneously providing global feature importance and locally revealing key features and logical relationships underlying prediction outcomes. By quantifying the contribution of each feature to specific predictions, SHAP enhances model transparency and clinical interpretability (<xref ref-type="bibr" rid="ref73">73</xref>, <xref ref-type="bibr" rid="ref74">74</xref>). Future research may develop multi-level interpretability frameworks that simultaneously report global feature importance and local prediction explanations. This approach could enhance model transparency and clinical applicability while maintaining predictive performance.</p>
<p>Based on the above analysis, we synthesized the interpretable findings from the included studies. The final results encompassed seven distinct categories of predictors: demographic data, socioeconomic factors, physical function and fitness indicators, cognitive and mental health, chronic diseases and medical conditions, nutritional and metabolic status, and social support. The heterogeneity of these predictors reflects that frailty arises from the combined effects of multiple influencing factors. Notably, across different explanatory methodologies, age, cognitive function, and activities of daily living (ADL) ability were the most frequently identified predictors. In most studies, age was recognized as a key predictor of frailty. Cognitive decline was also identified as a critical predictor of frailty progression. Research indicates a bidirectional relationship between cognitive impairment and physical functional decline, with both factors jointly accelerating the onset and progression of frailty (<xref ref-type="bibr" rid="ref75">75</xref>). Furthermore, the combination of cognitive impairment and frailty may increase the risk of adverse health outcomes in older adults. Additionally, ADL is closely associated with frailty development. Previous studies suggest that ADL decline not only represents a clinical manifestation of frailty but may also serve as a mediating factor in its progression (<xref ref-type="bibr" rid="ref5">5</xref>).</p>
</sec>
<sec id="sec27">
<label>4.4</label>
<title>Comparison of predictive performance between machine learning models and traditional regression models</title>
<p>Given that ML is more efficient in dealing with complex nonlinear relationships and can improve prediction accuracy, we compared the performance of the ML model with that of the traditional regression model. Our results showed that the combined AUC point estimates of the traditional regression model and the ML model were similar, 0.785 (95% CI 0.615, 0.955) and 0.784 (95% CI 0.747, 0.822), respectively. However, due to the lack of statistical efficacy of the traditional regression group, which contained only four models at the time of the analysis, it is not yet possible to conclude that there is no difference in the performance of the two types of methods. Such small subgroups cannot reliably support the &#x201C;no difference&#x201D; conclusion, and their wide confidence intervals may improve the truthfulness, ranging from significantly worse to better than the ML models (<xref ref-type="bibr" rid="ref76">76</xref>). Thus, the current results do not negate the theoretical advantages of ML in dealing with complex relationships. However, it suggests that logistic regression models are still competitive in specific scenarios due to their simplicity, stability, and ease of interpretation (<xref ref-type="bibr" rid="ref77">77</xref>). Future research should fairly compare the advantages and disadvantages of different algorithms on the same high-quality dataset while ensuring methodological rigor.</p>
</sec>
</sec>
<sec id="sec28">
<label>5</label>
<title>Future outlook</title>
<p>This study provides a systematic evaluation of machine learning models for predicting frailty in community-dwelling older adults, offering insights for the development of healthcare policy and clinical practice. In clinical settings, the key predictors identified through interpretability analysis provide evidence-based support for developing concise and efficient frailty screening tools, enabling primary care providers to identify high-risk individuals rapidly. Furthermore, machine learning&#x2019;s capability to handle complex nonlinear relationships among variables holds promise for future integration with primary healthcare management systems or electronic health records. This integration could enable the automated assessment of frailty risk and the development of early warning systems, thereby supporting the creation of personalized intervention plans tailored to individual needs.</p>
<p>However, the field currently faces challenges, including limited sample sizes, inadequate data processing methods, and insufficient external validation, which constrain model performance and clinical translation potential. To propel further research development, we recommend strengthening future studies in the following areas: (1) In terms of study design, encourage the conduct of multicenter prospective cohort studies to enhance data representativeness and model robustness; (2) Regarding data processing, it is recommended to adopt the TRIPOD+AI standard to enhance the transparency of methodology reporting, thereby ensuring the scientific rigor of model construction and the credibility of results.; (3) For predictors, clearly report their definitions, evaluation methods, and inclusion criteria to avoid spurious associations caused by ambiguous or non-standard variables; (4) For model validation, place greater emphasis on external validation by testing model performance on independent cohorts to enhance generalization and clinical applicability; (5) Regarding clinical translation, future studies should evaluate models&#x2019; practical clinical impact through prospective studies and randomized controlled trials, advancing their algorithms toward truly usable clinical tools.</p>
</sec>
<sec id="sec29">
<label>6</label>
<title>Strengths and limitations</title>
<p>In this review, we conducted a systematic review and meta-analysis of machine learning methods to develop a predictive model of frailty risk in older adults in the community. In order to provide guidance for the development and update of subsequent models, and to help the application of such models in clinical practice. However, there were the following limitations in this study: (1) insufficient external validation: most of the included studies lacked external validation, so we were unable to perform meta-analysis of the pooled AUC of the model on the external validation set, which may affect the applicability and generalization of the model; (2) heterogeneity of assessment methods: the included studies had differences in the selection and measurement of frailty assessment methods and their predictors, which may introduce potential bias in the results of meta-analysis; (3) Heterogeneity between studies: Meta-analyses showed that there was in-house heterogeneity between studies, which may include differences between participants and study designs, predictor sets, and data analysis methods.</p>
</sec>
<sec sec-type="conclusions" id="sec30">
<label>7</label>
<title>Conclusion</title>
<p>This study included a total of 10 original studies, with meta-analyses conducted on the internal validation sets of 9 studies. Among these, the pooled AUC for baseline frailty prediction studies was 0.878 (95% CI 0.799, 0.958), while the pooled AUC for longitudinal frailty prediction studies was 0.730 (95% CI 0.670, 0.790). When all studies were pooled without distinguishing prediction time points, the overall pooled AUC was 0.786 (95% CI 0.697, 0.875). This indicates that current machine learning-based predictive models for frailty onset in community-dwelling older adults demonstrate satisfactory performance. However, the 10 included studies were rated as low quality in model construction, high risk of bias in model validation, and lack of external validation for most of the models due to a lack of sufficient rigor in the model development process. Future studies should validate them through large-scale, multicenter prospective cohort studies with external validation to enhance the applicability of the models. Also, future studies should strictly adhere to the TRIPOD+AI reporting specifications and PROBAST+AI design specifications. This includes but is not limited to, detailed reporting of data sources, predictor definitions and measurements, missing data handling processes, sample size justification, category imbalance handling methods, strict data leakage prevention measures (explicit preprocessing after training&#x2013;testing split), model tuning details, multiple performance metrics (discriminatory, calibration, and clinical utility), details of internal validation methodology, and conducting and reporting on independent external validation. Complete and transparent reporting and rigorous methodological design are cornerstones for improving study quality, reducing the risk of bias, and enhancing confidence and reproducibility of results.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec31">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref rid="SM1" ref-type="supplementary-material">Supplementary material</xref>, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="sec32">
<title>Author contributions</title>
<p>YO: Conceptualization, Formal analysis, Writing &#x2013; original draft. DJ: Conceptualization, Formal analysis, Writing &#x2013; original draft. PL: Investigation, Validation, Writing &#x2013; original draft. WZ: Data curation, Investigation, Writing &#x2013; original draft. YZ: Investigation, Validation, Writing &#x2013; original draft. YC: Funding acquisition, Supervision, Writing &#x2013; review &#x0026; editing. XY: Funding acquisition, Supervision, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="COI-statement" id="sec33">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec34">
<title>Generative AI statement</title>
<p>The authors declare that no Gen AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec35">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec36">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fpubh.2025.1667792/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fpubh.2025.1667792/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><label>1.</label><mixed-citation publication-type="other"><person-group person-group-type="author"><collab id="coll1">World Population Prospects</collab></person-group> (<year>2022</year>). Available online at: <ext-link xlink:href="https://www.un.org/development/desa/pd/content/World-Population-Prospects-2022" ext-link-type="uri">https://www.un.org/development/desa/pd/content/World-Population-Prospects-2022</ext-link> (Accessed June 12, 2025).</mixed-citation></ref>
<ref id="ref2"><label>2.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Clegg</surname><given-names>A</given-names></name> <name><surname>Young</surname><given-names>J</given-names></name> <name><surname>Iliffe</surname><given-names>S</given-names></name> <name><surname>Rikkert</surname><given-names>MO</given-names></name> <name><surname>Rockwood</surname><given-names>K</given-names></name></person-group>. <article-title>Frailty in elderly people</article-title>. <source>Lancet</source>. (<year>2013</year>) <volume>381</volume>:<fpage>752</fpage>&#x2013;<lpage>62</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(12)62167-9</pub-id>, <pub-id pub-id-type="pmid">23395245</pub-id></mixed-citation></ref>
<ref id="ref3"><label>3.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ofori-Asenso</surname><given-names>R</given-names></name> <name><surname>Chin</surname><given-names>KL</given-names></name> <name><surname>Mazidi</surname><given-names>M</given-names></name> <name><surname>Zomer</surname><given-names>E</given-names></name> <name><surname>Ilomaki</surname><given-names>J</given-names></name> <name><surname>Zullo</surname><given-names>AR</given-names></name> <etal/></person-group>. <article-title>Global incidence of frailty and prefrailty among community-dwelling older adults</article-title>. <source>JAMA Netw Open</source>. (<year>2019</year>) <volume>2</volume>:<fpage>e198398</fpage>. doi: <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2019.8398</pub-id>, <pub-id pub-id-type="pmid">31373653</pub-id></mixed-citation></ref>
<ref id="ref4"><label>4.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hoogendijk</surname><given-names>EO</given-names></name> <name><surname>Afilalo</surname><given-names>J</given-names></name> <name><surname>Ensrud</surname><given-names>KE</given-names></name> <name><surname>Kowal</surname><given-names>P</given-names></name> <name><surname>Onder</surname><given-names>G</given-names></name> <name><surname>Fried</surname><given-names>LP</given-names></name></person-group>. <article-title>Frailty: implications for clinical practice and public health</article-title>. <source>Lancet</source>. (<year>2019</year>) <volume>394</volume>:<fpage>1365</fpage>&#x2013;<lpage>75</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(19)31786-6</pub-id>, <pub-id pub-id-type="pmid">31609228</pub-id></mixed-citation></ref>
<ref id="ref5"><label>5.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ji</surname><given-names>D</given-names></name> <name><surname>Guo</surname><given-names>H</given-names></name> <name><surname>Qiu</surname><given-names>S</given-names></name> <name><surname>Dong</surname><given-names>L</given-names></name> <name><surname>Shen</surname><given-names>Y</given-names></name> <name><surname>Shen</surname><given-names>Z</given-names></name> <etal/></person-group>. <article-title>Screening for frailty and its association with activities of daily living, cognitive impairment, and falls among community-dwelling older adults in China</article-title>. <source>BMC Geriatr</source>. (<year>2024</year>) <volume>24</volume>:<fpage>576</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12877-024-05173-0</pub-id></mixed-citation></ref>
<ref id="ref6"><label>6.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>S&#x00E1;nchez-Garc&#x00ED;a</surname><given-names>S</given-names></name> <name><surname>Garc&#x00ED;a-Pe&#x00F1;a</surname><given-names>C</given-names></name> <name><surname>Salv&#x00E0;</surname><given-names>A</given-names></name> <name><surname>S&#x00E1;nchez-Arenas</surname><given-names>R</given-names></name> <name><surname>Granados-Garc&#x00ED;a</surname><given-names>V</given-names></name> <name><surname>Cuadros-Moreno</surname><given-names>J</given-names></name> <etal/></person-group>. <article-title>Frailty in community-dwelling older adults: association with adverse outcomes</article-title>. <source>Clin Interv Aging</source>. (<year>2017</year>) <volume>12</volume>:<fpage>1003</fpage>&#x2013;<lpage>11</lpage>. doi: <pub-id pub-id-type="doi">10.2147/CIA.S139860</pub-id></mixed-citation></ref>
<ref id="ref7"><label>7.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>&#x00C1;lvarez-Bustos</surname><given-names>A</given-names></name> <name><surname>Carnicero-Carre&#x00F1;o</surname><given-names>JA</given-names></name> <name><surname>Sanchez-Sanchez</surname><given-names>JL</given-names></name> <name><surname>Garcia-Garcia</surname><given-names>FJ</given-names></name> <name><surname>Alonso-Bouz&#x00F3;n</surname><given-names>C</given-names></name> <name><surname>Rodr&#x00ED;guez-Ma&#x00F1;as</surname><given-names>L</given-names></name></person-group>. <article-title>Associations between frailty trajectories and frailty status and adverse outcomes in community-dwelling older adults</article-title>. <source>J Cachexia Sarcopenia Muscle</source>. (<year>2022</year>) <volume>13</volume>:<fpage>230</fpage>&#x2013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.1002/jcsm.12888</pub-id>, <pub-id pub-id-type="pmid">34951157</pub-id></mixed-citation></ref>
<ref id="ref8"><label>8.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ni Lochlainn</surname><given-names>M</given-names></name> <name><surname>Cox</surname><given-names>NJ</given-names></name> <name><surname>Wilson</surname><given-names>T</given-names></name> <name><surname>Hayhoe</surname><given-names>RPG</given-names></name> <name><surname>Ramsay</surname><given-names>SE</given-names></name> <name><surname>Granic</surname><given-names>A</given-names></name> <etal/></person-group>. <article-title>Nutrition and frailty: opportunities for prevention and treatment</article-title>. <source>Nutrients</source>. (<year>2021</year>) <volume>13</volume>:<fpage>2349</fpage>. doi: <pub-id pub-id-type="doi">10.3390/nu13072349</pub-id>, <pub-id pub-id-type="pmid">34371858</pub-id></mixed-citation></ref>
<ref id="ref9"><label>9.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Briggs</surname><given-names>R</given-names></name> <name><surname>McDonough</surname><given-names>A</given-names></name> <name><surname>Ellis</surname><given-names>G</given-names></name> <name><surname>Bennett</surname><given-names>K</given-names></name> <name><surname>O&#x2019;Neill</surname><given-names>D</given-names></name> <name><surname>Robinson</surname><given-names>D</given-names></name></person-group>. <article-title>Comprehensive geriatric assessment for community-dwelling, high-risk, frail, older people</article-title>. <source>Cochrane Database Syst Rev</source>. (<year>2022</year>) <volume>2022</volume>:<fpage>CD012705</fpage>. doi: <pub-id pub-id-type="doi">10.1002/14651858.CD012705.pub2</pub-id>, <pub-id pub-id-type="pmid">35521829</pub-id></mixed-citation></ref>
<ref id="ref10"><label>10.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ruiz</surname><given-names>JG</given-names></name> <name><surname>Dent</surname><given-names>E</given-names></name> <name><surname>Morley</surname><given-names>JE</given-names></name> <name><surname>Merchant</surname><given-names>RA</given-names></name> <name><surname>Beilby</surname><given-names>J</given-names></name> <name><surname>Beard</surname><given-names>J</given-names></name> <etal/></person-group>. <article-title>Screening for and managing the person with frailty in primary care: ICFSR consensus guidelines</article-title>. <source>J Nutr Health Aging</source>. (<year>2020</year>) <volume>24</volume>:<fpage>920</fpage>&#x2013;<lpage>7</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s12603-020-1498-x</pub-id>, <pub-id pub-id-type="pmid">33155616</pub-id></mixed-citation></ref>
<ref id="ref11"><label>11.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Polidori</surname><given-names>MC</given-names></name></person-group>. <article-title>Preventing frailty and maintaining good health during aging</article-title>. <source>Inn Med Heidelb Ger</source>. (<year>2025</year>) <volume>66</volume>:<fpage>1039</fpage>&#x2013;<lpage>46</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00108-025-01982-6</pub-id>, <pub-id pub-id-type="pmid">40864248</pub-id></mixed-citation></ref>
<ref id="ref12"><label>12.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lai</surname><given-names>J</given-names></name> <name><surname>Cheng</surname><given-names>C</given-names></name> <name><surname>Liang</surname><given-names>T</given-names></name> <name><surname>Tang</surname><given-names>L</given-names></name> <name><surname>Guo</surname><given-names>X</given-names></name> <name><surname>Liu</surname><given-names>X</given-names></name></person-group>. <article-title>Development and multi-cohort validation of a machine learning-based simplified frailty assessment tool for clinical risk prediction</article-title>. <source>J Transl Med</source>. (<year>2025</year>) <volume>23</volume>:<fpage>921</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12967-025-06728-4</pub-id></mixed-citation></ref>
<ref id="ref13"><label>13.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dent</surname><given-names>E</given-names></name> <name><surname>Lien</surname><given-names>C</given-names></name> <name><surname>Lim</surname><given-names>WS</given-names></name> <name><surname>Wong</surname><given-names>WC</given-names></name> <name><surname>Wong</surname><given-names>CH</given-names></name> <name><surname>Ng</surname><given-names>TP</given-names></name> <etal/></person-group>. <article-title>The Asia-Pacific clinical practice guidelines for the management of frailty</article-title>. <source>J Am Med Dir Assoc</source>. (<year>2017</year>) <volume>18</volume>:<fpage>564</fpage>&#x2013;<lpage>75</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jamda.2017.04.018</pub-id></mixed-citation></ref>
<ref id="ref14"><label>14.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lyu</surname><given-names>H</given-names></name> <name><surname>Jiang</surname><given-names>W</given-names></name></person-group>. <article-title>Development and internal and external validation of a nomogram model for frailty risk among hospitalised older people using comprehensive geriatric assessment data</article-title>. <source>BMC Geriatr</source>. (<year>2023</year>) <volume>23</volume>:<fpage>712</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12877-023-04426-8</pub-id></mixed-citation></ref>
<ref id="ref15"><label>15.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Xiaodan</surname><given-names>L</given-names></name> <name><surname>Jianhua</surname><given-names>W</given-names></name> <name><surname>Jiantong</surname><given-names>S</given-names></name> <name><surname>Hui</surname><given-names>H</given-names></name> <name><surname>Yujia</surname><given-names>Z</given-names></name> <name><surname>Yaping</surname><given-names>C</given-names></name> <etal/></person-group>. <article-title>Methodology and steps for the production of a systematic evaluation of predictive models</article-title>. <source>Chin J Evid Based Med</source>. (<year>2023</year>) <volume>23</volume>:<fpage>602</fpage>&#x2013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.7507/1672-2531.202212112</pub-id></mixed-citation></ref>
<ref id="ref16"><label>16.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname><given-names>Y</given-names></name> <name><surname>Bang</surname><given-names>H</given-names></name> <name><surname>Kim</surname><given-names>DJ</given-names></name></person-group>. <article-title>How to establish clinical prediction models</article-title>. <source>Endocrinol Metab</source>. (<year>2016</year>) <volume>31</volume>:<fpage>38</fpage>&#x2013;<lpage>44</lpage>. doi: <pub-id pub-id-type="doi">10.3803/EnM.2016.31.1.38</pub-id>, <pub-id pub-id-type="pmid">26996421</pub-id></mixed-citation></ref>
<ref id="ref17"><label>17.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kong</surname><given-names>L-N</given-names></name> <name><surname>Yang</surname><given-names>L</given-names></name> <name><surname>Lyu</surname><given-names>Q</given-names></name> <name><surname>Liu</surname><given-names>D-X</given-names></name> <name><surname>Yang</surname><given-names>J</given-names></name></person-group>. <article-title>Risk prediction models for frailty in older adults: A systematic review and critical appraisal</article-title>. <source>Int J Nurs Stud</source>. (<year>2025</year>) <volume>167</volume>:<fpage>105068</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ijnurstu.2025.105068</pub-id>, <pub-id pub-id-type="pmid">40184783</pub-id></mixed-citation></ref>
<ref id="ref18"><label>18.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rajula</surname><given-names>HSR</given-names></name> <name><surname>Verlato</surname><given-names>G</given-names></name> <name><surname>Manchia</surname><given-names>M</given-names></name> <name><surname>Antonucci</surname><given-names>N</given-names></name> <name><surname>Fanos</surname><given-names>V</given-names></name></person-group>. <article-title>Comparison of conventional statistical methods with machine learning in medicine: diagnosis, drug development, and treatment</article-title>. <source>Medicina (Mex)</source>. (<year>2020</year>) <volume>56</volume>:<fpage>455</fpage>. doi: <pub-id pub-id-type="doi">10.3390/medicina56090455</pub-id></mixed-citation></ref>
<ref id="ref19"><label>19.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Buch</surname><given-names>VH</given-names></name> <name><surname>Ahmed</surname><given-names>I</given-names></name> <name><surname>Maruthappu</surname><given-names>M</given-names></name></person-group>. <article-title>Artificial intelligence in medicine: current trends and future possibilities</article-title>. <source>Br J Gen Pract</source>. (<year>2018</year>) <volume>68</volume>:<fpage>143</fpage>&#x2013;<lpage>4</lpage>. doi: <pub-id pub-id-type="doi">10.3399/bjgp18X695213</pub-id>, <pub-id pub-id-type="pmid">29472224</pub-id></mixed-citation></ref>
<ref id="ref20"><label>20.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Collins</surname><given-names>GS</given-names></name> <name><surname>Moons</surname><given-names>KGM</given-names></name> <name><surname>Dhiman</surname><given-names>P</given-names></name> <name><surname>Riley</surname><given-names>RD</given-names></name> <name><surname>Beam</surname><given-names>AL</given-names></name> <name><surname>Van Calster</surname><given-names>B</given-names></name> <etal/></person-group>. <article-title>TRIPOD+AI statement: updated guidance for reporting clinical prediction models that use regression or machine learning methods</article-title>. <source>BMJ</source>. (<year>2024</year>):<fpage>e078378</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj-2023-078378</pub-id>, <pub-id pub-id-type="pmid">38626948</pub-id></mixed-citation></ref>
<ref id="ref21"><label>21.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yuxin</surname><given-names>C</given-names></name> <name><surname>Yongfen</surname><given-names>L</given-names></name> <name><surname>Xiaorong</surname><given-names>H</given-names></name> <name><surname>Jie</surname><given-names>Y</given-names></name> <name><surname>Dieer</surname><given-names>H</given-names></name></person-group>. <article-title>Systematic evaluation of the effectiveness of machine learning models applied to the prediction of debilitating risks in community-dwelling older adults</article-title>. <source>Geriatr Res</source>. (<year>2025</year>) <volume>6</volume>:<fpage>49</fpage>&#x2013;<lpage>55</lpage>. doi: <pub-id pub-id-type="doi">10.3969/j.issn.2096-9058.2025.01.010</pub-id></mixed-citation></ref>
<ref id="ref22"><label>22.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Moons</surname><given-names>KGM</given-names></name> <name><surname>Damen</surname><given-names>JAA</given-names></name> <name><surname>Kaul</surname><given-names>T</given-names></name> <name><surname>Hooft</surname><given-names>L</given-names></name> <name><surname>Andaur Navarro</surname><given-names>C</given-names></name> <name><surname>Dhiman</surname><given-names>P</given-names></name> <etal/></person-group>. <article-title>PROBAST+AI: an updated quality, risk of bias, and applicability assessment tool for prediction models using regression or artificial intelligence methods</article-title>. <source>BMJ</source>. (<year>2025</year>) <volume>388</volume>:<fpage>e082505</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj-2024-082505</pub-id>, <pub-id pub-id-type="pmid">40127903</pub-id></mixed-citation></ref>
<ref id="ref23"><label>23.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Snell</surname><given-names>KIE</given-names></name> <name><surname>Levis</surname><given-names>B</given-names></name> <name><surname>Damen</surname><given-names>JAA</given-names></name> <name><surname>Dhiman</surname><given-names>P</given-names></name> <name><surname>Debray</surname><given-names>TPA</given-names></name> <name><surname>Hooft</surname><given-names>L</given-names></name> <etal/></person-group>. <article-title>Transparent reporting of multivariable prediction models for individual prognosis or diagnosis: checklist for systematic reviews and meta-analyses (TRIPOD-SRMA)</article-title>. <source>BMJ</source>. (<year>2023</year>) <volume>381</volume>:<fpage>e073538</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj-2022-073538</pub-id>, <pub-id pub-id-type="pmid">37137496</pub-id></mixed-citation></ref>
<ref id="ref24"><label>24.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Page</surname><given-names>MJ</given-names></name> <name><surname>McKenzie</surname><given-names>JE</given-names></name> <name><surname>Bossuyt</surname><given-names>PM</given-names></name> <name><surname>Boutron</surname><given-names>I</given-names></name> <name><surname>Hoffmann</surname><given-names>TC</given-names></name> <name><surname>Mulrow</surname><given-names>CD</given-names></name> <etal/></person-group>. <article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title>. <source>BMJ</source>. (<year>2021</year>) <volume>372</volume>:<fpage>n71</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id>, <pub-id pub-id-type="pmid">33782057</pub-id></mixed-citation></ref>
<ref id="ref25"><label>25.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Moons</surname><given-names>KGM</given-names></name> <name><surname>De Groot</surname><given-names>JAH</given-names></name> <name><surname>Bouwmeester</surname><given-names>W</given-names></name> <name><surname>Vergouwe</surname><given-names>Y</given-names></name> <name><surname>Mallett</surname><given-names>S</given-names></name> <name><surname>Altman</surname><given-names>DG</given-names></name> <etal/></person-group>. <article-title>Critical appraisal and data extraction for systematic reviews of prediction modelling studies: the CHARMS checklist</article-title>. <source>PLoS Med</source>. (<year>2014</year>) <volume>11</volume>:<fpage>e1001744</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pmed.1001744</pub-id>, <pub-id pub-id-type="pmid">25314315</pub-id></mixed-citation></ref>
<ref id="ref26"><label>26.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Altman</surname><given-names>DG</given-names></name> <name><surname>Bland</surname><given-names>JM</given-names></name></person-group>. <article-title>How to obtain the confidence interval from a P value</article-title>. <source>BMJ</source>. (<year>2011</year>) <volume>343</volume>:<fpage>d2090</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj.d2090</pub-id>, <pub-id pub-id-type="pmid">21824904</pub-id></mixed-citation></ref>
<ref id="ref27"><label>27.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Debray</surname><given-names>TP</given-names></name> <name><surname>Damen</surname><given-names>JA</given-names></name> <name><surname>Riley</surname><given-names>RD</given-names></name> <name><surname>Snell</surname><given-names>K</given-names></name> <name><surname>Reitsma</surname><given-names>JB</given-names></name> <name><surname>Hooft</surname><given-names>L</given-names></name> <etal/></person-group>. <article-title>A framework for meta-analysis of prediction model studies with binary and time-to-event outcomes</article-title>. <source>Stat Methods Med Res</source>. (<year>2019</year>) <volume>28</volume>:<fpage>2768</fpage>&#x2013;<lpage>86</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0962280218785504</pub-id>, <pub-id pub-id-type="pmid">30032705</pub-id></mixed-citation></ref>
<ref id="ref28"><label>28.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>DerSimonian</surname><given-names>R</given-names></name> <name><surname>Laird</surname><given-names>N</given-names></name></person-group>. <article-title>Meta-analysis in clinical trials revisited</article-title>. <source>Contemp Clin Trials</source>. (<year>2015</year>) <volume>45</volume>:<fpage>139</fpage>&#x2013;<lpage>45</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cct.2015.09.002</pub-id>, <pub-id pub-id-type="pmid">26343745</pub-id></mixed-citation></ref>
<ref id="ref29"><label>29.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Thorlund</surname><given-names>K</given-names></name> <name><surname>Wetterslev</surname><given-names>J</given-names></name> <name><surname>Awad</surname><given-names>T</given-names></name> <name><surname>Thabane</surname><given-names>L</given-names></name> <name><surname>Gluud</surname><given-names>C</given-names></name></person-group>. <article-title>Comparison of statistical inferences from the DerSimonian-Laird and alternative random-effects model meta-analyses - an empirical assessment of 920 Cochrane primary outcome meta-analyses</article-title>. <source>Res Synth Methods</source>. (<year>2011</year>) <volume>2</volume>:<fpage>238</fpage>&#x2013;<lpage>53</lpage>. doi: <pub-id pub-id-type="doi">10.1002/jrsm.53</pub-id>, <pub-id pub-id-type="pmid">26061888</pub-id></mixed-citation></ref>
<ref id="ref30"><label>30.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dong</surname><given-names>Y</given-names></name> <name><surname>Wang</surname><given-names>Q</given-names></name> <name><surname>Zhang</surname><given-names>K</given-names></name> <name><surname>Wang</surname><given-names>X</given-names></name> <name><surname>Liu</surname><given-names>H</given-names></name> <name><surname>Chen</surname><given-names>Y</given-names></name> <etal/></person-group>. <article-title>Development and validation of a prediction model of frailty risk in community-dwelling older adults: from a national longitudinal survey</article-title>. <source>Public Health</source>. (<year>2025</year>) <volume>240</volume>:<fpage>63</fpage>&#x2013;<lpage>70</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.puhe.2024.12.055</pub-id>, <pub-id pub-id-type="pmid">39874915</pub-id></mixed-citation></ref>
<ref id="ref31"><label>31.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fan</surname><given-names>S</given-names></name> <name><surname>Ye</surname><given-names>J</given-names></name> <name><surname>Xu</surname><given-names>Q</given-names></name> <name><surname>Peng</surname><given-names>R</given-names></name> <name><surname>Hu</surname><given-names>B</given-names></name> <name><surname>Pei</surname><given-names>Z</given-names></name> <etal/></person-group>. <article-title>Digital health technology combining wearable gait sensors and machine learning improve the accuracy in prediction of frailty</article-title>. <source>Front Public Health</source>. (<year>2023</year>) <volume>11</volume>:<fpage>1169083</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpubh.2023.1169083</pub-id></mixed-citation></ref>
<ref id="ref32"><label>32.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname><given-names>L</given-names></name> <name><surname>Chen</surname><given-names>H</given-names></name> <name><surname>Liang</surname><given-names>Z</given-names></name></person-group>. <article-title>Enhancing the convenience of frailty index assessment for elderly Chinese people with machine learning methods</article-title>. <source>Sci Rep</source>. (<year>2024</year>) <volume>14</volume>:<fpage>23227</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-024-74194-x</pub-id>, <pub-id pub-id-type="pmid">39369089</pub-id></mixed-citation></ref>
<ref id="ref33"><label>33.</label><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Jung</surname><given-names>H</given-names></name> <name><surname>Kim</surname><given-names>M</given-names></name> <name><surname>Won</surname><given-names>CW</given-names></name> <name><surname>Kim</surname><given-names>J</given-names></name> <name><surname>Mun</surname><given-names>K-R</given-names></name></person-group>. <article-title>Machine learning-based classification and risk factor analysis of frailty in Korean community-dwelling older adults</article-title> In: <source>2023 45th annual international conference of the IEEE engineering in medicine &#x0026; biology society (EMBC)</source>. <publisher-loc>Sydney, Australia</publisher-loc>: <publisher-name>IEEE</publisher-name> (<year>2023</year>). <fpage>1</fpage>&#x2013;<lpage>4</lpage>.</mixed-citation></ref>
<ref id="ref34"><label>34.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>Q</given-names></name> <name><surname>Yang</surname><given-names>L</given-names></name> <name><surname>Shi</surname><given-names>Z</given-names></name> <name><surname>Yu</surname><given-names>J</given-names></name> <name><surname>Si</surname><given-names>H</given-names></name> <name><surname>Jin</surname><given-names>Y</given-names></name> <etal/></person-group>. <article-title>Development and validation of a preliminary clinical support system for measuring the probability of incident 2-year (pre)frailty among community-dwelling older adults: A prospective cohort study</article-title>. <source>Int J Med Inform</source>. (<year>2023</year>) <volume>177</volume>:<fpage>105138</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2023.105138</pub-id>, <pub-id pub-id-type="pmid">37516037</pub-id></mixed-citation></ref>
<ref id="ref35"><label>35.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Qi</surname><given-names>L</given-names></name> <name><surname>Liu</surname><given-names>J</given-names></name> <name><surname>Song</surname><given-names>X</given-names></name> <name><surname>Wang</surname><given-names>X</given-names></name> <name><surname>Yang</surname><given-names>M</given-names></name> <name><surname>Cao</surname><given-names>X</given-names></name> <etal/></person-group>. <article-title>Determinants and risk prediction models for frailty among community-living older adults in eastern China</article-title>. <source>Front Public Health</source>. (<year>2025</year>) <volume>13</volume>:<fpage>1518472</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpubh.2025.1518472</pub-id></mixed-citation></ref>
<ref id="ref36"><label>36.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname><given-names>Y</given-names></name> <name><surname>Jia</surname><given-names>M</given-names></name> <name><surname>Xiang</surname><given-names>C</given-names></name> <name><surname>Fang</surname><given-names>Y</given-names></name></person-group>. <article-title>Latent trajectories of frailty and risk prediction models among geriatric community dwellers: an interpretable machine learning perspective</article-title>. <source>BMC Geriatr</source>. (<year>2022</year>) <volume>22</volume>:<fpage>900</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12877-022-03576-5</pub-id></mixed-citation></ref>
<ref id="ref37"><label>37.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname><given-names>M</given-names></name> <name><surname>Liu</surname><given-names>Y</given-names></name> <name><surname>Miura</surname><given-names>KW</given-names></name> <name><surname>Matsumoto</surname><given-names>M</given-names></name> <name><surname>Jiao</surname><given-names>D</given-names></name> <name><surname>Zhu</surname><given-names>Z</given-names></name> <etal/></person-group>. <article-title>Identification and prediction of frailty among community-dwelling older Japanese adults based on Bayesian network analysis: a cross-sectional and longitudinal study</article-title>. <source>BMC Public Health</source>. (<year>2024</year>) <volume>24</volume>:<fpage>2141</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12889-024-19697-y</pub-id></mixed-citation></ref>
<ref id="ref38"><label>38.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname><given-names>Y</given-names></name> <name><surname>Lin</surname><given-names>S</given-names></name> <name><surname>Huang</surname><given-names>X</given-names></name> <name><surname>Li</surname><given-names>N</given-names></name> <name><surname>Zheng</surname><given-names>J</given-names></name> <name><surname>Huang</surname><given-names>F</given-names></name> <etal/></person-group>. <article-title>The identification and prediction of frailty based on Bayesian network analysis in a community-dwelling older population</article-title>. <source>BMC Geriatr</source>. (<year>2022</year>) <volume>22</volume>:<fpage>847</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12877-022-03520-7</pub-id></mixed-citation></ref>
<ref id="ref39"><label>39.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>W</given-names></name> <name><surname>Wang</surname><given-names>J</given-names></name> <name><surname>Xie</surname><given-names>F</given-names></name> <name><surname>Wang</surname><given-names>X</given-names></name> <name><surname>Dong</surname><given-names>S</given-names></name> <name><surname>Luo</surname><given-names>N</given-names></name> <etal/></person-group>. <article-title>Development and validation of machine learning models to predict frailty risk for elderly</article-title>. <source>J Adv Nurs</source>. (<year>2024</year>) <volume>80</volume>:<fpage>5064</fpage>&#x2013;<lpage>75</lpage>. doi: <pub-id pub-id-type="doi">10.1111/jan.16192</pub-id>, <pub-id pub-id-type="pmid">38605460</pub-id></mixed-citation></ref>
<ref id="ref40"><label>40.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shmueli</surname><given-names>G</given-names></name></person-group>. <article-title>To explain or to predict?</article-title> <source>Stat Sci</source>. (<year>2010</year>) <volume>25</volume>:<fpage>289</fpage>&#x2013;<lpage>310</lpage>. doi: <pub-id pub-id-type="doi">10.1214/10-STS330</pub-id></mixed-citation></ref>
<ref id="ref41"><label>41.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Andersen</surname><given-names>PK</given-names></name> <name><surname>Geskus</surname><given-names>RB</given-names></name> <name><surname>de Witte</surname><given-names>T</given-names></name> <name><surname>Putter</surname><given-names>H</given-names></name></person-group>. <article-title>Competing risks in epidemiology: possibilities and pitfalls</article-title>. <source>Int J Epidemiol</source>. (<year>2012</year>) <volume>41</volume>:<fpage>861</fpage>&#x2013;<lpage>70</lpage>. doi: <pub-id pub-id-type="doi">10.1093/ije/dyr213</pub-id>, <pub-id pub-id-type="pmid">22253319</pub-id></mixed-citation></ref>
<ref id="ref42"><label>42.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>Q</given-names></name> <name><surname>Wang</surname><given-names>Q</given-names></name> <name><surname>Wang</surname><given-names>D</given-names></name> <name><surname>Lao</surname><given-names>J</given-names></name> <name><surname>Yang</surname><given-names>Y</given-names></name> <name><surname>Tang</surname><given-names>F</given-names></name> <etal/></person-group>. <article-title>Construction and application of a mortality risk prediction model for patients with lung squamous cell carcinoma: a competing risk analysis</article-title>. <source>J Cancer Res Ther</source>. (<year>2025</year>) <volume>21</volume>:<fpage>810</fpage>&#x2013;<lpage>7</lpage>. doi: <pub-id pub-id-type="doi">10.4103/jcrt.jcrt_791_25</pub-id>, <pub-id pub-id-type="pmid">40905864</pub-id></mixed-citation></ref>
<ref id="ref43"><label>43.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>Z</given-names></name> <name><surname>Wang</surname><given-names>S</given-names></name> <name><surname>Xu</surname><given-names>Z</given-names></name> <name><surname>Sun</surname><given-names>Y</given-names></name> <name><surname>Zhou</surname><given-names>X</given-names></name> <name><surname>Zhou</surname><given-names>R</given-names></name> <etal/></person-group>. <article-title>Frailty risk prediction models in maintenance hemodialysis patients: a systematic review and meta-analysis of studies from China</article-title>. <source>Ren Fail</source>. (<year>2025</year>) <volume>47</volume>:<fpage>2500663</fpage>. doi: <pub-id pub-id-type="doi">10.1080/0886022X.2025.2500663</pub-id></mixed-citation></ref>
<ref id="ref44"><label>44.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Collard</surname><given-names>RM</given-names></name> <name><surname>Boter</surname><given-names>H</given-names></name> <name><surname>Schoevers</surname><given-names>RA</given-names></name> <name><surname>Oude Voshaar</surname><given-names>RC</given-names></name></person-group>. <article-title>Prevalence of frailty in community-dwelling older persons: a systematic review</article-title>. <source>J Am Geriatr Soc</source>. (<year>2012</year>) <volume>60</volume>:<fpage>1487</fpage>&#x2013;<lpage>92</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1532-5415.2012.04054.x</pub-id>, <pub-id pub-id-type="pmid">22881367</pub-id></mixed-citation></ref>
<ref id="ref45"><label>45.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dent</surname><given-names>E</given-names></name> <name><surname>Kowal</surname><given-names>P</given-names></name> <name><surname>Hoogendijk</surname><given-names>EO</given-names></name></person-group>. <article-title>Frailty measurement in research and clinical practice: a review</article-title>. <source>Eur J Intern Med</source>. (<year>2016</year>) <volume>31</volume>:<fpage>3</fpage>&#x2013;<lpage>10</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ejim.2016.03.007</pub-id>, <pub-id pub-id-type="pmid">27039014</pub-id></mixed-citation></ref>
<ref id="ref46"><label>46.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sison</surname><given-names>SDM</given-names></name> <name><surname>Shi</surname><given-names>SM</given-names></name> <name><surname>Kim</surname><given-names>KM</given-names></name> <name><surname>Steinberg</surname><given-names>N</given-names></name> <name><surname>Jeong</surname><given-names>S</given-names></name> <name><surname>McCarthy</surname><given-names>EP</given-names></name> <etal/></person-group>. <article-title>A crosswalk of commonly used frailty scales</article-title>. <source>J Am Geriatr Soc</source>. (<year>2023</year>) <volume>71</volume>:<fpage>3189</fpage>. doi: <pub-id pub-id-type="doi">10.1111/jgs.18453</pub-id>, <pub-id pub-id-type="pmid">37289180</pub-id></mixed-citation></ref>
<ref id="ref47"><label>47.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Blodgett</surname><given-names>J</given-names></name> <name><surname>Theou</surname><given-names>O</given-names></name> <name><surname>Kirkland</surname><given-names>S</given-names></name> <name><surname>Andreou</surname><given-names>P</given-names></name> <name><surname>Rockwood</surname><given-names>K</given-names></name></person-group>. <article-title>Frailty in NHANES: comparing the frailty index and phenotype</article-title>. <source>Arch Gerontol Geriatr</source>. (<year>2015</year>) <volume>60</volume>:<fpage>464</fpage>&#x2013;<lpage>70</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.archger.2015.01.016</pub-id>, <pub-id pub-id-type="pmid">25697060</pub-id></mixed-citation></ref>
<ref id="ref48"><label>48.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname><given-names>Y-C</given-names></name> <name><surname>Chen</surname><given-names>C-T</given-names></name> <name><surname>Shen</surname><given-names>S-F</given-names></name> <name><surname>Chen</surname><given-names>L-K</given-names></name> <name><surname>Peng</surname><given-names>L-N</given-names></name> <name><surname>Tung</surname><given-names>H-H</given-names></name></person-group>. <article-title>Comparative analysis of frailty identification tools in community services across the Asia-Pacific: a systematic review and meta-analysis</article-title>. <source>J Nutr Health Aging</source>. (<year>2025</year>) <volume>29</volume>:<fpage>100496</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jnha.2025.100496</pub-id>, <pub-id pub-id-type="pmid">39889374</pub-id></mixed-citation></ref>
<ref id="ref49"><label>49.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vo</surname><given-names>NT</given-names></name> <name><surname>Tu</surname><given-names>YK</given-names></name> <name><surname>Lin</surname><given-names>KC</given-names></name> <name><surname>Chiu</surname><given-names>HY</given-names></name> <name><surname>Huang</surname><given-names>HC</given-names></name></person-group>. <article-title>Diagnostic accuracy of the FRAIL scale, Groningen frailty Indicator, Tilburg frailty Indicator, and PRISMA-7 for frailty screening among older adults in community settings: a systematic review and network meta-analysis</article-title>. <source>The Gerontologist</source>. (<year>2024</year>) <volume>64</volume>:<fpage>gnae008</fpage>. doi: <pub-id pub-id-type="doi">10.1093/geront/gnae008</pub-id>, <pub-id pub-id-type="pmid">38332716</pub-id></mixed-citation></ref>
<ref id="ref50"><label>50.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Aguayo</surname><given-names>GA</given-names></name> <name><surname>Donneau</surname><given-names>A-F</given-names></name> <name><surname>Vaillant</surname><given-names>MT</given-names></name> <name><surname>Schritz</surname><given-names>A</given-names></name> <name><surname>Franco</surname><given-names>OH</given-names></name> <name><surname>Stranges</surname><given-names>S</given-names></name> <etal/></person-group>. <article-title>Agreement between 35 published frailty scores in the general population</article-title>. <source>Am J Epidemiol</source>. (<year>2017</year>) <volume>186</volume>:<fpage>420</fpage>. doi: <pub-id pub-id-type="doi">10.1093/aje/kwx061</pub-id>, <pub-id pub-id-type="pmid">28633404</pub-id></mixed-citation></ref>
<ref id="ref51"><label>51.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Martin</surname><given-names>GP</given-names></name> <name><surname>Riley</surname><given-names>RD</given-names></name> <name><surname>Ensor</surname><given-names>J</given-names></name> <name><surname>Grant</surname><given-names>SW</given-names></name></person-group>. <article-title>Statistical primer: sample size considerations for developing and validating clinical prediction models</article-title>. <source>Eur J Cardiothorac Surg</source>. (<year>2025</year>) <volume>67</volume>:<fpage>ezaf142</fpage>. doi: <pub-id pub-id-type="doi">10.1093/ejcts/ezaf142</pub-id></mixed-citation></ref>
<ref id="ref52"><label>52.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Altman</surname><given-names>DG</given-names></name> <name><surname>Royston</surname><given-names>P</given-names></name></person-group>. <article-title>The cost of dichotomising continuous variables</article-title>. <source>BMJ</source>. (<year>2006</year>) <volume>332</volume>:<fpage>1080</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj.332.7549.1080</pub-id>, <pub-id pub-id-type="pmid">16675816</pub-id></mixed-citation></ref>
<ref id="ref53"><label>53.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Thoresen</surname><given-names>M</given-names></name></person-group>. <article-title>Spurious interaction as a result of categorization</article-title>. <source>BMC Med Res Methodol</source>. (<year>2019</year>) <volume>19</volume>:<fpage>28</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12874-019-0667-2</pub-id></mixed-citation></ref>
<ref id="ref54"><label>54.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Arnaud</surname><given-names>E</given-names></name> <name><surname>Elbattah</surname><given-names>M</given-names></name> <name><surname>Ammirati</surname><given-names>C</given-names></name> <name><surname>Dequen</surname><given-names>G</given-names></name> <name><surname>Ghazali</surname><given-names>DA</given-names></name></person-group>. <article-title>Predictive models in emergency medicine and their missing data strategies: a systematic review</article-title>. <source>NPJ Digit Med</source>. (<year>2023</year>) <volume>6</volume>:<fpage>28</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41746-023-00770-6</pub-id></mixed-citation></ref>
<ref id="ref55"><label>55.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nijman</surname><given-names>S</given-names></name> <name><surname>Leeuwenberg</surname><given-names>AM</given-names></name> <name><surname>Beekers</surname><given-names>I</given-names></name> <name><surname>Verkouter</surname><given-names>I</given-names></name> <name><surname>Jacobs</surname><given-names>J</given-names></name> <name><surname>Bots</surname><given-names>ML</given-names></name> <etal/></person-group>. <article-title>Missing data is poorly handled and reported in prediction model studies using machine learning: a literature review</article-title>. <source>J Clin Epidemiol</source>. (<year>2022</year>) <volume>142</volume>:<fpage>218</fpage>&#x2013;<lpage>29</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jclinepi.2021.11.023</pub-id>, <pub-id pub-id-type="pmid">34798287</pub-id></mixed-citation></ref>
<ref id="ref56"><label>56.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hong</surname><given-names>S</given-names></name> <name><surname>Lynn</surname><given-names>HS</given-names></name></person-group>. <article-title>Accuracy of random-forest-based imputation of missing data in the presence of non-normality, non-linearity, and interaction</article-title>. <source>BMC Med Res Methodol</source>. (<year>2020</year>) <volume>20</volume>:<fpage>199</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12874-020-01080-1</pub-id></mixed-citation></ref>
<ref id="ref57"><label>57.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kapoor</surname><given-names>S</given-names></name> <name><surname>Narayanan</surname><given-names>A</given-names></name></person-group>. <article-title>Leakage and the reproducibility crisis in machine-learning-based science</article-title>. <source>Patterns</source>. (<year>2023</year>) <volume>4</volume>:<fpage>100804</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.patter.2023.100804</pub-id>, <pub-id pub-id-type="pmid">37720327</pub-id></mixed-citation></ref>
<ref id="ref58"><label>58.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Alturayeif</surname><given-names>N</given-names></name> <name><surname>Hassine</surname><given-names>J</given-names></name></person-group>. <article-title>Data leakage detection in machine learning code: transfer learning, active learning, or low-shot prompting?</article-title> <source>PeerJ Comput Sci</source>. (<year>2025</year>) <volume>11</volume>:<fpage>e2730</fpage>. doi: <pub-id pub-id-type="doi">10.7717/peerj-cs.2730</pub-id>, <pub-id pub-id-type="pmid">40134878</pub-id></mixed-citation></ref>
<ref id="ref59"><label>59.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bernett</surname><given-names>J</given-names></name> <name><surname>Blumenthal</surname><given-names>DB</given-names></name> <name><surname>Grimm</surname><given-names>DG</given-names></name> <name><surname>Haselbeck</surname><given-names>F</given-names></name> <name><surname>Joeres</surname><given-names>R</given-names></name> <name><surname>Kalinina</surname><given-names>OV</given-names></name> <etal/></person-group>. <article-title>Guiding questions to avoid data leakage in biological machine learning applications</article-title>. <source>Nat Methods</source>. (<year>2024</year>) <volume>21</volume>:<fpage>1444</fpage>&#x2013;<lpage>53</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41592-024-02362-y</pub-id>, <pub-id pub-id-type="pmid">39122953</pub-id></mixed-citation></ref>
<ref id="ref60"><label>60.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vickers</surname><given-names>AJ</given-names></name> <name><surname>Elkin</surname><given-names>EB</given-names></name></person-group>. <article-title>Decision curve analysis: a novel method for evaluating prediction models</article-title>. <source>Med Decis Mak Int J Soc Med Decis Mak</source>. (<year>2006</year>) <volume>26</volume>:<fpage>565</fpage>&#x2013;<lpage>74</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0272989X06295361</pub-id>, <pub-id pub-id-type="pmid">17099194</pub-id></mixed-citation></ref>
<ref id="ref61"><label>61.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Van Calster</surname><given-names>B</given-names></name> <name><surname>McLernon</surname><given-names>DJ</given-names></name> <name><surname>van Smeden</surname><given-names>M</given-names></name> <name><surname>Wynants</surname><given-names>L</given-names></name> <name><surname>Steyerberg</surname><given-names>EW</given-names></name> <name><surname>Bossuyt</surname><given-names>P</given-names></name> <etal/></person-group>. <article-title>Calibration: the Achilles heel of predictive analytics</article-title>. <source>BMC Med</source>. (<year>2019</year>) <volume>17</volume>:<fpage>230</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12916-019-1466-7</pub-id></mixed-citation></ref>
<ref id="ref62"><label>62.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Davis</surname><given-names>SE</given-names></name> <name><surname>Greevy</surname><given-names>RA</given-names></name> <name><surname>Lasko</surname><given-names>TA</given-names></name> <name><surname>Walsh</surname><given-names>CG</given-names></name> <name><surname>Matheny</surname><given-names>ME</given-names></name></person-group>. <article-title>Detection of calibration drift in clinical prediction models to inform model updating</article-title>. <source>J Biomed Inform</source>. (<year>2020</year>) <volume>112</volume>:<fpage>103611</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103611</pub-id>, <pub-id pub-id-type="pmid">33157313</pub-id></mixed-citation></ref>
<ref id="ref63"><label>63.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Binuya</surname><given-names>MAE</given-names></name> <name><surname>Engelhardt</surname><given-names>EG</given-names></name> <name><surname>Schats</surname><given-names>W</given-names></name> <name><surname>Schmidt</surname><given-names>MK</given-names></name> <name><surname>Steyerberg</surname><given-names>EW</given-names></name></person-group>. <article-title>Methodological guidance for the evaluation and updating of clinical prediction models: a systematic review</article-title>. <source>BMC Med Res Methodol</source>. (<year>2022</year>) <volume>22</volume>:<fpage>316</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12874-022-01801-8</pub-id></mixed-citation></ref>
<ref id="ref64"><label>64.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Collins</surname><given-names>GS</given-names></name> <name><surname>de Groot</surname><given-names>JA</given-names></name> <name><surname>Dutton</surname><given-names>S</given-names></name> <name><surname>Omar</surname><given-names>O</given-names></name> <name><surname>Shanyinde</surname><given-names>M</given-names></name> <name><surname>Tajar</surname><given-names>A</given-names></name> <etal/></person-group>. <article-title>External validation of multivariable prediction models: a systematic review of methodological conduct and reporting</article-title>. <source>BMC Med Res Methodol</source>. (<year>2014</year>) <volume>14</volume>:<fpage>40</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1471-2288-14-40</pub-id></mixed-citation></ref>
<ref id="ref65"><label>65.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bates</surname><given-names>DW</given-names></name> <name><surname>Auerbach</surname><given-names>A</given-names></name> <name><surname>Schulam</surname><given-names>P</given-names></name> <name><surname>Wright</surname><given-names>A</given-names></name> <name><surname>Saria</surname><given-names>S</given-names></name></person-group>. <article-title>Reporting and implementing interventions involving machine learning and artificial intelligence</article-title>. <source>Ann Intern Med</source>. (<year>2020</year>) <volume>172</volume>:<fpage>S137</fpage>&#x2013;<lpage>44</lpage>. doi: <pub-id pub-id-type="doi">10.7326/M19-0872</pub-id>, <pub-id pub-id-type="pmid">32479180</pub-id></mixed-citation></ref>
<ref id="ref66"><label>66.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Siontis</surname><given-names>GCM</given-names></name> <name><surname>Tzoulaki</surname><given-names>I</given-names></name> <name><surname>Castaldi</surname><given-names>PJ</given-names></name> <name><surname>Ioannidis</surname><given-names>JPA</given-names></name></person-group>. <article-title>External validation of new risk prediction models is infrequent and reveals worse prognostic discrimination</article-title>. <source>J Clin Epidemiol</source>. (<year>2015</year>) <volume>68</volume>:<fpage>25</fpage>&#x2013;<lpage>34</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jclinepi.2014.09.007</pub-id>, <pub-id pub-id-type="pmid">25441703</pub-id></mixed-citation></ref>
<ref id="ref67"><label>67.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ramspek</surname><given-names>CL</given-names></name> <name><surname>Jager</surname><given-names>KJ</given-names></name> <name><surname>Dekker</surname><given-names>FW</given-names></name> <name><surname>Zoccali</surname><given-names>C</given-names></name> <name><surname>van Diepen</surname><given-names>M</given-names></name></person-group>. <article-title>External validation of prognostic models: what, why, how, when and where?</article-title> <source>Clin Kidney J</source>. (<year>2020</year>) <volume>14</volume>:<fpage>49</fpage>&#x2013;<lpage>58</lpage>. doi: <pub-id pub-id-type="doi">10.1093/ckj/sfaa188</pub-id></mixed-citation></ref>
<ref id="ref68"><label>68.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Linardatos</surname><given-names>P</given-names></name> <name><surname>Papastefanopoulos</surname><given-names>V</given-names></name> <name><surname>Kotsiantis</surname><given-names>S</given-names></name></person-group>. <article-title>Explainable AI: a review of machine learning interpretability methods</article-title>. <source>Entropy</source>. (<year>2020</year>) <volume>23</volume>:<fpage>18</fpage>. doi: <pub-id pub-id-type="doi">10.3390/e23010018</pub-id></mixed-citation></ref>
<ref id="ref69"><label>69.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Martin</surname><given-names>SA</given-names></name> <name><surname>Townend</surname><given-names>FJ</given-names></name> <name><surname>Barkhof</surname><given-names>F</given-names></name> <name><surname>Cole</surname><given-names>JH</given-names></name></person-group>. <article-title>Interpretable machine learning for dementia: a systematic review</article-title>. <source>Alzheimers Dement</source>. (<year>2023</year>) <volume>19</volume>:<fpage>2135</fpage>&#x2013;<lpage>49</lpage>. doi: <pub-id pub-id-type="doi">10.1002/alz.12948</pub-id></mixed-citation></ref>
<ref id="ref70"><label>70.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rajbahadur</surname><given-names>GK</given-names></name> <name><surname>Wang</surname><given-names>S</given-names></name> <name><surname>Kamei</surname><given-names>Y</given-names></name> <name><surname>Hassan</surname><given-names>AE</given-names></name></person-group>. <article-title>The impact of feature importance methods on the interpretation of defect classifiers</article-title>. <source>IEEE Trans Softw Eng</source>. (<year>2022</year>) <volume>48</volume>:<fpage>2245</fpage>&#x2013;<lpage>61</lpage>. doi: <pub-id pub-id-type="doi">10.1109/TSE.2021.3056941</pub-id></mixed-citation></ref>
<ref id="ref71"><label>71.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Howey</surname><given-names>R</given-names></name> <name><surname>Clark</surname><given-names>AD</given-names></name> <name><surname>Naamane</surname><given-names>N</given-names></name> <name><surname>Reynard</surname><given-names>LN</given-names></name> <name><surname>Pratt</surname><given-names>AG</given-names></name> <name><surname>Cordell</surname><given-names>HJ</given-names></name></person-group>. <article-title>A Bayesian network approach incorporating imputation of missing data enables exploratory analysis of complex causal biological relationships</article-title>. <source>PLoS Genet</source>. (<year>2021</year>) <volume>17</volume>:<fpage>e1009811</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pgen.1009811</pub-id>, <pub-id pub-id-type="pmid">34587167</pub-id></mixed-citation></ref>
<ref id="ref72"><label>72.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kyrimi</surname><given-names>E</given-names></name> <name><surname>Dube</surname><given-names>K</given-names></name> <name><surname>Fenton</surname><given-names>N</given-names></name> <name><surname>Fahmi</surname><given-names>A</given-names></name> <name><surname>Neves</surname><given-names>MR</given-names></name> <name><surname>Marsh</surname><given-names>W</given-names></name> <etal/></person-group>. <article-title>Bayesian networks in healthcare: what is preventing their adoption?</article-title> <source>Artif Intell Med</source>. (<year>2021</year>) <volume>116</volume>:<fpage>102079</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.artmed.2021.102079</pub-id>, <pub-id pub-id-type="pmid">34020755</pub-id></mixed-citation></ref>
<ref id="ref73"><label>73.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ponce-Bobadilla</surname><given-names>AV</given-names></name> <name><surname>Schmitt</surname><given-names>V</given-names></name> <name><surname>Maier</surname><given-names>CS</given-names></name> <name><surname>Mensing</surname><given-names>S</given-names></name> <name><surname>Stodtmann</surname><given-names>S</given-names></name></person-group>. <article-title>Practical guide to SHAP analysis: explaining supervised machine learning model predictions in drug development</article-title>. <source>Clin Transl Sci</source>. (<year>2024</year>) <volume>17</volume>:<fpage>e70056</fpage>. doi: <pub-id pub-id-type="doi">10.1111/cts.70056</pub-id>, <pub-id pub-id-type="pmid">39463176</pub-id></mixed-citation></ref>
<ref id="ref74"><label>74.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vellido</surname><given-names>A</given-names></name></person-group>. <article-title>The importance of interpretability and visualization in machine learning for applications in medicine and health care</article-title>. <source>Neural Comput &#x0026; Applic</source>. (<year>2020</year>) <volume>32</volume>:<fpage>18069</fpage>&#x2013;<lpage>83</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00521-019-04051-w</pub-id></mixed-citation></ref>
<ref id="ref75"><label>75.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname><given-names>Y</given-names></name> <name><surname>Lapane</surname><given-names>KL</given-names></name> <name><surname>Tjia</surname><given-names>J</given-names></name> <name><surname>Baek</surname><given-names>J</given-names></name> <name><surname>Liu</surname><given-names>S-H</given-names></name> <name><surname>Ulbricht</surname><given-names>CM</given-names></name></person-group>. <article-title>Trajectories of physical frailty and cognitive impairment in older adults in United States nursing homes</article-title>. <source>BMC Geriatr</source>. (<year>2022</year>) <volume>22</volume>:<fpage>339</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12877-022-03012-8</pub-id></mixed-citation></ref>
<ref id="ref76"><label>76.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vetter</surname><given-names>TR</given-names></name></person-group>. <article-title>Systematic review and meta-analysis: sometimes bigger is indeed better</article-title>. <source>Anesth Analg</source>. (<year>2019</year>) <volume>128</volume>:<fpage>575</fpage>. doi: <pub-id pub-id-type="doi">10.1213/ANE.0000000000004014</pub-id>, <pub-id pub-id-type="pmid">30649072</pub-id></mixed-citation></ref>
<ref id="ref77"><label>77.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Christodoulou</surname><given-names>E</given-names></name> <name><surname>Ma</surname><given-names>J</given-names></name> <name><surname>Collins</surname><given-names>GS</given-names></name> <name><surname>Steyerberg</surname><given-names>EW</given-names></name> <name><surname>Verbakel</surname><given-names>JY</given-names></name> <name><surname>Van Calster</surname><given-names>B</given-names></name></person-group>. <article-title>A systematic review shows no performance benefit of machine learning over logistic regression for clinical prediction models</article-title>. <source>J Clin Epidemiol</source>. (<year>2019</year>) <volume>110</volume>:<fpage>12</fpage>&#x2013;<lpage>22</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jclinepi.2019.02.004</pub-id>, <pub-id pub-id-type="pmid">30763612</pub-id></mixed-citation></ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0002">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2806781/overview">Kofi Sarpong Adu-Manu</ext-link>, University of Ghana, Ghana</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0003">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/773361/overview">Mack Shelley</ext-link>, Iowa State University, United States</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3019245/overview">Adhan Efendi</ext-link>, National Chin-Yi University of Technology, Taiwan</p>
</fn>
</fn-group>
</back>
</article>