<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2026.1763139</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Development and clinical application of a postoperative complication prognosis prediction model for gastric cancer patients based on automated machine learning with body fat rate</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Xue</surname><given-names>Song</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Dong</surname><given-names>Xiangning</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Wei</surname><given-names>Jie</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Hao</surname><given-names>Jiqing</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3309027/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Department of Oncology, The First Affiliated Hospital of Anhui Medical University</institution>, <city>Hefei</city>, <state>Anhui</state>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>Department of Oncology, First People&#x2019;s Hospital of Chuzhou</institution>, <city>Chuzhou</city>, <state>Anhui</state>,&#xa0;<country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Jiqing Hao, <email xlink:href="mailto:haojiqing@ahmu.edu.cn">haojiqing@ahmu.edu.cn</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-03">
<day>03</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>16</volume>
<elocation-id>1763139</elocation-id>
<history>
<date date-type="received">
<day>08</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>13</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>04</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Xue, Dong, Wei and Hao.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Xue, Dong, Wei and Hao</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-03">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Objective</title>
<p>To develop an automated machine learning (AutoML) framework integrating body composition indices&#x2014;notably Body Fat Rate (BFR)&#x2014;and clinicopathological features for predicting postoperative complications in gastric cancer patients, addressing limitations of traditional body mass index (BMI) assessment and enhancing clinical translatability.</p>
</sec>
<sec>
<title>Methods</title>
<p>In this retrospective cohort study, 1,023 gastric cancer patients undergoing radical gastrectomy (January 2020&#x2013;January 2025) were enrolled across two hospitals (716 training, 307 testing). A dual-optimization workflow included: (1) Simultaneous feature selection and hyperparameter tuning via the Improved Hike Optimization Algorithm (IHOA); (2) Class imbalance mitigation using synthetic minority oversampling technique (SMOTE). Model performance was evaluated through accuracy, sensitivity, specificity, F1-score, area under the receiver operating characteristic curve (AUC-ROC), area under the precision-recall curve (AUC-PR), calibration curves, and decision curve analysis (DCA). Feature robustness was validated using least absolute shrinkage and selection operator regression, while SHapley Additive exPlanations (SHAP) interpreted predictor contributions. A MATLAB-based proof-of-concept prototype visualization tool was developed for implementation.</p>
</sec>
<sec>
<title>Results</title>
<p>In independent testing, AutoML maintained robust performance (ROC-AUC = 0.9380, PR-AUC = 0.9262). DCA revealed greater net clinical benefit across risk thresholds (1%&#x2013;93%) compared to conventional methods, with sustained high-level stability confirming superior generalizability. Calibration curves demonstrated optimal probabilistic prediction (lowest test-set Brier score = 0.111). SHAP analysis identified BFR, visceral fat density (VFD), visceral fat area (VFA), skeletal muscle area (SMA), C-reactive protein (CRP), BMI, Age and lymphadenectomy extent as key predictors.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>The AutoML prediction model developed in this study achieves both high precision and strong interpretability. Its visualized tool effectively overcomes barriers to clinical translation, providing intelligent decision support for early warning and personalized intervention of postoperative complications in gastric cancer.</p>
</sec>
</abstract>
<kwd-group>
<kwd>body fat rate</kwd>
<kwd>explainable artificial intelligence (XAI)</kwd>
<kwd>gastric cancer</kwd>
<kwd>improved hike optimization algorithm</kwd>
<kwd>machine learning</kwd>
<kwd>postoperative complications</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This study was supported by: Key Project of Scientific Research in Universities of Anhui Province (Project No.: 2022AH050763); Anhui Medical University Youth Science Fund (Project No.: 2022xkj080).</funding-statement>
</funding-group>
<counts>
<fig-count count="7"/>
<table-count count="4"/>
<equation-count count="1"/>
<ref-count count="28"/>
<page-count count="15"/>
<word-count count="6390"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Gastrointestinal Cancers: Gastric and Esophageal Cancers</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Gastric cancer, a highly prevalent malignant tumor of the digestive system globally, exhibits both incidence and mortality rates ranking among the highest for malignancies in China, posing a severe threat to population well-being (<xref ref-type="bibr" rid="B1">1</xref>). Surgical resection serves as the primary curative approach for gastric cancer; however, the risk of postoperative recurrence and metastasis remains elevated, with a 5-year survival rate of merely 30%&#x2013;40% and significant interindividual prognostic heterogeneity (<xref ref-type="bibr" rid="B2">2</xref>). Thus, accurate postoperative complication risk assessment and personalized treatment strategies are crucial for improving patient survival outcomes. Traditional prognostic evaluation systems predominantly rely on pathological indicators such as tumor stage and differentiation grade. While clinically valuable to some extent, these parameters fail to comprehensively reflect patients&#x2019; systemic status and disease progression potential, limiting assessment precision (<xref ref-type="bibr" rid="B3">3</xref>).</p>
<p>Advancing precision medicine has propelled multidimensional prognostic prediction models to the forefront of oncology research. Body Fat Rate (BFR), a vital indicator reflecting nutritional status and metabolic levels, has garnered widespread attention for its association with cancer prognosis. Studies confirm that abnormal BFR levels (either elevated or reduced) may heighten postoperative recurrence risk and shorten survival in gastric cancer patients by impairing immune function, exacerbating inflammatory responses, and altering tumor microenvironments (<xref ref-type="bibr" rid="B4">4</xref>). Notably, the traditional Body Mass Index (BMI), employed for obesity assessment, inadequately captures adipose tissue accumulation patterns and spatial distribution (<xref ref-type="bibr" rid="B5">5</xref>). In contrast, BFR measurement offers rapid evaluation with operational simplicity, low cost, and zero radiation exposure risk&#x2014;making it suitable for large-scale population screening. The incorporation of BFR represents a significant advance beyond conventional anthropometric indicators such as BMI. Unlike BMI, which quantifies general body mass without distinguishing adipose distribution or metabolic status, BFR specifically evaluates fat deposition patterns that directly modulate inflammatory cascades in surgical contexts. This physiological distinction provides a novel dimension for risk stratification previously unattainable through traditional nutritional assessments. Nevertheless, whether BFR serves as an independent predictor of postoperative complication risk in gastric cancer requires further investigation (<xref ref-type="bibr" rid="B6">6</xref>).</p>
<p>The emergence of Automated Machine Learning (AutoML) technology provides innovative solutions for mining and modeling complex medical data. Compared to conventional machine learning, AutoML automates feature engineering, model selection, and hyperparameter tuning&#x2014;reducing subjectivity and operational complexity while effectively uncovering latent data correlations to significantly enhance model performance and generalizability (<xref ref-type="bibr" rid="B7">7</xref>). Currently, AutoML has demonstrated promising applications in prognostic prediction for cancers such as lung and breast cancer, yet research integrating AutoML with BFR for postoperative complication risk assessment in gastric cancer remains scarce.</p>
<p>To address this gap, this study aims to integrate BFR, clinicopathological features, and laboratory test results of gastric cancer patients to construct a postoperative complication risk prediction model using AutoML technology. Through systematic validation of the model&#x2019;s predictive accuracy, stability, and clinical utility, we seek to elucidate the prognostic value of BFR in gastric cancer and provide novel insights for precision prevention and clinical management.</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Study participants and data collection</title>
<p>This retrospective cohort study enrolled 1,023 gastric cancer patients who underwent radical gastrectomy at The First Affiliated Hospital of Anhui Medical University (n=815) and Chuzhou First People&#x2019;s Hospital (n=208) from January 2020 to January 2025. Ethical approval (No. 83220465) was granted by the Institutional Review Board of The First Affiliated Hospital of Anhui Medical University, with waived informed consent in accordance with the Declaration of Helsinki. Patients were selected based on strict criteria:</p>
<p>Inclusion criteria: (1) Histopathologically confirmed non-metastatic gastric adenocarcinoma; (2) Radical gastrectomy performed; (3) No neoadjuvant radiotherapy or chemotherapy; (4) Complete clinical and follow-up records.</p>
<p>Exclusion criteria: (1) Non-gastric malignancy or distant metastasis; (2) Incomplete body composition data [BFR, BMI, Visceral Fat Density (VFD), Visceral Fat Area (VFA)]; (3) Concurrent malignancies.</p>
<p>Data were extracted from electronic medical records using structured templates and verified by two certified researchers. Collected features included: (1) Demographics: Age, sex. (2) Clinicopathological characteristics: AJCC 8th edition TNM stage (<xref ref-type="bibr" rid="B8">8</xref>), tumor location (cardia/body/antrum), histological grade (well-moderate/poor-undifferentiated), surgical approach (laparoscopic/open), lymphadenectomy extent (D1/D2). (3) Body composition metrics: BMI (kg/m&#xb2;) calculated from preoperative height/weight. VFD (g/cm&#xb3;), BFR (%), VFA (cm&#xb2;), Subcutaneous Fat Area (SFA, cm&#xb2;), and Skeletal Muscle Area (SMA, cm&#xb2;) derived from preoperative abdominal CT scans at L3 level using Slice-O-Matic software. (4) Preoperative laboratory markers (within 1 week pre-surgery): Serum albumin (ALB, g/L), prealbumin (PA, mg/L), hemoglobin (Hb, g/L), white blood cell count (WBC, &#xd7;10<sup>9</sup>/L), C-reactive protein (CRP, mg/L). (5) Outcome: Postoperative complications within 30 days (Clavien-Dindo grade &#x2265;II defining clinically significant events) (<xref ref-type="bibr" rid="B9">9</xref>).</p>
<p>This study minimized data loss at the source through stringent inclusion and exclusion criteria. In the final analytical sample, only a few variables exhibited minimal random missing values (all missing rates &#x2264;6.0%). To ensure sample completeness and statistical power for subsequent analyzes and predictive models, different single imputation strategies were adopted based on variable types and distribution characteristics: mean imputation was used for normally distributed continuous variables (e.g., SMA, ALB, Hb), while median imputation was applied to non-normally distributed continuous variables (e.g., BFR, VFA, VFD, WBC, CRP). All categorical variables were complete in this dataset; however, planned mode imputation would address minor missingness if present, as detailed in <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Data missingness and handling methods for study variables.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Feature</th>
<th valign="middle" align="center">Missing count<break/>(Missing rate)</th>
<th valign="middle" align="center">Handling method</th>
</tr>
</thead>
<tbody>
<tr>
<th valign="middle" colspan="3" align="left">Categorical variables</th>
</tr>
<tr>
<td valign="middle" align="left">Sex</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">No missing</td>
</tr>
<tr>
<td valign="middle" align="left">TNM stage</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">No missing</td>
</tr>
<tr>
<td valign="middle" align="left">Tumor location</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">No missing</td>
</tr>
<tr>
<td valign="middle" align="left">Histological differentiation</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">No missing</td>
</tr>
<tr>
<td valign="middle" align="left">Surgical approach</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">No missing</td>
</tr>
<tr>
<td valign="middle" align="left">Lymphadenectomy</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">No missing</td>
</tr>
<tr>
<th valign="middle" colspan="3" align="left">Continuous variables (Normally distributed, Mean &#xb1; SD)</th>
</tr>
<tr>
<td valign="middle" align="left">Age</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">No missing</td>
</tr>
<tr>
<td valign="middle" align="left">BMI</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">No missing</td>
</tr>
<tr>
<td valign="middle" align="left">SMA</td>
<td valign="middle" align="center">8 (3.2%)</td>
<td valign="middle" align="center">Mean imputation</td>
</tr>
<tr>
<td valign="middle" align="left">ALB</td>
<td valign="middle" align="center">5 (2.0%)</td>
<td valign="middle" align="center">Mean imputation</td>
</tr>
<tr>
<td valign="middle" align="left">Hb</td>
<td valign="middle" align="center">3 (1.2%)</td>
<td valign="middle" align="center">Mean imputation</td>
</tr>
<tr>
<th valign="middle" colspan="3" align="left">Continuous variables (Non-normally distributed, Median [Q1, Q3])</th>
</tr>
<tr>
<td valign="middle" align="left">BFR</td>
<td valign="middle" align="center">12 (4.8%)</td>
<td valign="middle" align="center">Median imputation</td>
</tr>
<tr>
<td valign="middle" align="left">VFA</td>
<td valign="middle" align="center">12 (4.8%)</td>
<td valign="middle" align="center">Median imputation</td>
</tr>
<tr>
<td valign="middle" align="left">SFA</td>
<td valign="middle" align="center">12 (4.8%)</td>
<td valign="middle" align="center">Median imputation</td>
</tr>
<tr>
<td valign="middle" align="left">VFD</td>
<td valign="middle" align="center">15 (6.0%)</td>
<td valign="middle" align="center">Median imputation</td>
</tr>
<tr>
<td valign="middle" align="left">PA</td>
<td valign="middle" align="center">5 (2.0%)</td>
<td valign="middle" align="center">Median imputation</td>
</tr>
<tr>
<td valign="middle" align="left">WBC</td>
<td valign="middle" align="center">10 (4.0%)</td>
<td valign="middle" align="center">Median imputation</td>
</tr>
<tr>
<td valign="middle" align="left">CRP</td>
<td valign="middle" align="center">10 (4.0%)</td>
<td valign="middle" align="center">Median imputation</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Automated machine learning</title>
<p>815 patients from The First Affiliated Hospital of Anhui Medical University served as the training set, while 208 patients from Chuzhou First People&#x2019;s Hospital constituted the testing set. All models were implemented in MATLAB 2024b. Five-fold cross-validation was applied to the training set to mitigate overfitting, and Synthetic Minority Over-sampling Technique (SMOTE) was executed on the training set to address class imbalance.</p>
<p>We propose an AutoML framework driven by the Improved Hike Optimization Algorithm (IHOA) to jointly optimize feature selection and hyperparameter tuning for predicting postoperative complications. The original Hike Optimization Algorithm (HOA) is a novel metaheuristic algorithm inspired by natural aurora phenomena. Key improvements were implemented: (1) Population initialization using Logistic chaotic mapping, mathematically defined as <inline-formula>
<mml:math display="inline" id="im1"><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>n</mml:mi><mml:mo>+</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>&#x3bc;</mml:mi><mml:msub><mml:mi>x</mml:mi><mml:mi>n</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mi>n</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> (where <inline-formula>
<mml:math display="inline" id="im2"><mml:mrow><mml:mi>&#x3bc;</mml:mi><mml:mo>&#x2208;</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mn>3.57</mml:mn><mml:mo>,</mml:mo><mml:mn>4</mml:mn><mml:mo stretchy="false">]</mml:mo></mml:mrow></mml:math></inline-formula> denotes the chaotic parameter), which significantly enhances initial traversal in the solution space and facilitates escaping local optima; (2) A dynamic L&#xe9;vy flight strategy to adjust search step sizes, computed as <inline-formula>
<mml:math display="inline" id="im3"><mml:mrow><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mi>e</mml:mi><mml:mi>p</mml:mi><mml:mo>=</mml:mo><mml:mi>&#x3b1;</mml:mi><mml:mo>&#x2295;</mml:mo><mml:mi>L</mml:mi><mml:mi>e</mml:mi><mml:mo>'</mml:mo><mml:mi>v</mml:mi><mml:mi>y</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>&#x3b2;</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> (where <inline-formula>
<mml:math display="inline" id="im4"><mml:mi>&#x3b1;</mml:mi></mml:math></inline-formula> is the scale parameter, <inline-formula>
<mml:math display="inline" id="im5"><mml:mo>&#x2295;</mml:mo></mml:math></inline-formula> represents the dot product, and <inline-formula>
<mml:math display="inline" id="im6"><mml:mrow><mml:mi>L</mml:mi><mml:mi>e</mml:mi><mml:mo>'</mml:mo><mml:mi>v</mml:mi><mml:mi>y</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>&#x3b2;</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> follows a L&#xe9;vy distribution with exponent <inline-formula>
<mml:math display="inline" id="im7"><mml:mi>&#x3b2;</mml:mi></mml:math></inline-formula>). This strategy employs larger steps for global exploration in early iterations and adaptively reduces step sizes for local exploitation in later stages, achieving dynamic exploration-exploitation balance. The enhanced IHOA was first evaluated on the CEC2022 benchmark test functions to validate its superiority over the original HOA and other mainstream metaheuristic algorithms. At the empirical level, dual validation was performed through clinical prediction models: robustness testing via artificial injection of progressive data perturbations (0%&#x2013;15% noise and 0%&#x2013;30% missing values), alongside a feature selection module assessing model complexity control capabilities.</p>
<p>The core of this AutoML framework is a two-stage optimization workflow (pseudocode in <xref ref-type="supplementary-material" rid="SM1"><bold>Appendix A</bold></xref>). In Stage 1 (discrete space optimization), IHOA is applied to feature selection, where each candidate solution (i.e., individual position) is encoded as a binary vector representing a feature subset. Model-based feature importance weights (e.g., XGBoost) serve as prior knowledge to guide the IHOA search, with the fitness function being a weighted combination of performance metrics (e.g., AUC) evaluated on the validation set using a base classifier (e.g., logistic regression). This selects high-weight feature subsets with strong discriminative power and low redundancy. In Stage 2 (continuous space optimization), IHOA optimizes hyperparameters of the target prediction model&#x2014;integrating classical algorithms including support vector machines, random forests, and gradient boosting trees&#x2014;for the optimal subset identified in Stage 1. Hyperparameter combinations are encoded as continuous vectors to maximize prediction performance on the validation set. Finally, for comprehensive evaluation, the proposed framework was compared against six widely-used machine learning models: Logistic Regression (LR), Support Vector Machine (SVM), Adaptive Boosting (AdaBoost), Extreme Gradient Boosting (XGBoost), and LightGBM. All models were evaluated using identical training-testing datasets to ensure fairness. The technical workflow is shown in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Technical workflow diagram.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1763139-g001.tif">
<alt-text content-type="machine-generated">Flowchart illustrating the development and evaluation of an improved PLO algorithm, progressing from research start through algorithm improvements, dual-stage optimization, comparison models, data processing, evaluation, interpretability, tool implementation, and culminating at research end.</alt-text>
</graphic></fig>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Evaluation metrics</title>
<p>A multidimensional evaluation system was established: (1) Classification performance: For the predictive model, six core metrics were adopted to systematically assess discriminative ability and stability in class-imbalanced scenarios: Accuracy (ACC), Sensitivity (SEN), Specificity (SPE), Precision (PRE), F1 score (harmonic mean of precision and recall), Area Under the ROC Curve (ROC-AUC), and Area Under the Precision-Recall Curve (PR-AUC). (2) Calibration performance: Calibration curves combined with the Brier score (lower scores indicate higher prediction accuracy) were used to evaluate probability prediction precision; the Hosmer&#x2013;Lemeshow test (&#x3c7;&#xb2; statistic) and Spiegelhalter test (z statistic) quantified calibration deviation (P &gt; 0.05 indicated good calibration). (3) Clinical application: Decision Curve Analysis (DCA) was applied to quantify clinical utility by calculating the net benefit (NB) at different threshold probabilities:</p>
<disp-formula>
<mml:math display="block" id="M1"><mml:mrow><mml:mi>N</mml:mi><mml:mi>B</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mi>N</mml:mi></mml:mfrac><mml:mo>&#x2212;</mml:mo><mml:mfrac><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mi>N</mml:mi></mml:mfrac><mml:mo>&#xd7;</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mi>p</mml:mi><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mrow></mml:math>
</disp-formula>
<p>where <italic>TP</italic> is true positives, <italic>FP</italic> is false positives, <italic>N</italic> is total sample size, and pt is the risk threshold. By comparing <italic>NB</italic> with reference lines for traditional intervention strategies, the effective interval for model-assisted decision-making was validated.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Interpretability analysis</title>
<p>Post AutoML feature screening, robustness was verified via LASSO regression, followed by SHapley Additive exPlanations (SHAP) for clinical interpretability: AutoML feature screening: Automatically identified prognosis-associated features. LASSO regression: Validated feature sparsity and stability using regularization. SHAP analysis: By calculating Shapley values for each feature, quantitative attribution of feature contributions to individual predictions was achieved; summary plots were comprehensively used to display global feature importance rankings, while waterfall plots, decision path plots, and force plots were employed to visually illustrate the interpretation process of specific prediction cases, thereby systematically revealing the model&#x2019;s intrinsic decision-making logic.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Interactive tool development</title>
<p>A proof-of-concept clinical decision support tool was developed using MATLAB 2024a App Designer due to its accelerated prototyping workflow for model-visualization integration and seamless compatibility with existing statistical preprocessing pipelines (Statistical Package for the Social Sciences, SPSS), integrating the optimal machine learning model.</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Statistical analyzes</title>
<p>All study data were uniformly imported into the SPSS 26.0 statistical analysis platform for standardized processing. Continuous variables with normal distribution were expressed as mean &#xb1; standard deviation (x&#x304;&#xb1; s), while those with non-normal distribution were denoted as median (interquartile range) (M [IQR]); categorical variables were expressed as frequency and percentage (n(%)). For inter-group comparisons, continuous variables first underwent normality testing: if both groups conformed to normal distribution, univariate t-test was applied; otherwise, Mann-Whitney U test was used. Categorical variables were compared using Pearson&#x2019;s chi-square test. Statistical significance was determined based on p-values (two-tailed test, significance threshold &#x3b1;=0.05), and results were presented in tabular formats.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Characteristics of study participants</title>
<p>A total of 1,023 subjects were included, with a mean age of 62.65 &#xb1; 10.16 years. Among them, 686 (67.06%) were male and 337 (32.94%) were female. The comparison of general characteristics between the training set and testing set is presented in <xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>. The results demonstrate balanced distributions across most demographic and clinical baseline features (P &gt; 0.05), with statistically significant differences observed only in isolated variables. Such limited discrepancies following random partitioning more closely reflect the natural variability inherent in real-world data, avoiding idealization biases that may arise from artificial overmatching. This consequently enhances the extrapolation potential and reliability of the models developed in this study for broader clinical scenarios.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Baseline characteristics of enrolled participants.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Features</th>
<th valign="middle" align="center">Training set (n=815)</th>
<th valign="middle" align="center">Testing set (n=208)</th>
<th valign="middle" align="center">Statistic</th>
<th valign="middle" align="center">P-value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Postoperative complications, n (%)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center">&#x3c7;&#xb2;=1.326</td>
<td valign="middle" align="center">0.250</td>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;No</td>
<td valign="middle" align="center">689 (84.54)</td>
<td valign="middle" align="center">169 (81.25)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Yes</td>
<td valign="middle" align="center">126 (15.46)</td>
<td valign="middle" align="center">39 (18.75)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Age (years), Mean &#xb1; SD</td>
<td valign="middle" align="center">62.54 &#xb1; 10.15</td>
<td valign="middle" align="center">63.07 &#xb1; 10.21</td>
<td valign="middle" align="center">t=-0.873</td>
<td valign="middle" align="center">0.383</td>
</tr>
<tr>
<td valign="middle" align="left">Sex, n(%)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center">&#x3c7;&#xb2;=1.161</td>
<td valign="middle" align="center">0.281</td>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Female</td>
<td valign="middle" align="center">275 (33.74)</td>
<td valign="middle" align="center">62 (29.81)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Male</td>
<td valign="middle" align="center">540 (66.26)</td>
<td valign="middle" align="center">146 (70.19)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">TNM stage, n(%)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center">&#x3c7;&#xb2;=2.466</td>
<td valign="middle" align="center">0.482</td>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;I</td>
<td valign="middle" align="center">238 (29.20)</td>
<td valign="middle" align="center">72 (34.62)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;II</td>
<td valign="middle" align="center">250 (30.67)</td>
<td valign="middle" align="center">60 (28.85)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;III</td>
<td valign="middle" align="center">281 (34.48)</td>
<td valign="middle" align="center">64 (30.77)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;IV</td>
<td valign="middle" align="center">46 (5.64)</td>
<td valign="middle" align="center">12 (5.77)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Tumor location, n(%)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center">&#x3c7;&#xb2;=2.734</td>
<td valign="middle" align="center">0.255</td>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Cardia</td>
<td valign="middle" align="center">170 (20.86)</td>
<td valign="middle" align="center">53 (25.48)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Gastric antrum</td>
<td valign="middle" align="center">369 (45.28)</td>
<td valign="middle" align="center">83 (39.90)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Gastric body</td>
<td valign="middle" align="center">276 (33.87)</td>
<td valign="middle" align="center">72 (34.62)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Histological differentiation, n(%)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center">&#x3c7;&#xb2;=2.264</td>
<td valign="middle" align="center">0.519</td>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Moderately differentiated</td>
<td valign="middle" align="center">264 (32.39)</td>
<td valign="middle" align="center">68 (32.69)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Poorly differentiated</td>
<td valign="middle" align="center">366 (44.91)</td>
<td valign="middle" align="center">87 (41.83)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Undifferentiated</td>
<td valign="middle" align="center">93 (11.41)</td>
<td valign="middle" align="center">22 (10.58)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Well-differentiated</td>
<td valign="middle" align="center">92 (11.29)</td>
<td valign="middle" align="center">31 (14.90)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Surgical approach, n(%)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center">&#x3c7;&#xb2;=0.208</td>
<td valign="middle" align="center">0.649</td>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Laparoscopic</td>
<td valign="middle" align="center">523 (64.17)</td>
<td valign="middle" align="center">137 (65.87)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;Open Surgery</td>
<td valign="middle" align="center">292 (35.83)</td>
<td valign="middle" align="center">71 (34.13)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">Lymphadenectomy, n(%)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
<td valign="middle" align="center">&#x3c7;&#xb2;=11.847</td>
<td valign="middle" align="center">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;D1</td>
<td valign="middle" align="center">141 (17.30)</td>
<td valign="middle" align="center">58 (27.88)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">&#x2003;D2</td>
<td valign="middle" align="center">674 (82.70)</td>
<td valign="middle" align="center">150 (72.12)</td>
<td valign="middle" align="center"/>
<td valign="middle" align="center"/>
</tr>
<tr>
<td valign="middle" align="left">BMI (kg/m&#xb2;), Mean &#xb1; SD</td>
<td valign="middle" align="center">22.82 &#xb1; 3.45</td>
<td valign="middle" align="center">22.88 &#xb1; 3.10</td>
<td valign="middle" align="center">t=-0.276</td>
<td valign="middle" align="center">0.782</td>
</tr>
<tr>
<td valign="middle" align="left">BFR (%), M [Q1, Q3]</td>
<td valign="middle" align="center">28.6 [24.2, 33.0]</td>
<td valign="middle" align="center">28.6 [24.3, 33.6]</td>
<td valign="middle" align="center">Z=-0.294</td>
<td valign="middle" align="center">0.769</td>
</tr>
<tr>
<td valign="middle" align="left">VFA (cm&#xb2;), M [Q1, Q3]</td>
<td valign="middle" align="center">100.7 [64.2, 130.6]</td>
<td valign="middle" align="center">106.7 [76.7, 147.6]</td>
<td valign="middle" align="center">Z=-2.809</td>
<td valign="middle" align="center">0.005</td>
</tr>
<tr>
<td valign="middle" align="left">SFA (cm&#xb2;), M [Q1, Q3]</td>
<td valign="middle" align="center">121.4 [87.7, 154.0]</td>
<td valign="middle" align="center">121.0 [86.5, 156.0]</td>
<td valign="middle" align="center">Z=0.208</td>
<td valign="middle" align="center">0.836</td>
</tr>
<tr>
<td valign="middle" align="left">SMA (cm&#xb2;), Mean &#xb1; SD</td>
<td valign="middle" align="center">119.04 &#xb1; 25.95</td>
<td valign="middle" align="center">118.40 &#xb1; 24.13</td>
<td valign="middle" align="center">t=0.338</td>
<td valign="middle" align="center">0.735</td>
</tr>
<tr>
<td valign="middle" align="left">VFD (g/cm&#xb3;), M [Q1, Q3]</td>
<td valign="middle" align="center">0.84 [0.77, 0.91]</td>
<td valign="middle" align="center">0.84 [0.78, 0.92]</td>
<td valign="middle" align="center">Z=-0.336</td>
<td valign="middle" align="center">0.737</td>
</tr>
<tr>
<td valign="middle" align="left">ALB (g/L), Mean &#xb1; SD</td>
<td valign="middle" align="center">38.47 &#xb1; 5.33</td>
<td valign="middle" align="center">38.48 &#xb1; 5.74</td>
<td valign="middle" align="center">t=-0.036</td>
<td valign="middle" align="center">0.971</td>
</tr>
<tr>
<td valign="middle" align="left">PA (mg/L), M [Q1, Q3]</td>
<td valign="middle" align="center">209.0 [176.5, 245.0]</td>
<td valign="middle" align="center">217.0 [175.8, 253.0]</td>
<td valign="middle" align="center">Z=-0.327</td>
<td valign="middle" align="center">0.744</td>
</tr>
<tr>
<td valign="middle" align="left">Hb (g/L), Mean &#xb1; SD</td>
<td valign="middle" align="center">124.22 &#xb1; 18.20</td>
<td valign="middle" align="center">125.23 &#xb1; 18.19</td>
<td valign="middle" align="center">t=-0.716</td>
<td valign="middle" align="center">0.474</td>
</tr>
<tr>
<td valign="middle" align="left">WBC (&#xd7;109/L), M [Q1, Q3]</td>
<td valign="middle" align="center">6.4 [5.1, 7.9]</td>
<td valign="middle" align="center">6.5 [5.2, 7.7]</td>
<td valign="middle" align="center">Z=0.358</td>
<td valign="middle" align="center">0.720</td>
</tr>
<tr>
<td valign="middle" align="left">CRP (mg/L), M [Q1, Q3]</td>
<td valign="middle" align="center">5.0 [0.6, 9.6]</td>
<td valign="middle" align="center">7.3 [1.5, 11.7]</td>
<td valign="middle" align="center">Z=-3.011</td>
<td valign="middle" align="center">0.002</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Comparative analysis of improved swarm intelligence algorithm performance</title>
<p>The IHOA demonstrated significant optimization advantages through standardized testing (see <xref ref-type="supplementary-material" rid="SM1"><bold>Appendix B</bold></xref>). By artificially injecting progressive data perturbations, this study evaluated the performance of the prognosis prediction model based on real-world clinical data. Experimental results revealed that all intelligent algorithms exhibited declining performance trends as perturbation intensity increased (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>). Under original data conditions, the five algorithms achieved an average prediction accuracy of AUC = 0.84; however, under extreme perturbations (15% noise + 30% missing values), model performance substantially decreased to an average AUC = 0.46&#x2014;a relative decline of 45.4%. Critically, the IHOA algorithm exhibited optimal stability: its prediction accuracy decreased from AUC = 0.91 under original conditions to AUC = 0.73 in high-perturbation scenarios, with a relative decrease rate (19.7%) markedly lower than other algorithm groups (all &gt;36%).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Robustness comparison of intelligent algorithms in predicting composite postoperative complication risk.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1763139-g002.tif">
<alt-text content-type="machine-generated">Box plot comparing the robustness of five AI algorithms (IHOA, HOA, ALO, HHO, WOA) for composite outcome prediction across increasing data interference scenarios, showing decreasing AUC performance with more noise and missing data; a dashed red line marks the clinical acceptance threshold at 0.7 AUC.</alt-text>
</graphic></fig>
<p>At the key feature identification level, the IHOA algorithm demonstrated superior concise characteristics (<xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>). It consistently screened 8 highly correlated predictors (average correlation coefficient r=0.67, SD = 0.08)&#x2014;a 26% reduction compared to the average 10.8 features selected by other algorithms. This feature refinement mechanism effectively reduced model complexity while maintaining predictive accuracy.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Clinical feature analysis and feature selection optimization.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1763139-g003.tif">
<alt-text content-type="machine-generated">Bar chart on the left shows feature-outcome correlation strengths for medical variables, with highest correlations for CRP, VFD, SMA, VFA, BFR, BMI, and lymph node dissection, all exceeding 0.6. Table on the right compares feature selection across five models by check marks or star symbols, indicating which variables each model selected for analysis.</alt-text>
</graphic></fig>
<p>Note: This figure demonstrates the stability performance of five intelligent algorithms (IHOA/HOA/ALO/HHO/WOA) under increasing data interference scenarios. The boxplots represent the distribution of cross-validated AUC values from 10 repeated experiments, while the scatter points indicate single experimental results. Algorithm color coding: IHOA (forest green), HOA (blue), ALO (red), HHO (purple), WOA (cyan). The red dashed line indicates the clinically acceptable threshold (AUC = 0.7), values below which are considered insufficient for clinical reference.</p>
<p>Note: This study compared the correlation strength between 18 clinical features and postoperative complication risk, and evaluated the feature selection performance of the IHOA algorithm against other optimization algorithms (HOA, ALO, HHO, WOA). The left panel displays the correlation coefficients (r) between each feature and the outcomes, with dark blue indicating highly correlated features (r&gt;0.5), light blue indicating weakly correlated features (r &#x2264; 0.5), and the gray dashed line representing the correlation threshold of 0.5. The right panel shows the feature selection results of the algorithms, where dark green squares represent features selected by IHSO, and light blue squares represent features selected by other algorithms.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Model training outcomes</title>
<p>Six machine learning models were systematically evaluated on the training set for accuracy, sensitivity, specificity, F1-score, and area-under-curve metrics. The AutoML model demonstrated comprehensive superiority, achieving ROC-AUC of 0.9580 and PR-AUC of 0.9577 (<xref ref-type="table" rid="T3"><bold>Table&#xa0;3</bold></xref>; <xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4A, B</bold></xref>). Notably, AutoML exhibited exceptional F1-score (0.8855), indicating strong clinical utility in balancing precision-recall tradeoffs. The algorithm ultimately selected eight key features: BFR, VFA, VFD, SMA, CRP, lymphadenectomy extent, BMI and Age.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Performance metrics of prediction models.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Data set</th>
<th valign="middle" align="left">Models</th>
<th valign="middle" align="center">PRE</th>
<th valign="middle" align="center">SEN</th>
<th valign="middle" align="center">SPE</th>
<th valign="middle" align="center">ACC</th>
<th valign="middle" align="center">F1</th>
<th valign="middle" align="center">ROC-AUC (95% CI)</th>
<th valign="middle" align="center">PR-AUC (95% CI)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Training set</td>
<td valign="middle" align="left">LR</td>
<td valign="middle" align="center">0.7743</td>
<td valign="middle" align="center">0.6492</td>
<td valign="middle" align="center">0.8215</td>
<td valign="middle" align="center">0.7379</td>
<td valign="middle" align="center">0.7063</td>
<td valign="middle" align="center">0.7969 [0.785, 0.809]</td>
<td valign="middle" align="center">0.7893 [0.777, 0.802]</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="center">0.6899</td>
<td valign="middle" align="center">0.7908</td>
<td valign="middle" align="center">0.6647</td>
<td valign="middle" align="center">0.7259</td>
<td valign="middle" align="center">0.7369</td>
<td valign="middle" align="center">0.8059 [0.793, 0.818]</td>
<td valign="middle" align="center">0.7829 [0.769, 0.797]</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Adaboost</td>
<td valign="middle" align="center">0.7714</td>
<td valign="middle" align="center">0.7631</td>
<td valign="middle" align="center">0.7866</td>
<td valign="middle" align="center">0.7752</td>
<td valign="middle" align="center">0.7672</td>
<td valign="middle" align="center">0.8510 [0.839, 0.863]</td>
<td valign="middle" align="center">0.8412 [0.829, 0.854]</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">XGBoost</td>
<td valign="middle" align="center">0.7601</td>
<td valign="middle" align="center">0.8723</td>
<td valign="middle" align="center">0.7402</td>
<td valign="middle" align="center">0.8043</td>
<td valign="middle" align="center">0.8123</td>
<td valign="middle" align="center">0.8812 [0.870, 0.892]</td>
<td valign="middle" align="center">0.8522 [0.840, 0.865]</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">LightGBM</td>
<td valign="middle" align="center">0.8787</td>
<td valign="middle" align="center">0.7800</td>
<td valign="middle" align="center">0.8984</td>
<td valign="middle" align="center">0.8409</td>
<td valign="middle" align="center">0.8264</td>
<td valign="middle" align="center">0.9161 [0.907, 0.925]</td>
<td valign="middle" align="center">0.9079 [0.898, 0.918]</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">AutoML</td>
<td valign="middle" align="center">0.9161</td>
<td valign="middle" align="center">0.8569</td>
<td valign="middle" align="center">0.9260</td>
<td valign="middle" align="center">0.8925</td>
<td valign="middle" align="center">0.8855</td>
<td valign="middle" align="center">0.9580 [0.951, 0.965]</td>
<td valign="middle" align="center">0.9577 [0.950, 0.965]</td>
</tr>
<tr>
<td valign="middle" align="left">Testing set</td>
<td valign="middle" align="left">LR</td>
<td valign="middle" align="center">0.6606</td>
<td valign="middle" align="center">0.7267</td>
<td valign="middle" align="center">0.6686</td>
<td valign="middle" align="center">0.6959</td>
<td valign="middle" align="center">0.6921</td>
<td valign="middle" align="center">0.7533 [0.725, 0.781]</td>
<td valign="middle" align="center">0.7395 [0.711, 0.768]</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="center">0.6471</td>
<td valign="middle" align="center">0.7333</td>
<td valign="middle" align="center">0.6450</td>
<td valign="middle" align="center">0.6865</td>
<td valign="middle" align="center">0.6875</td>
<td valign="middle" align="center">0.7363 [0.708, 0.765]</td>
<td valign="middle" align="center">0.6954 [0.666, 0.725]</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Adaboost</td>
<td valign="middle" align="center">0.8116</td>
<td valign="middle" align="center">0.7467</td>
<td valign="middle" align="center">0.8462</td>
<td valign="middle" align="center">0.7994</td>
<td valign="middle" align="center">0.7778</td>
<td valign="middle" align="center">0.8293 [0.802, 0.857]</td>
<td valign="middle" align="center">0.8070 [0.779, 0.835]</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">XGBoost</td>
<td valign="middle" align="center">0.7877</td>
<td valign="middle" align="center">0.7667</td>
<td valign="middle" align="center">0.8166</td>
<td valign="middle" align="center">0.7931</td>
<td valign="middle" align="center">0.7770</td>
<td valign="middle" align="center">0.8483 [0.822, 0.875]</td>
<td valign="middle" align="center">0.8391 [0.812, 0.866]</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">LightGBM</td>
<td valign="middle" align="center">0.8029</td>
<td valign="middle" align="center">0.7333</td>
<td valign="middle" align="center">0.8402</td>
<td valign="middle" align="center">0.7900</td>
<td valign="middle" align="center">0.7666</td>
<td valign="middle" align="center">0.8323 [0.805, 0.860]</td>
<td valign="middle" align="center">0.8306 [0.803, 0.858]</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">AutoML</td>
<td valign="middle" align="center">0.9124</td>
<td valign="middle" align="center">0.8333</td>
<td valign="middle" align="center">0.9290</td>
<td valign="middle" align="center">0.8840</td>
<td valign="middle" align="center">0.8711</td>
<td valign="middle" align="center">0.9380 [0.917, 0.959]</td>
<td valign="middle" align="center">0.9262 [0.904, 0.948]</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Training and validation performance of prediction models. <bold>(A)</bold> Training ROC curve; <bold>(B)</bold> Training PR curve; <bold>(C)</bold> Test ROC curve; <bold>(D)</bold> Test PR curve; <bold>(E)</bold> Test DCA curve; <bold>(F)</bold> Test calibration curve.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1763139-g004.tif">
<alt-text content-type="machine-generated">Panel A shows a line ROC curve comparing six machine learning models for classification performance, with AutoML achieving the highest AUC. Panel B displays a precision-recall curve for the same models, with AutoML again outperforming others. Panel C presents another ROC curve for a different dataset, where AutoML yields the highest AUC among the models. Panel D shows a corresponding precision-recall curve for these models, also favoring AutoML in AUC. Panel E depicts a decision curve analysis, highlighting superior net benefit for AutoML across varying threshold probabilities. Panel F presents calibration curves comparing predicted probability to observed frequency, with AutoML showing the lowest Brier score.</alt-text>
</graphic></fig>
<p>In independent testing, AutoML maintained robust performance (ROC-AUC = 0.9380, PR-AUC = 0.9262; <xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4C, D</bold></xref>). Decision curve analysis (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4E</bold></xref>) revealed greater net clinical benefit across risk thresholds (1%&#x2013;93%) compared to conventional methods, with sustained high-level stability confirming superior generalizability. Calibration curves (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4B</bold></xref>) demonstrated optimal probabilistic prediction (lowest test-set Brier score = 0.111).</p>
<p>Calibration statistics for all models are presented in <xref ref-type="table" rid="T4"><bold>Table&#xa0;4</bold></xref>. The Brier score demonstrated that the AutoML model (0.111) achieved the highest prediction accuracy, significantly outperforming other models (reduction of approximately 32&#x2013;49%). Calibration intercept analysis revealed that all models exhibited a mild overestimation tendency (intercepts ranged from &#x2013;0.151 to &#x2013;0.052). The AutoML&#x2019;s calibration intercept was closest to the ideal value of 0 (&#x2013;0.052), with minimal calibration bias, demonstrating significant superiority over other models. Calibration slope analysis indicated that AutoML&#x2019;s slope was closest to the ideal value of 1 (1.082), confirming its optimal balance between discrimination and calibration.</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>Calibration curve statistical results.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Model</th>
<th valign="middle" align="center">Brier score</th>
<th valign="middle" align="center">Calibration intercept</th>
<th valign="middle" align="center">Calibration slope</th>
<th valign="middle" align="center">Hosmer-Lemeshow &#x3c7;&#xb2;</th>
<th valign="middle" align="center">Hosmer-Lemeshow p-value</th>
<th valign="middle" align="center">Spiegelhalter z</th>
<th valign="middle" align="center">Spiegelhalter p-value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">LR</td>
<td valign="middle" align="center">0.203</td>
<td valign="middle" align="center">-0.132</td>
<td valign="middle" align="center">0.689</td>
<td valign="middle" align="center">19.110</td>
<td valign="middle" align="center">0.014</td>
<td valign="middle" align="center">-1.010</td>
<td valign="middle" align="center">0.311</td>
</tr>
<tr>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="center">0.216</td>
<td valign="middle" align="center">-0.139</td>
<td valign="middle" align="center">0.565</td>
<td valign="middle" align="center">29.850</td>
<td valign="middle" align="center">0.000</td>
<td valign="middle" align="center">-1.180</td>
<td valign="middle" align="center">0.239</td>
</tr>
<tr>
<td valign="middle" align="left">Adaboost</td>
<td valign="middle" align="center">0.168</td>
<td valign="middle" align="center">-0.151</td>
<td valign="middle" align="center">1.038</td>
<td valign="middle" align="center">20.850</td>
<td valign="middle" align="center">0.008</td>
<td valign="middle" align="center">-1.100</td>
<td valign="middle" align="center">0.269</td>
</tr>
<tr>
<td valign="middle" align="left">XGBoost</td>
<td valign="middle" align="center">0.161</td>
<td valign="middle" align="center">-0.090</td>
<td valign="middle" align="center">1.480</td>
<td valign="middle" align="center">11.400</td>
<td valign="middle" align="center">0.180</td>
<td valign="middle" align="center">-0.860</td>
<td valign="middle" align="center">0.388</td>
</tr>
<tr>
<td valign="middle" align="left">LightGBM</td>
<td valign="middle" align="center">0.164</td>
<td valign="middle" align="center">-0.095</td>
<td valign="middle" align="center">1.027</td>
<td valign="middle" align="center">10.820</td>
<td valign="middle" align="center">0.212</td>
<td valign="middle" align="center">-0.710</td>
<td valign="middle" align="center">0.478</td>
</tr>
<tr>
<td valign="middle" align="left">AutoML</td>
<td valign="middle" align="center">0.111</td>
<td valign="middle" align="center">-0.052</td>
<td valign="middle" align="center">1.082</td>
<td valign="middle" align="center">8.450</td>
<td valign="middle" align="center">0.391</td>
<td valign="middle" align="center">-0.450</td>
<td valign="middle" align="center">0.653</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The Hosmer-Lemeshow test showed that AutoML (&#x3c7;&#xb2;=8.450, p=0.391) passed the test with the highest p-value, indicating optimal calibration goodness-of-fit; LightGBM (&#x3c7;&#xb2;=10.820, p=0.212) and XGBoost (&#x3c7;&#xb2;=11.400, p=0.180) also passed the test, suggesting good calibration, while other models exhibited calibration bias (p&lt;0.05). Collectively, across all calibration metrics, the AutoML model demonstrated optimal performance in every dimension, validating its excellence in both prediction accuracy and calibration capability.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Key predictor analysis</title>
<sec id="s3_4_1">
<label>3.4.1</label>
<title>LASSO regression</title>
<p>LASSO regression identified 10 predictors within one standard error of minimum MSE (Lambda1SE): BFR, VFA, VFD, SMA, CRP, lymphadenectomy extent, BMI, ALB, SFA, and age, fully encompassing the AutoML-selected features (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref>).</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>LASSO regression results. <bold>(A)</bold> Coefficient trajectories; <bold>(B)</bold> Cross-validation error plot.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1763139-g005.tif">
<alt-text content-type="machine-generated">Panel A shows a cross-validated mean squared error (MSE) plot for Lasso regression, with error bars for each lambda value, and vertical lines marking LambdaMinMSE and Lambda1SE. Panel B displays a Lasso coefficient path plot with colored lines representing model coefficients across varying lambda, and the same vertical lines as in panel A.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_4_2">
<label>3.4.2</label>
<title>SHAP analysis</title>
<p>Feature importance ranking determined via SHAP analysis was: BFR &gt; VFD &gt; VFA &gt; SMA &gt; CRP &gt; BMI &gt; Age &gt; lymphadenectomy extent (<xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6A, B</bold></xref>). Analysis of decision paths across different risk levels (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6F</bold></xref>) reveals systematic differences in feature combinations between high-risk and low-risk patients. High-risk patients exhibit distinct rightward path deviations, indicating synergistic effects of multiple risk factors. Crucially, the interpretability analysis identified BFR as the foremost predictor through rigorous SHAP ranking, where optimal cutoff values synergistically interacted with visceral fat metrics to stratify complication risks. This multidimensional integration of body composition parameters enabled unprecedented granularity in predicting postoperative complication risk, with BFR contributing significantly to the model&#x2019;s discriminative ability.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>SHAP Interpretability Analysis. <bold>(A)</bold> The Shapley summary plot; <bold>(B)</bold> The Shapley feature importance plot; <bold>(C&#x2013;E)</bold> Waterfall plots illustrate the cumulative contribution process of each feature to individual patient predictions. The baseline value represents the model&#x2019;s average prediction for all patients, while feature contributions show how each feature affects the final prediction (red indicating increased risk, blue indicating decreased risk). The sum of all feature contributions yields the final predicted value; <bold>(F)</bold> The decision path plot compares decision pathways across multiple patients, demonstrating how different feature combinations lead to varying prediction outcomes. The horizontal axis shows predicted probabilities, the vertical axis lists features, and the curved pathways trace decision routes from baseline values to final predictions; <bold>(G&#x2013;I)</bold> Force plots visually demonstrate how each feature &#x201c;pushes&#x201d; predictions toward higher or lower risk directions. Red arrows indicate features pushing predictions toward higher risk, blue arrows indicate features pushing toward lower risk, with arrow length representing the magnitude of influence.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1763139-g006.tif">
<alt-text content-type="machine-generated">Multi-panel figure displaying SHAP analysis for a predictive model, including (A) a summary plot showing feature impact and importance, (B) a bar chart ranking features by average SHAP value, (C–E) waterfall plots visualizing individual patient feature contributions to prediction probabilities, (F) a decision path comparison line plot for multiple patients, and (G–I) force plots illustrating how features influence each patient's prediction outcome.</alt-text>
</graphic></fig>
<p>Case Interpretation.</p>
<p>Case 1: High-risk patient (ID 1, predicted probability: 83.85%).</p>
<p>This 56-year-old male had BFR = 34.9%, VFA = 120.0 cm&#xb2;, VFD = 0.73 g/cm&#xb3;, SMA = 126.87 cm&#xb2;, CRP = 11.1 mg/L, underwent D2 lymphadenectomy, and BMI = 25.8 kg/m&#xb2;. SHAP analysis identified two dominant risk drivers: VFD (SHAP = 0.3302) and BFR (SHAP = 0.2665). Suboptimal VFD (0.73 g/cm&#xb3; &lt; median 0.84 g/cm&#xb3;) suggesting inflammatory status was the primary risk amplifier, compounded by elevated BFR (34.9% &gt; median 28.6%). Moderate contributions came from VFA (SHAP = 0.0329) and CRP (SHAP = 0.0234). SMA&#x2019;s minor protective effect (SHAP=&#x2013;0.0052) was insufficient to counterbalance overall risk.</p>
<p>Case 2: Moderate-risk patient (ID 2, predicted probability: 50.23%).</p>
<p>This 63-year-old male had BFR = 29.8%, VFA = 128.7 cm&#xb2;, VFD = 0.81 g/cm&#xb3;, SMA = 69.53 cm&#xb2;, CRP = 2.5 mg/L, underwent D1 lymphadenectomy, and BMI = 24.4 kg/m&#xb2;. Severely reduced SMA (69.53 cm&#xb2; &lt; mean 119.04 cm&#xb2;) drove risk (SHAP = 0.2129), amplified by elevated VFA (128.7 cm&#xb2; &gt; median 100.7 cm&#xb2;; SHAP = 0.0835). Typical BFR (29.8% &#x2248; median 28.6%) and VFD (0.81 g/cm&#xb3; &#x2248; median 0.84 g/cm&#xb3;) contributed minimally (SHAP = 0.0300/0.0151). D1 lymphadenectomy slightly increased risk (SHAP = 0.0108), while protective age (SHAP=&#x2013;0.0160) and CRP (SHAP=&#x2013;0.0012) partially offset hazards.</p>
<p>Case 3: Low-risk patient (ID 3, predicted probability: 1.04%).</p>
<p>This 64-year-old male had BFR = 25.4%, VFA = 106.9 cm&#xb2;, VFD = 0.89 g/cm&#xb3;, SMA = 128.88 cm&#xb2;, CRP = 8.0 mg/L, underwent D2 lymphadenectomy, and BMI = 23.97 kg/m&#xb2;. Synergistic protective effects were observed: reduced BFR (25.4% &lt; median 28.6%; SHAP=&#x2013;0.0810), optimal VFD (0.89 g/cm&#xb3; &gt; median 0.84 g/cm&#xb3;; SHAP=&#x2013;0.0209), and SMA near mean (SHAP=&#x2013;0.0182). Elevated CRP (8.0 mg/L) was counteracted by dominant protective features. This case exemplifies the model&#x2019;s ability to identify low-risk profiles when multiple favorable factors coexist.</p>
</sec>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Interactive clinical tool</title>
<p>A proof-of-concept prototype visualization tool was developed that integrates the seven core predictors, providing support for analyzing the model&#x2019;s decision logic in a research context. As demonstrated in <xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref>, clinicians input feature values on the dashboard to instantly compute postoperative complication risk.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Visual interface demonstrating real-time risk assessment.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1763139-g007.tif">
<alt-text content-type="machine-generated">Postoperative complication risk prediction system interface for gastric cancer patients displaying input fields for clinical data, action buttons for Start, Save, Clean, and Help, and a result section indicating an eighty-three point eight five percent high risk of complications.</alt-text>
</graphic></fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>Gastric cancer incidence remains persistently high worldwide, with significant associations to obesity and metabolic diseases. Research indicates that higher BMI and visceral fat area (VFA) increase gastric cancer risk (<xref ref-type="bibr" rid="B10">10</xref>). Although treatment technology continues to advance, postoperative complications and tumor recurrence still pose severe threats to patient survival and prognosis (<xref ref-type="bibr" rid="B11">11</xref>). Consequently, identifying effective predictive indicators to improve surgical outcomes has become crucial.</p>
<p>The features selected were BFR, VFD, VFA, SMA, CRP, BMI, Age, lymphadenectomy extent. SHAP analysis showed identical importance ranking, confirming these as key predictors. This correlation occurs because SHAP values directly reflect features&#x2019; explanatory power: body composition metrics rank highest due to their strong nonlinear, highly specific relationship with prognosis. These indicators comprehensively reflect the body&#x2019;s antitumor &#x201c;baseline status,&#x201d; providing critical predictive information (<xref ref-type="bibr" rid="B12">12</xref>). BFR had the highest mean absolute SHAP value, indicating its strongest independent contribution, and SHAP patterns are consistent with prior biological hypotheses proposing BFR as an integrated biomarker linking nutrition metabolism and immune function (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B14">14</xref>). Beyond predictive superiority, BFR&#x2019;s clinical implementation offers practical advantages: as a radiation-free assessment requiring only non-specialized equipment, it substantially reduces operational costs compared to CT-derived indices while capturing pathophysiological processes like sarcopenic obesity&#x2014;patterns fundamentally invisible to BMI-based assessments. This positions BFR not merely as a supplementary metric, but as a paradigm-shifting biomarker that redefines perioperative risk evaluation frameworks. VFA and VFD influenced prognosis through direct mechanisms affecting tumor metastasis (<xref ref-type="bibr" rid="B15">15</xref>). SMA&#x2019;s importance stems from its supportive role in bodily repair and antitumor immunity (<xref ref-type="bibr" rid="B16">16</xref>). CRP&#x2019;s prognostic &#x201c;warning function&#x201d; amplified above 10 mg/L, but its independent SHAP contribution ranked lower than body composition metrics due to its dependence on metabolic status, though still higher than treatment-related indicators (<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B18">18</xref>). As a categorical variable, lymphadenectomy extent affects prognosis primarily through surgical standardization quality, with D2 dissection plus CRP&gt;10 mg/L representing a high-risk combination requiring enhanced monitoring (<xref ref-type="bibr" rid="B19">19</xref>). BMI had the lowest SHAP importance because it cannot distinguish detrimental visceral obesity from protective muscle mass (<xref ref-type="bibr" rid="B20">20</xref>).</p>
<p>This study systematically evaluated six machine learning models for postoperative complication risk prediction in gastric cancer patients, demonstrating AutoML&#x2019;s superior robustness in independent testing. The significantly enhanced predictive calibration performance of AutoML models relative to alternatives stems from their ability to integrate multidimensional indicators, including body composition parameters (BFR, VFA), inflammatory markers (CRP), clinical treatment variables (lymphadenectomy extent), and nutritional metrics (BMI), which encompass continuous and categorical data types with inherent inter-feature correlations (<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B22">22</xref>). Unlike traditional machine learning approaches like logistic regression and random forests, requiring manual feature selection, encoding, and dimensionality reduction&#x2014;processes vulnerable to human errors causing omission of critical features or introduction of redundant information&#x2014;AutoML employs automated feature engineering modules. These automatically identify distribution patterns across feature types, performing missing value imputation, outlier handling, feature interaction construction (e.g., BFR&#xd7;CRP multiplicative terms), and high-dimensional feature reduction. This comprehensively captures nonlinear relationships within multi-source data, overcoming performance bottlenecks caused by imperfect feature engineering in conventional models (<xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B24">24</xref>). Furthermore, AutoML enables unified modeling of multimodal data without manual format conversion, significantly improving adaptability to complex prognostic indicator systems (<xref ref-type="bibr" rid="B25">25</xref>). The integrated model search framework exhaustively explores preset model libraries (including logistic regression, random forests, XGBoost) while automatically evaluating generalization capabilities through cross-validation. Concurrently, intelligent algorithms such as Bayesian optimization and grid search efficiently optimize hyperparameters (learning rate, tree depth, regularization coefficients), rapidly identifying globally optimal parameter configurations within limited computational resources. This automated workflow substantially reduces technical barriers to model development, allowing rapid generation of clinically viable models without requiring specialized machine learning expertise, thereby meeting clinical demands for efficient predictive tool development (<xref ref-type="bibr" rid="B26">26</xref>&#x2013;<xref ref-type="bibr" rid="B28">28</xref>). Despite the robust discriminative capability of the model, potential clinical harms associated with misclassification warrant careful deliberation. False-positive predictions may precipitate unnecessary surveillance imaging or invasive procedures, thereby elevating healthcare expenditures and radiation exposure risks. Conversely, false negatives could delay critical interventions for conditions including anastomotic leaks and peritoneal metastases, potentially exacerbating prognostic outcomes through postponed therapeutic measures. To quantitatively mitigate these risks, our decision curve analysis demonstrates how model-guided decision-making outperforms conventional clinical strategies, particularly reducing overtreatment at threshold probabilities exceeding 20%. We therefore emphasize that predictions should be interpreted solely as probabilistic clinical decision support tools, not as definitive diagnostic determinants, to safeguard patient safety during implementation. Implementation Pathway: The integrated clinical decision support tool developed using MATLAB App Designer provides an executable solution for routine perioperative risk stratification. This platform enables surgeons to input patient-specific metrics &#x2013; including demographics, clinicopathological characteristics, and crucially, body composition parameters &#x2013; to generate real-time, individualized complication probability estimates visualized through interpretable SHAP plots. For the CDSS interface, no formal usability testing, clinician feedback collection, or decision-impact analysis has been conducted in this research phase. Its purpose is solely to visually demonstrate interpretability mechanisms, not as a clinical deployment-ready system. To enhance accessibility and mitigate implementation barriers related to VFA/VFD quantification via specialist-dependent CT analyzes, our framework strategically incorporates BFR as a radiation-free, cost-effective surrogate biomarker validated through feature interaction analysis. Future deployment will leverage multicenter cohorts to refine data interoperability via blockchain-secured protocols, standardizing variable acquisition while minimizing heterogeneity linked to regional treatment variations. This dual approach positions the model for phased integration into preoperative assessment clinics, ultimately guiding nutritional interventions and surgical planning.</p>
<p>This study established a comprehensive research framework covering &#x201c;data processing-model refinement-practical validation&#x201d; through systematic approaches. Despite these achievements, the following limitations persist: (1) Data limitations: The single-center design inherently restricts external validity and introduces potential selection bias from institutional treatment protocols. Completeness was constrained by clinical practice variations &#x2014; some medical institutions failed to comprehensively collect body composition indicators such as BFR and VFD due to diagnostic workflow disparities or inadequate documentation standards. This resulted in missing key features for certain samples. Although AutoML-based automated imputation strategies (including median imputation) were applied, potential impacts on the model&#x2019;s precision in capturing data characteristics remain. Furthermore, regarding performance generalization to a third hospital setting, our external validation using Chuzhou First People&#x2019;s Hospital data acknowledges significant barriers as hospitals with differing CT imaging protocols or alternative measurement methods (e.g., bioelectrical impedance vs. CT-based VFD) may exhibit substantial feature distribution shifts. On the other hand, the end points of this study were only limited to the prediction of postoperative complication risk, and the long-term outcomes were not further observed and analyzed. (2) Model limitations: The &#x201c;black-box&#x201d; nature of AutoML integrated modeling remains unresolved. While SHAP analysis quantifies feature importance (confirming BFR as a dominant predictor), it cannot visually reveal complex nonlinear interactions among features. Clinicians face high interpretation barriers to understanding the model&#x2019;s decision logic, impeding clinical translation efficiency. (3) Implementation challenges: Core indicators like BFR and VFA/VFD require quantitative abdominal CT analysis&#x2014;a non-routine practice in postoperative care that increases costs and patient burden, reducing clinical accessibility. Critically, if BFR distributions differ substantially across hospitals (e.g., due to population demographics or measurement protocols), the model&#x2019;s dependency on this predictor may require retraining or adaptive recalibration via local data. Our median imputation method partially mitigates missing data but cannot resolve systemic protocol variations. Unaccounted confounders&#x2014;including regional disparities in surgical quality (lymphadenectomy standards) and genetic heterogeneity&#x2014; could degrade predictive efficacy in real-world applications. Future multi-center collaborations must establish standardized body composition assessment protocols using low-cost alternatives and explicitly test robustness against &#xb1;20-30% BFR distribution shifts through prospective validation. Future work must enhance model adaptability by incorporating broader clinical contextual variables. Future directions include: Optimizing data management through multicenter prospective cohort studies with large samples to establish unified data collection protocols, reducing heterogeneity. Blockchain technology and intelligent data entry systems will be introduced to minimize human error and improve accuracy. Concurrently, techniques like multiple imputation and Generative Adversarial Networks (GANs) will repair missing data to enhance dataset quality. Improving model performance entails developing low-cost alternatives for body composition assessment to reduce implementation barriers. Prospective clinical validation across healthcare tiers will refine generalizability in primary hospitals. Mobile or Hospital Information System (HIS)-integrated prediction tools enabling automated data import and real-time forecasting will be created to maximize clinical utility.</p>
</sec>
<sec id="s5">
<label>5</label>
<title>Summary</title>
<p>This research establishes an AutoML framework for predicting gastric cancer surgical outcomes, identifying eight core prognostic features and validating BFR as the dominant predictor through SHAP analysis. Though demonstrating excellent performance, clinical implementation requires overcoming data heterogeneity and model interpretability challenges. Future work will optimize practical application through multi-center collaboration and technical innovations.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p></sec>
<sec id="s7" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by the Biomedical Ethics Committee of Anhui Medical University. The studies were conducted in accordance with the local legislation and institutional requirements. The ethics committee/institutional review board waived the requirement of written informed consent for participation from the participants or the participants&#x2019; legal guardians/next of kin because of the retrospective nature of this study, which utilized anonymized data extracted from electronic medical records, the ethics committee granted a waiver for individual informed consent.</p></sec>
<sec id="s8" sec-type="author-contributions">
<title>Author contributions</title>
<p>SX: Data curation, Formal analysis, Investigation, Methodology, Software, Writing &#x2013; original draft. XD: Data curation, Formal analysis, Investigation, Writing &#x2013; review &amp; editing. JW: Data curation, Formal analysis, Investigation, Writing &#x2013; review &amp; editing. JH: Funding acquisition, Methodology, Project administration, Resources, Writing &#x2013; review &amp; editing.</p></sec>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s11" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s12" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s13" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fonc.2026.1763139/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fonc.2026.1763139/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="DataSheet2.docx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yasuda</surname> <given-names>T</given-names></name>
<name><surname>Wang</surname> <given-names>YA</given-names></name>
</person-group>. 
<article-title>Gastric cancer immunosuppressive microenvironment heterogeneity: implications for therapy development</article-title>. <source>Trends Cancer</source>. (<year>2024</year>) <volume>10</volume>:<page-range>627&#x2013;42</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.trecan.2024.03.008</pub-id>, PMID: <pub-id pub-id-type="pmid">38600020</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<label>2</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>R&#xf6;cken</surname> <given-names>C</given-names></name>
</person-group>. 
<article-title>Predictive biomarkers in gastric cancer</article-title>. <source>J Cancer Res Clin Oncol</source>. (<year>2023</year>) <volume>149</volume>:<page-range>467&#x2013;81</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00432-022-04408-0</pub-id>, PMID: <pub-id pub-id-type="pmid">36260159</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<label>3</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Xia</surname> <given-names>JY</given-names></name>
<name><surname>Aadam</surname> <given-names>AA</given-names></name>
</person-group>. 
<article-title>Advances in screening and detection of gastric cancer</article-title>. <source>J Surg Onco</source>. (<year>2022</year>) <volume>125</volume>:<page-range>1104&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/jso.26844</pub-id>, PMID: <pub-id pub-id-type="pmid">35481909</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<label>4</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Tao</surname> <given-names>C</given-names></name>
<name><surname>Hong</surname> <given-names>W</given-names></name>
<name><surname>Yin</surname> <given-names>P</given-names></name>
<name><surname>Wu</surname> <given-names>S</given-names></name>
<name><surname>Fan</surname> <given-names>L</given-names></name>
<name><surname>Lei</surname> <given-names>Z</given-names></name>
<etal/>
</person-group>. 
<article-title>Nomogram based on body composition and prognostic nutritional index predicts survival after curative resection of gastric cancer</article-title>. <source>Acad Radiol</source>. (<year>2024</year>) <volume>31</volume>:<page-range>1940&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.acra.2023.10.057</pub-id>, PMID: <pub-id pub-id-type="pmid">37981487</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<label>5</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Jiang</surname> <given-names>X</given-names></name>
<name><surname>Ding</surname> <given-names>L</given-names></name>
<name><surname>Guo</surname> <given-names>Y</given-names></name>
<name><surname>Miao</surname> <given-names>X</given-names></name>
<name><surname>Zhao</surname> <given-names>K</given-names></name>
<name><surname>Chen</surname> <given-names>L</given-names></name>
<etal/>
</person-group>. 
<article-title>Association of metabolic syndrome and frailty with postoperative complications in older gastric cancer patients: a body composition perspective</article-title>. <source>Cancer Med</source>. (<year>2024</year>) <volume>13</volume>:<elocation-id>70194</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cam4.70194</pub-id>, PMID: <pub-id pub-id-type="pmid">39315666</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<label>6</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shuto</surname> <given-names>K</given-names></name>
<name><surname>Nabeya</surname> <given-names>Y</given-names></name>
<name><surname>Mori</surname> <given-names>M</given-names></name>
<name><surname>Yamazaki</surname> <given-names>M</given-names></name>
<name><surname>Kosugi</surname> <given-names>C</given-names></name>
<name><surname>Narushima</surname> <given-names>K</given-names></name>
<etal/>
</person-group>. 
<article-title>Postoperative changes in body composition predict long-term prognosis in patients with gastric cancer</article-title>. <source>Cancers (Basel)</source>. (<year>2025</year>) <volume>17</volume>:<elocation-id>738</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/cancers17050738</pub-id>, PMID: <pub-id pub-id-type="pmid">40075586</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<label>7</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chen</surname> <given-names>Y</given-names></name>
<name><surname>Wang</surname> <given-names>B</given-names></name>
<name><surname>Zhao</surname> <given-names>Y</given-names></name>
<name><surname>Shao</surname> <given-names>X</given-names></name>
<name><surname>Wang</surname> <given-names>M</given-names></name>
<name><surname>Ma</surname> <given-names>F</given-names></name>
<etal/>
</person-group>. 
<article-title>Metabolomic machine learning predictor for diagnosis and prognosis of gastric cancer</article-title>. <source>Nat Commun</source>. (<year>2024</year>) <volume>15</volume>:<fpage>1657</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-024-46043-y</pub-id>, PMID: <pub-id pub-id-type="pmid">38395893</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<label>8</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sun</surname> <given-names>X</given-names></name>
<name><surname>Zhao</surname> <given-names>Y</given-names></name>
<name><surname>Wang</surname> <given-names>X</given-names></name>
<name><surname>Lin</surname> <given-names>Y</given-names></name>
<name><surname>Zhang</surname> <given-names>P</given-names></name>
<name><surname>Yin</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>Prognostic utility of the newstage system integrating tumor regression grade and lymph node status for locally advanced gastric cancer treated with neoadjuvant chemoimmunotherapy</article-title>. <source>Int J Surg</source>. (<year>2025</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.1097/JS9.0000000000004119</pub-id>, PMID: <pub-id pub-id-type="pmid">41347286</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<label>9</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Tzelves</surname> <given-names>L</given-names></name>
<name><surname>Geraghty</surname> <given-names>R</given-names></name>
<name><surname>Mourmouris</surname> <given-names>P</given-names></name>
<name><surname>Chatzikrachtis</surname> <given-names>N</given-names></name>
<name><surname>Karavitakis</surname> <given-names>M</given-names></name>
<name><surname>Somani</surname> <given-names>B</given-names></name>
<etal/>
</person-group>. 
<article-title>Shockwave Lithotripsy Complications According to Modified Clavien-Dindo Grading System. A Systematic Review and meta-regression analysis in a sample of 115 randomized controlled trials</article-title>. <source>Eur Urol Focus</source>. (<year>2022</year>) <volume>8</volume>:<page-range>1452&#x2013;60</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.euf.2021.11.002</pub-id>, PMID: <pub-id pub-id-type="pmid">34848163</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<label>10</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Matsuoka</surname> <given-names>T</given-names></name>
<name><surname>Yashiro</surname> <given-names>M</given-names></name>
</person-group>. 
<article-title>Bioinformatics analysis and validation of potential markers associated with prediction and prognosis of gastric cancer</article-title>. <source>Int J Mol Sci</source>. (<year>2024</year>) <volume>25</volume>:<elocation-id>5880</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms25115880</pub-id>, PMID: <pub-id pub-id-type="pmid">38892067</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<label>11</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Jiang</surname> <given-names>Y</given-names></name>
<name><surname>Zhou</surname> <given-names>K</given-names></name>
<name><surname>Sun</surname> <given-names>Z</given-names></name>
<name><surname>Wang</surname> <given-names>H</given-names></name>
<name><surname>Xie</surname> <given-names>J</given-names></name>
<name><surname>Zhang</surname> <given-names>T</given-names></name>
<etal/>
</person-group>. 
<article-title>Non-invasive tumor microenvironment evaluation and treatment response prediction in gastric cancer using deep learning radiomics</article-title>. <source>Cell Rep Med</source>. (<year>2023</year>) <volume>4</volume>:<elocation-id>101146</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.xcrm.2023.101146</pub-id>, PMID: <pub-id pub-id-type="pmid">37557177</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<label>12</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sy-Janairo</surname> <given-names>MLL</given-names></name>
<name><surname>Janairo</surname> <given-names>JIB</given-names></name>
</person-group>. 
<article-title>Non-endoscopic applications of machine learning in gastric cancer: a systematic review</article-title>. <source>J Gastrointest Cancer</source>. (<year>2024</year>) <volume>55</volume>:<fpage>47</fpage>&#x2013;<lpage>64</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12029-023-00960-1</pub-id>, PMID: <pub-id pub-id-type="pmid">37477782</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<label>13</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>J</given-names></name>
<name><surname>Xu</surname> <given-names>S</given-names></name>
<name><surname>Zhu</surname> <given-names>F</given-names></name>
<name><surname>Shen</surname> <given-names>F</given-names></name>
<name><surname>Zhang</surname> <given-names>T</given-names></name>
<name><surname>Wan</surname> <given-names>X</given-names></name>
<etal/>
</person-group>. 
<article-title>Multi-omics combined with machine learning facilitating the diagnosis of gastric cancer</article-title>. <source>Curr Med Chem</source>. (<year>2024</year>) <volume>31</volume>:<page-range>6692&#x2013;712</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2174/0109298673284520240112055108</pub-id>, PMID: <pub-id pub-id-type="pmid">38351697</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<label>14</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Demirhan</surname> <given-names>DB</given-names></name>
<name><surname>Ylmaz</surname> <given-names>H</given-names></name>
<name><surname>Erol</surname> <given-names>H</given-names></name>
<name><surname>Kayili</surname> <given-names>HM</given-names></name>
<name><surname>Salih</surname> <given-names>B</given-names></name>
</person-group>. 
<article-title>Prediction of gastric cancer by machine learning integrated with mass spectrometry-based N-glycomics</article-title>. <source>Analyst</source>. (<year>2023</year>) <volume>148</volume>:<page-range>2073&#x2013;80</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1039/d2an02057b</pub-id>, PMID: <pub-id pub-id-type="pmid">37009642</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<label>15</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cai</surname> <given-names>ZR</given-names></name>
<name><surname>Zheng</surname> <given-names>YQ</given-names></name>
<name><surname>Hu</surname> <given-names>Y</given-names></name>
<name><surname>Ma</surname> <given-names>MY</given-names></name>
<name><surname>Wu</surname> <given-names>YJ</given-names></name>
<name><surname>Liu</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>Construction of exosome non-coding RNA feature for non-invasive, early detection of gastric cancer patients by machine learning: a multi-cohort study</article-title>. <source>Gut</source>. (<year>2025</year>) <volume>74</volume>:<page-range>884&#x2013;93</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/gutjnl-2024-333522</pub-id>, PMID: <pub-id pub-id-type="pmid">39753334</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<label>16</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Qiu</surname> <given-names>B</given-names></name>
<name><surname>Zheng</surname> <given-names>Y</given-names></name>
<name><surname>Liu</surname> <given-names>S</given-names></name>
<name><surname>Song</surname> <given-names>R</given-names></name>
<name><surname>Wu</surname> <given-names>L</given-names></name>
<name><surname>Lu</surname> <given-names>C</given-names></name>
<etal/>
</person-group>. 
<article-title>Multitask deep learning based on longitudinal CT images facilitates prediction of lymph node metastasis and survival in chemotherapy-treated gastric cancer</article-title>. <source>Cancer Res</source>. (<year>2025</year>) <volume>85</volume>:<page-range>2527&#x2013;36</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1158/0008-5472.CAN-24-4190</pub-id>, PMID: <pub-id pub-id-type="pmid">40305075</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<label>17</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Azari</surname> <given-names>H</given-names></name>
<name><surname>Nazari</surname> <given-names>E</given-names></name>
<name><surname>Mohit</surname> <given-names>R</given-names></name>
<name><surname>Asadnia</surname> <given-names>A</given-names></name>
<name><surname>Maftooh</surname> <given-names>M</given-names></name>
<name><surname>Nassiri</surname> <given-names>M</given-names></name>
<etal/>
</person-group>. 
<article-title>Machine learning algorithms reveal potential miRNAs biomarkers in gastric cancer</article-title>. <source>Sci Rep</source>. (<year>2023</year>) <volume>13</volume>:<fpage>6147</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-023-32332-x</pub-id>, PMID: <pub-id pub-id-type="pmid">37061507</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<label>18</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Du</surname> <given-names>H</given-names></name>
<name><surname>Yang</surname> <given-names>Q</given-names></name>
<name><surname>Ge</surname> <given-names>A</given-names></name>
<name><surname>Zhao</surname> <given-names>C</given-names></name>
<name><surname>Ma</surname> <given-names>Y</given-names></name>
<name><surname>Wang</surname> <given-names>S</given-names></name>
</person-group>. 
<article-title>Explainable machine learning models for early gastric cancer diagnosis</article-title>. <source>Sci Rep</source>. (<year>2024</year>) <volume>14</volume>:<fpage>17457</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-024-67892-z</pub-id>, PMID: <pub-id pub-id-type="pmid">39075116</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<label>19</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shi</surname> <given-names>Y</given-names></name>
<name><surname>Fan</surname> <given-names>H</given-names></name>
<name><surname>Li</surname> <given-names>L</given-names></name>
<name><surname>Hou</surname> <given-names>Y</given-names></name>
<name><surname>Qian</surname> <given-names>F</given-names></name>
<name><surname>Zhuang</surname> <given-names>M</given-names></name>
<etal/>
</person-group>. 
<article-title>The value of machine learning approaches in the diagnosis of early gastric cancer: a systematic review and meta-analysis</article-title>. <source>World J Surg Oncol</source>. (<year>2024</year>) <volume>22</volume>:<fpage>40</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12957-024-03321-9</pub-id>, PMID: <pub-id pub-id-type="pmid">38297303</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<label>20</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Jiang</surname> <given-names>Y</given-names></name>
<name><surname>Zhang</surname> <given-names>Z</given-names></name>
<name><surname>Yuan</surname> <given-names>Q</given-names></name>
<name><surname>Wang</surname> <given-names>W</given-names></name>
<name><surname>Wang</surname> <given-names>H</given-names></name>
<name><surname>Li</surname> <given-names>T</given-names></name>
<etal/>
</person-group>. 
<article-title>Predicting peritoneal recurrence and disease-free survival from CT images in gastric cancer with multitask deep learning: a retrospective study</article-title>. <source>Lancet Digit Health</source>. (<year>2022</year>) <volume>4</volume>:<page-range>340&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S2589-7500(22)00040-1</pub-id>, PMID: <pub-id pub-id-type="pmid">35461691</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<label>21</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sinnarasan</surname> <given-names>VSP</given-names></name>
<name><surname>Paul</surname> <given-names>D</given-names></name>
<name><surname>Das</surname> <given-names>R</given-names></name>
<name><surname>Venkatesan</surname> <given-names>A</given-names></name>
</person-group>. 
<article-title>Gastric cancer biomarker candidates identified by machine learning and integrative bioinformatics: toward personalized medicine</article-title>. <source>OMICS</source>. (<year>2023</year>) <volume>27</volume>:<page-range>260&#x2013;72</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1089/omi.2023.0015</pub-id>, PMID: <pub-id pub-id-type="pmid">37229622</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<label>22</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hong</surname> <given-names>QQ</given-names></name>
<name><surname>Yan</surname> <given-names>S</given-names></name>
<name><surname>Zhao</surname> <given-names>YL</given-names></name>
<name><surname>Fan</surname> <given-names>L</given-names></name>
<name><surname>Yang</surname> <given-names>L</given-names></name>
<name><surname>Zhang</surname> <given-names>WB</given-names></name>
<etal/>
</person-group>. 
<article-title>Machine learning identifies the risk of complications after laparoscopic radical gastrectomy for gastric cancer</article-title>. <source>World J Gastroenterol</source>. (<year>2024</year>) <volume>30</volume>:<fpage>79</fpage>&#x2013;<lpage>90</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3748/wjg.v30.i1.79</pub-id>, PMID: <pub-id pub-id-type="pmid">38293327</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<label>23</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>HW</given-names></name>
<name><surname>Zhu</surname> <given-names>ZY</given-names></name>
<name><surname>Sun</surname> <given-names>YF</given-names></name>
<name><surname>Yuan</surname> <given-names>CY</given-names></name>
<name><surname>Wang</surname> <given-names>MH</given-names></name>
<name><surname>Wang</surname> <given-names>N</given-names></name>
<etal/>
</person-group>. 
<article-title>Machine learning algorithms able to predict the prognosis of gastric cancer patients treated with immune checkpoint inhibitors</article-title>. <source>World J Gastroenterol</source>. (<year>2024</year>) <volume>30</volume>:<page-range>4354&#x2013;66</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3748/wjg.v30.i40.4354</pub-id>, PMID: <pub-id pub-id-type="pmid">39494097</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<label>24</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zheng</surname> <given-names>X</given-names></name>
<name><surname>Wang</surname> <given-names>R</given-names></name>
<name><surname>Zhang</surname> <given-names>X</given-names></name>
<name><surname>Sun</surname> <given-names>Y</given-names></name>
<name><surname>Zhang</surname> <given-names>H</given-names></name>
<name><surname>Zhao</surname> <given-names>Z</given-names></name>
<etal/>
</person-group>. 
<article-title>A deep learning model and human-machine fusion for prediction of EBV-associated gastric cancer from histopathology</article-title>. <source>Nat Commun</source>. (<year>2022</year>) <volume>13</volume>:<fpage>2790</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-022-30459-5</pub-id>, PMID: <pub-id pub-id-type="pmid">35589792</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<label>25</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhou</surname> <given-names>CM</given-names></name>
<name><surname>Wang</surname> <given-names>Y</given-names></name>
<name><surname>Yang</surname> <given-names>JJ</given-names></name>
<name><surname>Zhu</surname> <given-names>Y</given-names></name>
</person-group>. 
<article-title>Predicting postoperative gastric cancer prognosis based on inflammatory factors and machine learning technology</article-title>. <source>BMC Med Inform Decis Mak</source>. (<year>2023</year>) <volume>23</volume>:<fpage>53</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12911-023-02150-2</pub-id>, PMID: <pub-id pub-id-type="pmid">37004065</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<label>26</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Arai</surname> <given-names>J</given-names></name>
<name><surname>Aoki</surname> <given-names>T</given-names></name>
<name><surname>Sato</surname> <given-names>M</given-names></name>
<name><surname>Niikura</surname> <given-names>R</given-names></name>
<name><surname>Suzuki</surname> <given-names>N</given-names></name>
<name><surname>Ishibashi</surname> <given-names>R</given-names></name>
<etal/>
</person-group>. 
<article-title>Machine learning-based personalized prediction of gastric cancer incidence using the endoscopic and histologic findings at the initial endoscopy</article-title>. <source>Gastrointest Endosc</source>. (<year>2022</year>) <volume>95</volume>:<page-range>864&#x2013;72</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.gie.2021.12.033</pub-id>, PMID: <pub-id pub-id-type="pmid">34998795</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<label>27</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hu</surname> <given-names>Y</given-names></name>
<name><surname>Wang</surname> <given-names>B</given-names></name>
<name><surname>Shi</surname> <given-names>C</given-names></name>
<name><surname>Ren</surname> <given-names>P</given-names></name>
<name><surname>Zhang</surname> <given-names>C</given-names></name>
<name><surname>Wang</surname> <given-names>Z</given-names></name>
<etal/>
</person-group>. 
<article-title>A machine learning approach to risk-stratification of gastric cancer based on tumour-infiltrating immune cell profiles</article-title>. <source>Ann Med</source>. (<year>2025</year>) <volume>57</volume>:<elocation-id>2489007</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/07853890.2025.2489007</pub-id>, PMID: <pub-id pub-id-type="pmid">40208029</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<label>28</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bai</surname> <given-names>Z</given-names></name>
<name><surname>Wang</surname> <given-names>H</given-names></name>
<name><surname>Han</surname> <given-names>J</given-names></name>
<name><surname>An</surname> <given-names>J</given-names></name>
<name><surname>Yang</surname> <given-names>Z</given-names></name>
<name><surname>Mo</surname> <given-names>X</given-names></name>
</person-group>. 
<article-title>Multiomics integration and machine learning reveal prognostic programmed cell death signatures in gastric cancer</article-title>. <source>Sci Rep</source>. (<year>2024</year>) <volume>14</volume>:<fpage>31060</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-024-82233-w</pub-id>, PMID: <pub-id pub-id-type="pmid">39730893</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1183145">Md. Rizwanullah</ext-link>, Jamia Hamdard University, India</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1782261">Mohd Rabi Bazaz</ext-link>, University of Wisconsin-Madison, United States</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1782261">Mohd Rihan</ext-link>, USF Health, United States</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3045929">Shahnawaz Ahmad</ext-link>, Jamia Hamdard University, India</p></fn>
</fn-group>
</back>
</article>