<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2026.1770037</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Development and validation of a pathomics-driven machine learning model for individualized prediction of neoadjuvant chemotherapy response and early recurrence in HR-positive, HER2-negative breast cancer</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Yue</surname><given-names>Jiaxian</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Liu</surname><given-names>Jiaxiang</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2151311/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Kang</surname><given-names>Xiyu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Yuan</surname><given-names>Pei</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname><given-names>Wei</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname><given-names>Zhanyu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Shang</surname><given-names>Chao</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Shang</surname><given-names>Qingyao</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/824602/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname><given-names>Guangyu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Dong</surname><given-names>Xubin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/954032/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname><given-names>Tianxiao</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname><given-names>Dongmin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Wang</surname><given-names>Shuhao</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Yang</surname><given-names>Chenxuan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Ying</surname><given-names>Jianming</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1636175/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Wang</surname><given-names>Xin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/768683/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Department of Breast Surgical Oncology, National Cancer Center/National Clinical Research Center for Cancer/Cancer Hospital, Chinese Academy of Medical Sciences and Peking Union Medical College</institution>, <city>Beijing</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>Beijing Tsinghua Changgung Hospital, School of Clinical Medicine, Tsinghua University</institution>, <city>Beijing</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff3"><label>3</label><institution>Department of Pathology, National Cancer Center/National Clinical Research Center for Cancer/Cancer Hospital, Chinese Academy of Medical Sciences and Peking Union Medical College</institution>, <city>Beijing</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff4"><label>4</label><institution>Thorough Lab, Thorough Future</institution>, <city>Beijing</city>,&#xa0;<country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Xin Wang, <email xlink:href="mailto:xinwang@vip.126.com">xinwang@vip.126.com</email>; Jianming Ying, <email xlink:href="mailto:jmying@cicams.ac.cn">jmying@cicams.ac.cn</email>; Chenxuan Yang, <email xlink:href="mailto:yangcx13@foxmail.com">yangcx13@foxmail.com</email>; Shuhao Wang, <email xlink:href="mailto:to@shuhao.wang">to@shuhao.wang</email></corresp>
<fn fn-type="equal" id="fn003">
<label>&#x2020;</label>
<p>These authors have contributed equally to this work and share first authorship</p></fn>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-23">
<day>23</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>16</volume>
<elocation-id>1770037</elocation-id>
<history>
<date date-type="received">
<day>17</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>14</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Yue, Liu, Kang, Yuan, Wang, Wang, Shang, Shang, Li, Dong, Wang, Yang, Wang, Yang, Ying and Wang.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Yue, Liu, Kang, Yuan, Wang, Wang, Shang, Shang, Li, Dong, Wang, Yang, Wang, Yang, Ying and Wang</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-23">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Hormone receptor (HR)-positive, human epidermal growth factor receptor 2 (HER2)-negative breast cancer is the most prevalent subtype among women but has a modest response to neoadjuvant chemotherapy (NAC). Accurately predicting NAC efficacy and recurrence risk remains challenging, as conventional clinical and molecular markers have limited predictive power. Advances in digital pathology and artificial intelligence now enable quantitative pathomics analysis, offering new opportunities for precise prediction and prognostic assessment.</p>
</sec>
<sec>
<title>Methods</title>
<p>In this retrospective study, 162 HR-positive, HER2-negative breast cancer patients treated with NAC between 2014 and 2021 were included. Hematoxylin and eosin (H&amp;E)-stained pretreatment biopsy slides were digitized and analyzed using Vision Transformer (ViT) and Unified Network for Image (UNI) deep learning models to extract pathomic features. Thirteen clinical variables were collected. After least absolute shrinkage and selection operator (LASSO)-based feature selection, multiple machine learning models were developed for both response prediction and prognostic evaluation of recurrence, with performance evaluated by receiver operating characteristic (ROC) curves, area under the curve (AUC), sensitivity, specificity, confusion matrix, calibration curves, and decision curve analysis (DCA). Furthermore, SHapley Additive exPlanations (SHAP) was used to rank the importance of features for each model.</p>
</sec>
<sec>
<title>Results</title>
<p>The CatBoost model achieved the best predictive performance (AUC = 0.900 in training and 0.848 in validation) when a combination of clinical and pathomics-derived variables was used. Key predictive factors included Ki-67 expression, age, histological grade, PR status, and prominent pathomic features. A Kaplan&#x2013;Meier survival plot indicated that regardless of stratification by MP grade or pCR status, there was no significant difference in recurrence status or survival outcomes between the two groups in this cohort. Furthermore, the recurrence models developed mainly using pathomics were strongly accurate for predicting 1-year recurrence (AUC = 0.907 in training and 0.769 in validation).</p>
</sec>
<sec>
<title>Conclusions</title>
<p>Integrating pathomic features with clinical variables via machine learning enables robust pretreatment prediction of NAC efficacy and short-term recurrence in HR-positive, HER2-negative breast cancer. This approach has the potential to offer a clinically practical tool to optimize individualized therapy and improve patient management, highlighting the translational value of AI-powered digital pathology in breast cancer care.</p>
</sec>
</abstract>
<kwd-group>
<kwd>artificial intelligence</kwd>
<kwd>breast cancer</kwd>
<kwd>HR-positive/HER2-Negative</kwd>
<kwd>machine learning</kwd>
<kwd>neoadjuvant chemotherapy</kwd>
<kwd>pathomics</kwd>
<kwd>prediction</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This research was supported by the Beijing Natural Science Foundation (JQ23032 granted to XW), (7252119 granted to CY), (L259071 granted to JL), National Natural Science Foundation of China (82373060 and 82573522 granted to XW), (82573118 and 82203688 granted to CY), Noncommunicable Chronic Diseases-National Science and Technology Major Project (2023ZD0502200 granted to XW), CAMS Innovation Fund for Medical Sciences (CIFMS) (2023-I2M-C&amp;T-A-009 granted to XW), Capital&#x2019;s Funds for Health Improvement and Re-search (CFH) (2024-2-4025 granted to XW), Beijing AI+Health Cultivation Innovation Project (No. Z241100007724001 granted to SW), Beijing Nova Program (No. 20240484628 granted to SW).</funding-statement>
</funding-group>
<counts>
<fig-count count="6"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="43"/>
<page-count count="18"/>
<word-count count="8187"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Breast Cancer</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Breast cancer is among the most common malignant tumors among women, and as its incidence has continued to rise in recent years, it has become a leading cause of cancer-related mortality in women worldwide (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). Among the molecular subtypes of breast cancer, the hormone receptor (HR)-positive, human epidermal growth factor receptor 2 (HER2)-negative subtype accounts for approximately 60&#x2013;70% of all cases and represents the most prevalent form of the disease (<xref ref-type="bibr" rid="B3">3</xref>). Although this subtype of breast cancer generally exhibits relatively indolent biological behavior and favorable long-term prognosis, a proportion of patients experience recurrence and progression during treatment. Optimizing treatment strategies and accurately predicting treatment response and prognosis in this population remain significant challenges in clinical management.</p>
<p>Neoadjuvant chemotherapy (NAC), a crucial component of comprehensive breast cancer management, can reduce tumor volume prior to surgery, thereby facilitating surgical intervention, increasing the breast-conserving rate, and providing a window for assessing tumor biological response (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B5">5</xref>). However, patients with HR-positive, HER2-negative breast cancer generally exhibit a low pathological complete response (pCR) rate to NAC, with marked interindividual heterogeneity (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B7">7</xref>). Consequently, some patients are subjected to the toxicity of chemotherapy without benefitting from NAC, and they may even miss the optimal timing for surgery. Although previous studies have explored the predictive value of clinical parameters and conventional molecular pathological markers, there remains a lack of effective tools in current clinical practice to accurately predict NAC efficacy for this subtype prior to treatment (<xref ref-type="bibr" rid="B8">8</xref>, <xref ref-type="bibr" rid="B9">9</xref>). In addition, the survival benefit associated with pCR in this subtype remains controversial (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B11">11</xref>). Therefore, accurately identifying the high-risk population for recurrence after NAC and promptly adjusting therapeutic strategies are critical for maximizing patient benefit and improving survival outcomes.</p>
<p>Recent advances in digital pathology and artificial intelligence (AI) technologies have provided new approaches for addressing the aforementioned challenges. Pathomics, an emerging research methodology that enables high-throughput, automated, and quantitative feature extraction from digitized pathological slides, has been increasingly refined. This technique objectively and comprehensively reveals the histological heterogeneity and complexity of tumors, demonstrating promising applications in cancer diagnosis, prognostic assessment, and treatment response prediction (<xref ref-type="bibr" rid="B12">12</xref>&#x2013;<xref ref-type="bibr" rid="B14">14</xref>). Concurrently, machine learning (ML) algorithms, which simulate human behavior to enable intelligent learning and data processing, have become powerful tools for assisting in disease diagnosis and treatment (<xref ref-type="bibr" rid="B15">15</xref>).</p>
<p>In recent years, several studies have attempted to predict the efficacy of NAC in breast cancer by constructing models based on pathomics feature extraction combined with ML approaches. For example, li et&#xa0;al. (<xref ref-type="bibr" rid="B16">16</xref>) developed a pathomics-based model to predict the Residual Cancer Burden (RCB) score in breast cancer patients receiving NAC, while Fisher et&#xa0;al. (<xref ref-type="bibr" rid="B12">12</xref>)explored the role of ML integrated with digital pathology image analysis in predicting the response to NAC in triple-negative breast cancer. However, these studies generally did not focus on the HR-positive, HER2-negative subgroup, which is less sensitive to chemotherapy, and mostly targeted a single endpoint (such as pCR), rarely addressing early relapse risk, an equally critical factor for clinical decision-making, thereby limiting the models&#x2019; utility in personalized treatment and follow-up management.</p>
<p>In this context, in the present study, pathomic features with clinical data and multiple machine learning (ML) algorithms were used to develop a predictive model for the efficacy of neoadjuvant chemotherapy (NAC) in patients with HR-positive, HER2-negative breast cancer. Furthermore, the relationship between NAC response and patient prognosis was systematically analyzed, and the value of pathomic information in prognosis prediction was explored. By applying rigorous and reproducible modeling and validation procedures, the aim of this study was to provide an accurate and clinically practical tool for predicting therapeutic response and recurrence risk. Such a tool has the potential to optimize treatment decision-making and advance the implementation of precision therapy for this breast cancer subtype.</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Patient selection</title>
<p>In this retrospective study, patients who were diagnosed with breast cancer between Jan. 2014 and Dec. 2021 at the Cancer Hospital Chinese Academy of Medical Sciences were included (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>). The inclusion criteria were as follows: female patients (<xref ref-type="bibr" rid="B1">1</xref>) who were diagnosed with primary breast cancer by pathological examination (<xref ref-type="bibr" rid="B2">2</xref>), who underwent pre-NAC core needle biopsy and surgical treatment (<xref ref-type="bibr" rid="B3">3</xref>), whose biopsy pathology confirmed that they were hormone receptor-positive and HER2-negative, and (<xref ref-type="bibr" rid="B4">4</xref>) who underwent neoadjuvant therapy before surgery. The exclusion criteria were as follows (<xref ref-type="bibr" rid="B1">1</xref>): patients who were diagnosed with bilateral breast cancer (<xref ref-type="bibr" rid="B2">2</xref>), patients who underwent palliative surgery (<xref ref-type="bibr" rid="B3">3</xref>), patients who lacked biopsy H&amp;E-stained histopathological slide scan images or whose scan images were of low quality, and (<xref ref-type="bibr" rid="B4">4</xref>) patients who underwent neoadjuvant endocrine therapy. Patient information regarding age; clinical stage; tumor grade; ER, PR, and Ki67 levels; neoadjuvant chemotherapy regimen; surgical approach; postoperative pathological stage; height; weight; menopausal status; family history; tumor position; and metabolic indicators, including blood glucose, TG, and LDL-C levels, was collected from the medical records. Patients were followed up for a median duration of 66 months.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Flow diagram of patient cohort selection.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1770037-g001.tif">
<alt-text content-type="machine-generated">Flowchart showing selection of patients for a study from 20,833 breast cancer surgical cases between 2014 and 2021, filtering by HR+, HER2&#x2013; status and other criteria, leading to 162 eligible patients after exclusions.</alt-text>
</graphic></fig>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Pathology slide scanning and feature extraction</title>
<p>On the basis of Vision Transformer (ViT) and Unified Network for Image (UNI) pretrained models, an integrated framework was constructed in this study to enable efficient and precise feature extraction from pathological slides. The workflow comprised the following main stages:</p>
<sec id="s2_2_1">
<label>2.2.1</label>
<title>Input and image patching</title>
<p>Whole-slide images (WSIs) were obtained by scanning H&amp;E-stained histopathological slides from pre-neoadjuvant core needle biopsy specimens. To facilitate model processing, each WSI was divided into multiple image patches of size 224&#xd7;224 pixels as preprocessing. Each patch was independently processed for feature extraction in the subsequent steps.</p>
<p>Each 224&#xd7;224 patch was subdivided into nonoverlapping 16&#xd7;16 subpatches, which were then flattened into a sequence of patch tokens. Afterward, each patch token was linearly projected into a fixed-dimensional vector space, resulting in a set of patch embeddings. After linear projection, the input feature dimension was [<italic>B</italic>, <italic>N</italic>, <italic>D</italic>], where <inline-formula>
<mml:math display="inline" id="im1"><mml:mi>B</mml:mi></mml:math></inline-formula> denotes the batch size (set to 2 in this study), <inline-formula>
<mml:math display="inline" id="im2"><mml:mi>N</mml:mi></mml:math></inline-formula> is the number of tokens per image (<inline-formula>
<mml:math display="inline" id="im3"><mml:mrow><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mn>224</mml:mn><mml:mo stretchy="false">/</mml:mo><mml:mn>16</mml:mn><mml:mo stretchy="false">)</mml:mo><mml:mo>&#xd7;</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mn>224</mml:mn><mml:mo stretchy="false">/</mml:mo><mml:mn>16</mml:mn><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mn>196</mml:mn></mml:mrow></mml:math></inline-formula>), and <inline-formula>
<mml:math display="inline" id="im4"><mml:mi>D</mml:mi></mml:math></inline-formula> is the embedding dimension (<inline-formula>
<mml:math display="inline" id="im5"><mml:mrow><mml:mi>D</mml:mi><mml:mo>=</mml:mo><mml:mn>1024</mml:mn></mml:mrow></mml:math></inline-formula>). An additional class token (CLS token) was added to the sequence of the patch embeddings to aggregate the global information from the entire image.</p>
</sec>
<sec id="s2_2_2">
<label>2.2.2</label>
<title>Transformer encoder</title>
<p>The patch embeddings, including the CLS token, were input into a transformer encoder. Through the multihead self-attention mechanism, the encoder modeled global interactions among all the patches, thereby capturing long-range dependencies and contextual information. The output of the transformer encoder maintained the dimensionality [<italic>B</italic>, <italic>N</italic>, <italic>D</italic>], meaning that each patch token was represented by a contextually enhanced feature vector.</p>
</sec>
<sec id="s2_2_3">
<label>2.2.3</label>
<title>Global feature aggregation (Global pooling)</title>
<p>The output of the transformer encoder underwent global average pooling, aggregating the feature vectors from all the patch tokens to generate a global semantic representation of the entire image. The resulting feature dimension was [<italic>B</italic>, <italic>D</italic>], indicating that each image was encoded as a 1024-dimensional feature vector. This feature vector was subsequently saved for downstream analyses or further processing.</p>
</sec>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Prediction model construction and validation</title>
<p>The construction and validation process of the prediction model is illustrated in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;S1</bold></xref>. The detailed steps are as follows:</p>
<sec id="s2_3_1">
<label>2.3.1</label>
<title>Construction of training and validation sets with feature selection via LASSO regression</title>
<p>The model construction and validation processes were conducted with R 4.3.1. A total of 162 patients were randomly divided into a training set and a validation set in a 70% to 30% ratio. Given the relatively low number of positive events, stratified splitting was employed to ensure balanced event distribution. For patients with multiple slides, the mean of each pathomic feature across slides was calculated to construct models at the patient level.</p>
<p>Least absolute shrinkage and selection operator (LASSO) regression was applied to both clinical variables and the previously extracted 1024-dimensional pathomic features to identify variables for subsequent model construction (clinical variables excluded any postneoadjuvant information such as post-operative pathological stage). Prior to lasso regression, variables with zero standard deviation (SD = 0) were removed to eliminate noninformative features and reduce noise and computational burden. After the above data preprocessing steps, a 10-fold cross-validation approach (with the number of folds reduced to as few as 2 if the number of positive events was insufficient) was used. The optimal regularization parameter &#x3bb; was chosen on the basis of an &#x201c;acceptable AUC loss threshold&#x201d;, balancing model performance with the retention of potential predictive variables. This feature selection process was conducted exclusively within the training set.</p>
</sec>
<sec id="s2_3_2">
<label>2.3.2</label>
<title>Hyperparameter optimization</title>
<p>To determine the optimal hyperparameters for each model, 5-fold cross-validation combined with a global random search strategy was employed. The training set was randomly divided into five folds; for each iteration, four folds were used for model training with randomly selected hyperparameters, and the remaining fold served as the validation set to calculate the area under the curve (AUC) and Brier score. The process was repeated until each fold served as the validation set. The scoring metric was calculated as follows: <italic>Score</italic>=mean(AUC)&#x2212;<italic>&#x3b1;</italic>&#xd7;mean(Brier),(<italic>&#x3b1;</italic> = 0.5). This process was repeated 50 times, and the hyperparameter set with the highest score was selected for subsequent model construction.</p>
</sec>
<sec id="s2_3_3">
<label>2.3.3</label>
<title>Out-of-fold estimation for optimal tree number and model evaluation on the training set</title>
<p>To avoid optimism bias, out-of-fold (OOF) prediction (F = 5) was used to accurately assess model performance on the training set. To control model complexity, the outer training subset in each OOF split was divided into inner folds, and a 5-fold cross-validation was conducted to estimate the optimal number of iterations and train the model. Early stopping was applied during inner fold training, and the &#x201c;median&#x201d; number of best-trees from all folds was used as the robust number of iterations.</p>
<p>To increase the stability and predictive performance, a weighted ensemble model comprising five submodels was constructed: Each submodel randomly sampled a feature subset (80&#x2013;100% of the features were used). For each submodel, the mean AUC from the inner folds was recorded as the ensemble weight, and the median best-trees served as the fixed iteration count. Each submodel was retrained on the outer training subset using this fixed iteration number. Predictions were generated for the outer validation subset, and the mean AUC from the inner folds was used as the ensemble weight to aggregate the OOF probabilities, which represented the final training set predictions for each algorithm.</p>
</sec>
<sec id="s2_3_4">
<label>2.3.4</label>
<title>Platt calibration of OOF predictions</title>
<p>To align model-predicted probabilities with true event rates for reliable Brier scores and threshold-based decision-making, Platt calibration was performed on the OOF probabilities. The calibration function was defined as <inline-formula>
<mml:math display="inline" id="im6"><mml:mrow><mml:msub><mml:mi>p</mml:mi><mml:mrow><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>&#x3c3;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>a</mml:mi><mml:mo>+</mml:mo><mml:mi>b</mml:mi><mml:mo>&#xb7;</mml:mo><mml:mtext>logit</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:mi>p</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>, where <inline-formula>
<mml:math display="inline" id="im7"><mml:mi>&#x3c3;</mml:mi></mml:math></inline-formula> is the sigmoid function.</p>
</sec>
<sec id="s2_3_5">
<label>2.3.5</label>
<title>Retraining on the complete training set and validation</title>
<p>The final model was trained using the entire training set. For each submodel, a new feature subset was sampled. Inner folds of the complete training set were used to determine the mean AUC (ensemble weight) and median tree number (fixed iteration count). Each submodel was retrained on the full training set with a fixed iteration count, and all five submodels were saved. The ensemble model was then evaluated on the independent validation set to generate raw probability predictions, which were subsequently calibrated using the Platt calibrator fitted on the OOF results, providing the final probability estimates on the validation set.</p>
</sec>
<sec id="s2_3_6">
<label>2.3.6</label>
<title>Model evaluation</title>
<p>On the basis of the above training strategy, predictive models were constructed using five machine learning algorithms: CatBoost, random forest, LightGBM, XGBoost, and support vector machine (SVM). Model performance was assessed using receiver operating characteristic (ROC) curves, area under the curve (AUC), sensitivity, specificity, confusion matrix, calibration curves, and decision curve analysis (DCA). SHapley Additive exPlanations (SHAP) was used to rank the importance of features for each model.</p>
</sec>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Statistics</title>
<p>All the statistical analyses in this study were performed using R 4.3.1. The main analytical workflow included the description and comparison of baseline characteristics and clinical variables between the two groups, Kaplan&#x2013;Meier survival analyses with log-rank tests, and both univariable and multivariable Cox proportional hazards regression modeling. Unless otherwise specified, all the statistical tests were two-sided, and the significance threshold was set at P&lt;0.05. For comparisons of continuous variables between groups, the Shapiro&#x2013;Wilk test was first used within each group to assess the normality of the distribution. If both groups exhibited an approximately normal distribution, the Welch t test (not assuming equal variances) was applied; otherwise, the Wilcoxon rank-sum test (Mann&#x2013;Whitney U test) was used. For categorical variables, the Pearson chi-square test was used preferentially; when any expected cell count was less than 5 or the chi-square test could not be computed, Fisher&#x2019;s exact test was employed. To compare the prognostic outcomes between the two groups, a Kaplan&#x2013;Meier survival analysis was conducted according to the predefined grouping variable, and survival curves were plotted with P values derived from the log-rank test. Risk tables and reference lines for median survival are also displayed. To quantify the associations between each candidate variable and overall survival (OS) and disease-free survival (DFS), univariable and multivariable Cox proportional hazards regression analyses were performed, and the hazard ratio (HR) and its 95% confidence interval (CI) were reported. Candidate variables included age, cT, cN, surgical approach, ER, PR, Ki-67, grade, chemotherapy regimen, ypT stage, ypN stage, menopausal status, family history, BMI, LDL-C level, TG level, glucose level, MP grade, and pCR. Considering that the MPgrade and pCR may act as mediators of the effects of other variables on prognosis, these two variables were not included as adjustment factors when multivariable Cox proportional hazards models were constructed. For each candidate variable other than MPgrade or pCR, all the variables except MPgrade, pCR, and the variable under analysis itself were included as covariates (to avoid adjusting for the variable being analyzed).</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Ethics approval and consent to participate</title>
<p>All patient-related studies were approved by the Ethics Committee of National Cancer Center/Cancer Hospital, Chinese Academy of Medical Sciences and Peking Union Medical College(24/496-4776). All enrolled patients provided informed written consent.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Baseline characteristics of the enrolled patients</title>
<p><xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref> summarizes the baseline characteristics of all the patients in the study. A total of 162 breast cancer patients were enrolled, all of whom were HR-positive, HER2-negative and received neoadjuvant chemotherapy (NAC) (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>). The Miller&#x2013;Payne (MP) grading system was used to evaluate postoperative H&amp;E-stained histopathological slides, and patients were stratified into a response group and a nonresponse group according to MP grade. The response group comprised 34 patients (21%) with MP grades 4 (a marked reduction in invasive tumor cells by more than 90%) or 5 (no invasive tumor cells remaining in the tumor bed) (<xref ref-type="bibr" rid="B17">17</xref>), whereas the nonresponse group included 128 patients (79%) with MP grades 1, 2, or 3. There were significant differences between the two groups in terms of age at diagnosis, menopausal status, surgical approach, estrogen receptor (ER) expression, progesterone receptor (PR) expression, Ki-67 index, and histological grade (all P&lt;0.05). Specifically, compared with patients in the nonresponse group, patients in the response group were younger at diagnosis (43.65 vs. 52.02 years), with a greater proportion of premenopausal women (73.5% vs. 52.3%). Moreover, the rate of breast-conserving surgery (BCS) was greater in the response group (20.6% vs. 4.7%), reflecting the impact of NAC efficacy on surgical strategy. In terms of tumor biological features, the response group had lower ER (0.46 vs. 0.81) and PR (0.33 vs. 0.55) expression but a higher Ki-67 index (0.49 vs. 0.27) and higher histological grade than the nonresponse group did, indicating that poorly differentiated and highly proliferative tumors&#x2014;biologically more similar to the triple-negative phenotype, despite being HR-positive, HER2-negative&#x2014;may be more sensitive to chemotherapy. No significant differences in other clinical variables, including tumor stage, chemotherapy regimen, body mass index (BMI), family history, or metabolic parameters, were detected between the two groups (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Clinical characteristics of patients.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Characteristics</th>
<th valign="middle" align="left">Category</th>
<th valign="middle" align="left">Nonresponse (n=128)</th>
<th valign="middle" align="left">Response (n=34)</th>
<th valign="middle" align="left">P value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Age</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left">52.02 &#xb1; 11.68</td>
<td valign="middle" align="left">43.65 &#xb1; 10.63</td>
<td valign="middle" align="left">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="left">Clinical Stage</td>
<td valign="middle" align="left">II</td>
<td valign="middle" align="left">30 (23.4%)</td>
<td valign="middle" align="left">9 (26.5%)</td>
<td valign="middle" align="left">0.887</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">III</td>
<td valign="middle" align="left">98 (76.6%)</td>
<td valign="middle" align="left">25 (73.5%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">cT</td>
<td valign="middle" align="left">1</td>
<td valign="middle" align="left">14 (10.9%)</td>
<td valign="middle" align="left">2 (5.9%)</td>
<td valign="middle" align="left">0.397</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">2</td>
<td valign="middle" align="left">65 (50.8%)</td>
<td valign="middle" align="left">22 (64.7%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">3</td>
<td valign="middle" align="left">16 (12.5%)</td>
<td valign="middle" align="left">5 (14.7%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">4</td>
<td valign="middle" align="left">33 (25.8%)</td>
<td valign="middle" align="left">5 (14.7%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">cN</td>
<td valign="middle" align="left">0</td>
<td valign="middle" align="left">12 (9.4%)</td>
<td valign="middle" align="left">1 (2.9%)</td>
<td valign="middle" align="left">0.626</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">1</td>
<td valign="middle" align="left">34 (26.6%)</td>
<td valign="middle" align="left">9 (26.5%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">2</td>
<td valign="middle" align="left">45 (35.2%)</td>
<td valign="middle" align="left">15 (44.1%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">3</td>
<td valign="middle" align="left">37 (28.9%)</td>
<td valign="middle" align="left">9 (26.5%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">Surgery</td>
<td valign="middle" align="left">BCS</td>
<td valign="middle" align="left">6 (4.7%)</td>
<td valign="middle" align="left">7 (20.6%)</td>
<td valign="middle" align="left">0.007</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Mastectomy</td>
<td valign="middle" align="left">122 (95.3%)</td>
<td valign="middle" align="left">27 (79.4%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">ER</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left">0.81 &#xb1; 0.19</td>
<td valign="middle" align="left">0.46 &#xb1; 0.39</td>
<td valign="middle" align="left">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="left">PR</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left">0.55 &#xb1; 0.31</td>
<td valign="middle" align="left">0.33 &#xb1; 0.31</td>
<td valign="middle" align="left">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="left">KI67</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left">0.27 &#xb1; 0.14</td>
<td valign="middle" align="left">0.49 &#xb1; 0.28</td>
<td valign="middle" align="left">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="left">Grade</td>
<td valign="middle" align="left">I</td>
<td valign="middle" align="left">9 (7.0%)</td>
<td valign="middle" align="left">0 (0.0%)</td>
<td valign="middle" align="left">&lt;0.001</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">II</td>
<td valign="middle" align="left">105 (82.0%)</td>
<td valign="middle" align="left">21 (61.8%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">III</td>
<td valign="middle" align="left">14 (10.9%)</td>
<td valign="middle" align="left">13 (38.2%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">Tumor Position</td>
<td valign="middle" align="left">L</td>
<td valign="middle" align="left">66 (51.6%)</td>
<td valign="middle" align="left">18 (52.9%)</td>
<td valign="middle" align="left">1.000</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">62 (48.4%)</td>
<td valign="middle" align="left">16 (47.1%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">Chemotherapy Regimen</td>
<td valign="middle" align="left">AT-based</td>
<td valign="middle" align="left">105 (82.0%)</td>
<td valign="middle" align="left">27 (79.4%)</td>
<td valign="middle" align="left">0.727</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">A-based</td>
<td valign="middle" align="left">3 (2.3%)</td>
<td valign="middle" align="left">0 (0.0%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">T-based</td>
<td valign="middle" align="left">20 (15.6%)</td>
<td valign="middle" align="left">7 (20.6%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">Height</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left">159.39 &#xb1; 5.67</td>
<td valign="middle" align="left">159.62 &#xb1; 4.88</td>
<td valign="middle" align="left">0.817</td>
</tr>
<tr>
<td valign="middle" align="left">Weight</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left">62.86 &#xb1; 10.20</td>
<td valign="middle" align="left">60.24 &#xb1; 8.96</td>
<td valign="middle" align="left">0.147</td>
</tr>
<tr>
<td valign="middle" align="left">BMI</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left">24.77 &#xb1; 4.13</td>
<td valign="middle" align="left">23.60 &#xb1; 2.98</td>
<td valign="middle" align="left">0.201</td>
</tr>
<tr>
<td valign="middle" align="left">Menopausal Status</td>
<td valign="middle" align="left">NO</td>
<td valign="middle" align="left">67 (52.3%)</td>
<td valign="middle" align="left">25 (73.5%)</td>
<td valign="middle" align="left">0.043</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">YES</td>
<td valign="middle" align="left">61 (47.7%)</td>
<td valign="middle" align="left">9 (26.5%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">Family History</td>
<td valign="middle" align="left">NO</td>
<td valign="middle" align="left">92 (71.9%)</td>
<td valign="middle" align="left">20 (58.8%)</td>
<td valign="middle" align="left">0.209</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">YES</td>
<td valign="middle" align="left">36 (28.1%)</td>
<td valign="middle" align="left">14 (41.2%)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">LDL-C</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left">3.12 &#xb1; 0.86</td>
<td valign="middle" align="left">2.90 &#xb1; 0.94</td>
<td valign="middle" align="left">0.204</td>
</tr>
<tr>
<td valign="middle" align="left">TG</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left">1.44 &#xb1; 1.01</td>
<td valign="middle" align="left">1.18 &#xb1; 0.66</td>
<td valign="middle" align="left">0.148</td>
</tr>
<tr>
<td valign="middle" align="left">Glucose</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left">5.78 &#xb1; 1.67</td>
<td valign="middle" align="left">5.65 &#xb1; 1.59</td>
<td valign="middle" align="left">0.263</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Construction and validation of the predictive model for neoadjuvant chemotherapy response</title>
<p>The workflow for model construction is shown in <xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>. For each patient, 13 clinical variables and 1,024 pathological feature variables were extracted on the basis of the scanning and feature extraction of core needle biopsy H&amp;E-stained histopathological slides. To mitigate the risk of model overfitting due to an excessive number of variables, least absolute shrinkage and selection operator (LASSO) regression was employed for further variable selection. In LASSO regression, the optimal set of retained variables is determined by the choice of the regularization parameter &#x3bb;. We utilized 10-fold cross-validation and selected the optimal &#x3bb; based on a prespecified &#x201c;acceptable AUC loss threshold,&#x201d; which balances model performance and the retention of potentially informative predictors; specifically, the maximum absolute decrease in the area under the curve (AUC) was set to 0.01 (<xref ref-type="fig" rid="f3"><bold>Figures&#xa0;3A, B</bold></xref>). Ultimately, 55 variables were retained for model development, comprising six clinical variables&#x2014;PR (progesterone receptor), Ki-67, glucose, BMI, age, and histological grade&#x2014;and 49 pathological feature variables. Multiple machine learning models, including CatBoost, random forest, LightGBM, XGBoost, and support vector machine (SVM), were subsequently developed, and their predictive performances were assessed on both the training and validation cohorts (<xref ref-type="fig" rid="f3"><bold>Figures&#xa0;3C, D</bold></xref>; <xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>). Among these models, CatBoost demonstrated the best performance in the validation set, with an AUC of 0.848, a sensitivity of 0.818, a Brier score of 0.103, and a strong specificity of 0.795, all of which indicate excellent predictive accuracy and stability (<xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4A, B</bold></xref>). Further assessment revealed that the confusion matrix for CatBoost contained a large number of true positives and true negatives (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4C</bold></xref>). Decision curve analysis (DCA) revealed that the net benefit curve of the model exceeded that of both the &#x201c;treat all&#x201d; and &#x201c;treat none&#x201d; strategies (representing scenarios where all or none of the patients received NAC, respectively), further supporting its clinical utility (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4D</bold></xref>). In addition, calibration curve analysis demonstrated good concordance between the predicted and observed probabilities of NAC response (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4E</bold></xref>). On the basis of these comprehensive assessments, the CatBoost model was selected as the final predictive model. Finally, analysis of the top 20 most important variables included in the CatBoost model revealed that Ki-67 ranked as the second most influential predictor. Other clinical variables in the top 20 included age, histological grade, and PR, which is consistent with our previous analysis of baseline patient characteristics (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4F</bold></xref>). The remaining top predictors were pathological feature variables, highlighting the critical role of pathology-derived features in the prediction of NAC response.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Workflow of study. The clinical information of 162 HR+/HER2- breast cancer patients and HE-stained pathological slide images from core needle biopsies before neoadjuvant chemotherapy were retrospectively collected. The ViT and UNI pretrained models were used to extract features, ultimately yielding 1024 pathological features. These features were combined with 13 collected clinical information features, and LASSO regression was used for feature selection. Selected features were subsequently obtained for efficacy prediction and the construction of the prognostic model. The validation and performance evaluation of the models were subsequently performed on the validation set, and the importance ranking of the features included in the models was determined. HE, hematoxylin and eosin; ViT, Vision Trans-former; UNI, Unified Network for Image; LASSO, least absolute shrinkage and selection operator.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1770037-g002.tif">
<alt-text content-type="machine-generated">Flowchart depicting a machine learning workflow for medical prognostic modeling. Steps include training and validation sets, feature extraction from images and clinical data, feature selection with LASSO, model construction for efficacy and recurrence prediction, and model validation categorizing responses and prognosis, followed by model evaluation and feature analysis.</alt-text>
</graphic></fig>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Selection process for the feature and machine learning algorithm for the nac efficacy prediction model. <bold>(A, B)</bold> Cross-validation curves and coefficient regularization paths from LASSO regression for feature selection; the optimal regularization parameter &#x3bb; was chosen on the basis of an &#x201c;acceptable AUC loss threshold&#x201d;. <bold>(C, D)</bold> Summary of the ROC curves and AUC values obtained for the multiple machine learning models in the training set (70%) and validation set (30%).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1770037-g003.tif">
<alt-text content-type="machine-generated">Four-panel data visualization showing: panel A, a cross-validated AUC plot with error bars for different log lambda values; panel B, LASSO coefficient paths across log lambda values; panel C, training ROC curves for five classifiers with AUC values, SVM performing best; panel D, validation ROC curves for the same classifiers with AUC values, Catboost showing the highest validation AUC.</alt-text>
</graphic></fig>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Summary of the AUC values and predictive efficacy metrics obtained for the multiple machine learning models in the training set (70%) and validation set (30%).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" colspan="7" align="center">Training set</th>
</tr>
<tr>
<th valign="middle" align="left">Models</th>
<th valign="middle" align="left">AUC</th>
<th valign="middle" align="left">Sensitivity</th>
<th valign="middle" align="left">Specificity</th>
<th valign="middle" align="left">Accuracy</th>
<th valign="middle" align="left">Threshold</th>
<th valign="middle" align="left">Brier</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Catboost</td>
<td valign="middle" align="left">0.900</td>
<td valign="middle" align="left">0.870</td>
<td valign="middle" align="left">0.820</td>
<td valign="middle" align="left">0.830</td>
<td valign="middle" align="left">0.126</td>
<td valign="middle" align="left">0.113</td>
</tr>
<tr>
<td valign="middle" align="left">RF</td>
<td valign="middle" align="left">0.911</td>
<td valign="middle" align="left">0.913</td>
<td valign="middle" align="left">0.831</td>
<td valign="middle" align="left">0.848</td>
<td valign="middle" align="left">0.242</td>
<td valign="middle" align="left">0.113</td>
</tr>
<tr>
<td valign="middle" align="left">lightGBM</td>
<td valign="middle" align="left">0.944</td>
<td valign="middle" align="left">0.957</td>
<td valign="middle" align="left">0.876</td>
<td valign="middle" align="left">0.893</td>
<td valign="middle" align="left">0.083</td>
<td valign="middle" align="left">0.082</td>
</tr>
<tr>
<td valign="middle" align="left">Xgboost</td>
<td valign="middle" align="left">0.874</td>
<td valign="middle" align="left">0.870</td>
<td valign="middle" align="left">0.775</td>
<td valign="middle" align="left">0.795</td>
<td valign="middle" align="left">0.210</td>
<td valign="middle" align="left">0.127</td>
</tr>
<tr>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="left">0.997</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.966</td>
<td valign="middle" align="left">0.973</td>
<td valign="middle" align="left">0.331</td>
<td valign="middle" align="left">0.033</td>
</tr>
<tr>
<th valign="middle" colspan="7" align="center">Validation set</th>
</tr>
<tr>
<th valign="middle" align="left">Models</th>
<th valign="middle" align="left">AUC</th>
<th valign="middle" align="left">Sensitivity</th>
<th valign="middle" align="left">Specificity</th>
<th valign="middle" align="left">Accuracy</th>
<th valign="middle" align="left">Threshold</th>
<th valign="middle" align="left">Brier</th>
</tr>
<tr>
<td valign="middle" align="left">Catboost</td>
<td valign="middle" align="left">0.848</td>
<td valign="middle" align="left">0.818</td>
<td valign="middle" align="left">0.795</td>
<td valign="middle" align="left">0.8</td>
<td valign="middle" align="left">0.241</td>
<td valign="middle" align="left">0.103</td>
</tr>
<tr>
<td valign="middle" align="left">RF</td>
<td valign="middle" align="left">0.834</td>
<td valign="middle" align="left">0.545</td>
<td valign="middle" align="left">0.949</td>
<td valign="middle" align="left">0.86</td>
<td valign="middle" align="left">0.407</td>
<td valign="middle" align="left">0.11</td>
</tr>
<tr>
<td valign="middle" align="left">lightGBM</td>
<td valign="middle" align="left">0.734</td>
<td valign="middle" align="left">0.909</td>
<td valign="middle" align="left">0.462</td>
<td valign="middle" align="left">0.56</td>
<td valign="middle" align="left">0.117</td>
<td valign="middle" align="left">0.155</td>
</tr>
<tr>
<td valign="middle" align="left">Xgboost</td>
<td valign="middle" align="left">0.8</td>
<td valign="middle" align="left">0.818</td>
<td valign="middle" align="left">0.718</td>
<td valign="middle" align="left">0.74</td>
<td valign="middle" align="left">0.21</td>
<td valign="middle" align="left">0.122</td>
</tr>
<tr>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="left">0.765</td>
<td valign="middle" align="left">0.545</td>
<td valign="middle" align="left">0.846</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.29</td>
<td valign="middle" align="left">0.206</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Evaluation of the predictive performance of the NAC efficacy prediction model. <bold>(A, B)</bold> The ROC curves and AUC values obtained for the CatBoost model in the training set (70%) and validation set (30%). <bold>(C)</bold> Confusion matrix yielded by the CatBoost model on the validation set. <bold>(D)</bold> Decision curve analysis (DCA) of the CatBoost model on the validation set. <bold>(E)</bold> Calibration curves of the CatBoost model in the validation set. <bold>(F)</bold> Feature importance ranking of the CatBoost model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1770037-g004.tif">
<alt-text content-type="machine-generated">Panel A shows a ROC curve for training data with an AUC of 0.900, while panel B displays the validation ROC curve with an AUC of 0.848, both reflecting CatBoost model performance. Panel C contains a confusion matrix on validation data, summarizing true positives, false positives, false negatives, and true negatives for MPgrade predictions. Panel D depicts a decision curve analysis for validation, illustrating model net benefit compared to &#x201c;treat all&#x201d; or &#x201c;treat none&#x201d; strategies across threshold probabilities. Panel E presents a calibration curve comparing predicted probabilities to observed event rates, indicating model reliability. Panel F is a horizontal bar chart listing the top 20 features contributing to the CatBoost model, with their respective importance percentages.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Construction and validation of the recurrence prediction model</title>
<p>For patients with HR-positive, HER2-negative breast cancer, the efficacy of neoadjuvant chemotherapy (NAC) not only plays a crucial role in optimizing surgical strategies but also draws considerable attention to its association with patient prognosis. Therefore, we divided the patients into two groups according to whether their MP grade reached 4 or 5 and whether a pCR was achieved. On the basis of the follow-up data, we constructed Kaplan&#x2013;Meier (KM) survival plots for each group, with a median follow-up period of 66 months. The results indicate that regardless of stratification by MP grade or pCR status, there was no significant difference in recurrence status or survival outcomes between the two groups (<xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5A-D</bold></xref>). To further investigate potential risk factors influencing prognosis in this population, we performed both univariable and multivariable Cox proportional hazards regression analyses (<xref ref-type="table" rid="T3"><bold>Table&#xa0;3</bold></xref>; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>). The results revealed that extreme age groups at diagnosis (20&#x2013;30 years, hazard ratio [HR]=6.32, p=0.017; 71&#x2013;80 years, HR = 7.29, p=0.045), clinical N stage III (HR = 2.37, p=0.033), low PR expression (0&#x2013;25%; HR = 2.60, p=0.049), and MP grade 2 (HR = 4.07, p=0.003) were associated with an increased risk of recurrence. Conversely, clinical T stage I before NAC (HR = 0.20, p=0.031) and pathological T stage 0 after NAC (HR = 0.14, p=0.015) were protective factors against recurrence. Similarly, in the multivariable Cox regression analysis of survival outcomes, we observed consistent findings (<xref ref-type="table" rid="T4"><bold>Table&#xa0;4</bold></xref>; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S2</bold></xref>). Low age at diagnosis (20&#x2013;30 years; HR = 9.52, p=0.043), low PR expression (0&#x2013;25%; HR = 6.23, p=0.027), high Ki-67 expression (51&#x2013;75%; HR = 6.35, p=0.045), and MP grade 1 (HR = 12.35, p=0.021) or 2 (HR = 11.82, p=0.001) were associated with a higher risk of mortality. In contrast, compared with pathological T stage 1 disease, pathological T stage 0 disease after NAC was associated with a lower risk of mortality (HR = 0.02, p=0.026). Although these findings revealed certain risk factors linked to prognosis in HR-positive, HER2-negative breast cancer patients receiving NAC, no single variable emerged as a strong independent prognostic indicator for this population. Therefore, we next investigated the utility of machine learning models incorporating pathomic features for predicting patient prognosis. Following the previously established modeling strategy, we developed CatBoost models to predict recurrence at 1, 3, and 5 years after treatment. The results demonstrated that the model performed well in predicting 1-year recurrence, achieving an area under the curve (AUC) of 0.907 in the training set and 0.769 in the validation set, with a sensitivity of 0.857 (<xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6A-C</bold></xref>). Furthermore, decision curve analysis (DCA) demonstrated that the net benefit of the model exceeded that of both the &#x201c;treat all&#x201d; and &#x201c;treat none&#x201d; strategies (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6D</bold></xref>). In addition, the calibration curve showed good agreement between the predicted and observed recurrence probabilities (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6E</bold></xref>). Collectively, these findings support the potential clinical applicability of the recurrence prediction model. We also ranked the feature importance within the CatBoost model and found that the top-ranked variable was a pathomics feature. Among the top ten most important features, all except ER expression were pathomic variables (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6F</bold></xref>). These findings indicate that pathomic features may have greater potential than traditional clinical parameters for predicting recurrence and identifying high-risk subgroups among HR-positive, HER2-negative breast cancer patients.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Survival curves stratified by NAC efficacy groups. <bold>(A)</bold> Disease-free survival curves stratified according to whether patients achieved MP4.5. <bold>(B)</bold> Disease-free survival curves stratified according to whether patients achieved pCR. <bold>(C)</bold> Overall survival curves stratified according to whether patients achieved MP4.5. <bold>(D)</bold> Overall survival curves stratified according to whether patients achieved pCR. Log-rank tests were used to compare two overall survival curves.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1770037-g005.tif">
<alt-text content-type="machine-generated">Four-panel figure containing Kaplan-Meier survival curves. Panel A compares disease-free survival (DFS) by MIPgrade, showing overlapping curves with a p-value of 0.33. Panel B compares DFS by PCR status, also with overlapping curves and p-value of 0.26. Panel C compares overall survival (OS) by MIPgrade with similar trends, p-value 0.91. Panel D compares OS by PCR status, p-value 0.28. Each panel includes risk tables and time points on the x-axis up to approximately 120 months. No statistically significant differences are indicated between groups.</alt-text>
</graphic></fig>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Multivariate Cox regression analysis for disease-free survival.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Variable</th>
<th valign="top" align="center">Group</th>
<th valign="top" align="center">HR (DFS)</th>
<th valign="top" align="center">CI 95</th>
<th valign="top" align="center">P value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" rowspan="6" align="center">Age</td>
<td valign="top" align="center">20-30</td>
<td valign="top" align="center">6.32</td>
<td valign="top" align="center">(1.38-28.96)</td>
<td valign="top" align="center">0.017</td>
</tr>
<tr>
<td valign="top" align="center">31-40</td>
<td valign="top" align="center">2.11</td>
<td valign="top" align="center">(0.74-6.02)</td>
<td valign="top" align="center">0.163</td>
</tr>
<tr>
<td valign="top" align="center">41-50</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">51-60</td>
<td valign="top" align="center">1.39</td>
<td valign="top" align="center">(0.48-4.06)</td>
<td valign="top" align="center">0.541</td>
</tr>
<tr>
<td valign="top" align="center">61-70</td>
<td valign="top" align="center">1.22</td>
<td valign="top" align="center">(0.36-4.18)</td>
<td valign="top" align="center">0.751</td>
</tr>
<tr>
<td valign="top" align="center">71-80</td>
<td valign="top" align="center">7.29</td>
<td valign="top" align="center">(1.04-50.97)</td>
<td valign="top" align="center">0.045</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">cT stage</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">0.20</td>
<td valign="top" align="center">(0.05-0.86)</td>
<td valign="top" align="center">0.031</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">2.05</td>
<td valign="top" align="center">(0.69-6.06)</td>
<td valign="top" align="center">0.196</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">0.94</td>
<td valign="top" align="center">(0.38-2.35)</td>
<td valign="top" align="center">0.898</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">cN stage</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0.88</td>
<td valign="top" align="center">(0.19-4.1)</td>
<td valign="top" align="center">0.869</td>
</tr>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">0.89</td>
<td valign="top" align="center">(0.36-2.2)</td>
<td valign="top" align="center">0.808</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">2.37</td>
<td valign="top" align="center">(1.07-5.23)</td>
<td valign="top" align="center">0.033</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">Surgery</td>
<td valign="top" align="center">BCS</td>
<td valign="top" align="center">2.58</td>
<td valign="top" align="center">(0.87-7.69)</td>
<td valign="top" align="center">0.089</td>
</tr>
<tr>
<td valign="top" align="center">Mastectomy</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">ER</td>
<td valign="top" align="center">0-0.25</td>
<td valign="top" align="center">0.76</td>
<td valign="top" align="center">(0.21-2.77)</td>
<td valign="top" align="center">0.679</td>
</tr>
<tr>
<td valign="top" align="center">0.26-0.5</td>
<td valign="top" align="center">2.67</td>
<td valign="top" align="center">(0.7-10.16)</td>
<td valign="top" align="center">0.15</td>
</tr>
<tr>
<td valign="top" align="center">0.51-0.75</td>
<td valign="top" align="center">1.92</td>
<td valign="top" align="center">(0.81-4.55)</td>
<td valign="top" align="center">0.14</td>
</tr>
<tr>
<td valign="top" align="center">0.76-1</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">PR</td>
<td valign="top" align="center">0-0.25</td>
<td valign="top" align="center">2.60</td>
<td valign="top" align="center">(1-6.76)</td>
<td valign="top" align="center">0.049</td>
</tr>
<tr>
<td valign="top" align="center">0.26-0.5</td>
<td valign="top" align="center">1.62</td>
<td valign="top" align="center">(0.6-4.37)</td>
<td valign="top" align="center">0.338</td>
</tr>
<tr>
<td valign="top" align="center">0.51-0.75</td>
<td valign="top" align="center">1.94</td>
<td valign="top" align="center">(0.78-4.8)</td>
<td valign="top" align="center">0.152</td>
</tr>
<tr>
<td valign="top" align="center">0.76-1</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">Ki67</td>
<td valign="top" align="center">0-0.25</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">0.26-0.5</td>
<td valign="top" align="center">1.49</td>
<td valign="top" align="center">(0.71-3.1)</td>
<td valign="top" align="center">0.289</td>
</tr>
<tr>
<td valign="top" align="center">0.51-0.75</td>
<td valign="top" align="center">0.80</td>
<td valign="top" align="center">(0.23-2.76)</td>
<td valign="top" align="center">0.727</td>
</tr>
<tr>
<td valign="top" align="center">0.76-1</td>
<td valign="top" align="center">0.92</td>
<td valign="top" align="center">(0.2-4.28)</td>
<td valign="top" align="center">0.918</td>
</tr>
<tr>
<td valign="top" rowspan="3" align="center">Grade</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">0.00</td>
<td valign="top" align="center">(0-Inf)</td>
<td valign="top" align="center">0.996</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">1.74</td>
<td valign="top" align="center">(0.66-4.57)</td>
<td valign="top" align="center">0.261</td>
</tr>
<tr>
<td valign="top" rowspan="3" align="center">Chemotherapy regimen</td>
<td valign="top" align="center">AT-based</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">A-based</td>
<td valign="top" align="center">0.00</td>
<td valign="top" align="center">(0-Inf)</td>
<td valign="top" align="center">0.999</td>
</tr>
<tr>
<td valign="top" align="center">T-based</td>
<td valign="top" align="center">1.30</td>
<td valign="top" align="center">(0.51-3.32)</td>
<td valign="top" align="center">0.589</td>
</tr>
<tr>
<td valign="top" rowspan="5" align="center">ypT stage</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0.14</td>
<td valign="top" align="center">(0.03-0.69)</td>
<td valign="top" align="center">0.015</td>
</tr>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">0.74</td>
<td valign="top" align="center">(0.36-1.55)</td>
<td valign="top" align="center">0.428</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">1.76</td>
<td valign="top" align="center">(0.49-6.38)</td>
<td valign="top" align="center">0.386</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">5.05</td>
<td valign="top" align="center">(0.94-27.15)</td>
<td valign="top" align="center">0.059</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">ypN stage</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1.08</td>
<td valign="top" align="center">(0.27-4.26)</td>
<td valign="top" align="center">0.917</td>
</tr>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">0.62</td>
<td valign="top" align="center">(0.24-1.6)</td>
<td valign="top" align="center">0.322</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">0.47</td>
<td valign="top" align="center">(0.16-1.33)</td>
<td valign="top" align="center">0.154</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">Menopausal status</td>
<td valign="top" align="center">No</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">Yes</td>
<td valign="top" align="center">0.73</td>
<td valign="top" align="center">(0.25-2.12)</td>
<td valign="top" align="center">0.569</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">Family history</td>
<td valign="top" align="center">No</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">Yes</td>
<td valign="top" align="center">0.57</td>
<td valign="top" align="center">(0.28-1.15)</td>
<td valign="top" align="center">0.114</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">BMI</td>
<td valign="top" align="center">&lt;18.4</td>
<td valign="top" align="center">0.00</td>
<td valign="top" align="center">(0-Inf)</td>
<td valign="top" align="center">0.997</td>
</tr>
<tr>
<td valign="top" align="center">18.5-24.9</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">25-29.9</td>
<td valign="top" align="center">1.01</td>
<td valign="top" align="center">(0.49-2.06)</td>
<td valign="top" align="center">0.981</td>
</tr>
<tr>
<td valign="top" align="center">&gt;30</td>
<td valign="top" align="center">0.60</td>
<td valign="top" align="center">(0.17-2.09)</td>
<td valign="top" align="center">0.423</td>
</tr>
<tr>
<td valign="top" rowspan="3" align="center">LDL-C</td>
<td valign="top" align="center">&lt;1.88</td>
<td valign="top" align="center">1.05</td>
<td valign="top" align="center">(0.28-3.94)</td>
<td valign="top" align="center">0.948</td>
</tr>
<tr>
<td valign="top" align="center">1.89-4.21</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">&gt;4.22</td>
<td valign="top" align="center">0.90</td>
<td valign="top" align="center">(0.32-2.54)</td>
<td valign="top" align="center">0.848</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">TG</td>
<td valign="top" align="center">0-1.7</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">&gt;1.8</td>
<td valign="top" align="center">1.22</td>
<td valign="top" align="center">(0.51-2.9)</td>
<td valign="top" align="center">0.651</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">Glucose</td>
<td valign="top" align="center">3.9-6.1</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">&gt;6.2</td>
<td valign="top" align="center">0.50</td>
<td valign="top" align="center">(0.18-1.33)</td>
<td valign="top" align="center">0.164</td>
</tr>
<tr>
<td valign="top" rowspan="5" align="center">MPgrade</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1.67</td>
<td valign="top" align="center">(0.44-6.37)</td>
<td valign="top" align="center">0.452</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">4.07</td>
<td valign="top" align="center">(1.64-10.11)</td>
<td valign="top" align="center">0.003</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">1.39</td>
<td valign="top" align="center">(0.36-5.44)</td>
<td valign="top" align="center">0.635</td>
</tr>
<tr>
<td valign="top" align="center">5</td>
<td valign="top" align="center">0.00</td>
<td valign="top" align="center">(0-Inf)</td>
<td valign="top" align="center">0.999</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">PCR</td>
<td valign="top" align="center">No</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">Yes</td>
<td valign="top" align="center">0.60</td>
<td valign="top" align="center">(0.05-7.56)</td>
<td valign="top" align="center">0.693</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Evaluation of the predictive performance of the recurrence prediction model. <bold>(A, B)</bold> The ROC curves and AUC values obtained for the CatBoost model in the training set (70%) and validation set (30%). <bold>(C)</bold> Confusion matrix yielded by the CatBoost model on the validation set. <bold>(D)</bold> Decision curve analysis (DCA) of the CatBoost model on the validation set. <bold>(E)</bold> Calibration curves of the CatBoost model in the validation set. <bold>(F)</bold> Feature importance ranking of the CatBoost model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-16-1770037-g006.tif">
<alt-text content-type="machine-generated">Panel A shows a line graph of training ROC curves for one, three, and five-year recurrence prediction with reported AUCs; panel B displays similar ROC validation results. Panel C presents a confusion matrix for one-year recurrence validation, showing true positive, false positive, false negative, and true negative rates with respective counts and percentages. Panel D features a decision curve analysis for the one-year recurrence model, displaying net benefit across probability thresholds. Panel E shows a calibration curve comparing observed event rates versus predicted probabilities for one-year recurrence. Panel F is a horizontal bar chart ranking feature importance for the CatBoost model, listing variable names and corresponding importance percentages.</alt-text>
</graphic></fig>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>Multivariate Cox regression analysis for overall survival of patients.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Variable</th>
<th valign="top" align="center">Group</th>
<th valign="top" align="center">HR (OS)</th>
<th valign="top" align="center">CI 95</th>
<th valign="top" align="center">P value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" rowspan="6" align="center">Age</td>
<td valign="top" align="center">20-30</td>
<td valign="top" align="center">9.52</td>
<td valign="top" align="center">(1.07-84.81)</td>
<td valign="top" align="center">0.043</td>
</tr>
<tr>
<td valign="top" align="center">31-40</td>
<td valign="top" align="center">3.61</td>
<td valign="top" align="center">(0.62-20.95)</td>
<td valign="top" align="center">0.152</td>
</tr>
<tr>
<td valign="top" align="center">41-50</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">51-60</td>
<td valign="top" align="center">1.83</td>
<td valign="top" align="center">(0.38-8.84)</td>
<td valign="top" align="center">0.452</td>
</tr>
<tr>
<td valign="top" align="center">61-70</td>
<td valign="top" align="center">0.63</td>
<td valign="top" align="center">(0.05-7.26)</td>
<td valign="top" align="center">0.711</td>
</tr>
<tr>
<td valign="top" align="center">71-80</td>
<td valign="top" align="center">9.71</td>
<td valign="top" align="center">(0.39-244.12)</td>
<td valign="top" align="center">0.167</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">cT stage</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">0.19</td>
<td valign="top" align="center">(0.02-2.13)</td>
<td valign="top" align="center">0.178</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">3.41</td>
<td valign="top" align="center">(0.78-14.84)</td>
<td valign="top" align="center">0.102</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">1.27</td>
<td valign="top" align="center">(0.26-6.19)</td>
<td valign="top" align="center">0.767</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">cN stage</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0.00</td>
<td valign="top" align="center">(0-Inf)</td>
<td valign="top" align="center">0.998</td>
</tr>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2.17</td>
<td valign="top" align="center">(0.57-8.19)</td>
<td valign="top" align="center">0.254</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">2.56</td>
<td valign="top" align="center">(0.72-9.15)</td>
<td valign="top" align="center">0.148</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">Surgery</td>
<td valign="top" align="center">BCS</td>
<td valign="top" align="center">0.80</td>
<td valign="top" align="center">(0.09-6.88)</td>
<td valign="top" align="center">0.841</td>
</tr>
<tr>
<td valign="top" align="center">Mastectomy</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">ER</td>
<td valign="top" align="center">0-0.25</td>
<td valign="top" align="center">2.29</td>
<td valign="top" align="center">(0.39-13.57)</td>
<td valign="top" align="center">0.36</td>
</tr>
<tr>
<td valign="top" align="center">0.26-0.5</td>
<td valign="top" align="center">1.65</td>
<td valign="top" align="center">(0.16-17.36)</td>
<td valign="top" align="center">0.676</td>
</tr>
<tr>
<td valign="top" align="center">0.51-0.75</td>
<td valign="top" align="center">1.97</td>
<td valign="top" align="center">(0.5-7.85)</td>
<td valign="top" align="center">0.335</td>
</tr>
<tr>
<td valign="top" align="center">0.76-1</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">PR</td>
<td valign="top" align="center">0-0.25</td>
<td valign="top" align="center">6.23</td>
<td valign="top" align="center">(1.23-31.53)</td>
<td valign="top" align="center">0.027</td>
</tr>
<tr>
<td valign="top" align="center">0.26-0.5</td>
<td valign="top" align="center">2.84</td>
<td valign="top" align="center">(0.64-12.54)</td>
<td valign="top" align="center">0.167</td>
</tr>
<tr>
<td valign="top" align="center">0.51-0.75</td>
<td valign="top" align="center">1.14</td>
<td valign="top" align="center">(0.17-7.66)</td>
<td valign="top" align="center">0.896</td>
</tr>
<tr>
<td valign="top" align="center">0.76-1</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">Ki67</td>
<td valign="top" align="center">0-0.25</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">0.26-0.5</td>
<td valign="top" align="center">1.30</td>
<td valign="top" align="center">(0.37-4.61)</td>
<td valign="top" align="center">0.685</td>
</tr>
<tr>
<td valign="top" align="center">0.51-0.75</td>
<td valign="top" align="center">6.35</td>
<td valign="top" align="center">(1.04-38.7)</td>
<td valign="top" align="center">0.045</td>
</tr>
<tr>
<td valign="top" align="center">0.76-1</td>
<td valign="top" align="center">6.30</td>
<td valign="top" align="center">(0.33-120.65)</td>
<td valign="top" align="center">0.222</td>
</tr>
<tr>
<td valign="top" rowspan="3" align="center">Grade</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">0.00</td>
<td valign="top" align="center">(0-Inf)</td>
<td valign="top" align="center">0.998</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">0.73</td>
<td valign="top" align="center">(0.17-3.02)</td>
<td valign="top" align="center">0.66</td>
</tr>
<tr>
<td valign="top" rowspan="3" align="center">Chemotherapy regimen</td>
<td valign="top" align="center">AT-based</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">A-based</td>
<td valign="top" align="center">0.00</td>
<td valign="top" align="center">(0-Inf)</td>
<td valign="top" align="center">0.999</td>
</tr>
<tr>
<td valign="top" align="center">T-based</td>
<td valign="top" align="center">0.36</td>
<td valign="top" align="center">(0.05-2.44)</td>
<td valign="top" align="center">0.294</td>
</tr>
<tr>
<td valign="top" rowspan="5" align="center">ypT stage</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0.02</td>
<td valign="top" align="center">(0-0.62)</td>
<td valign="top" align="center">0.026</td>
</tr>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">0.37</td>
<td valign="top" align="center">(0.11-1.22)</td>
<td valign="top" align="center">0.102</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">0.15</td>
<td valign="top" align="center">(0.01-1.71)</td>
<td valign="top" align="center">0.127</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">2.35</td>
<td valign="top" align="center">(0.12-46.86)</td>
<td valign="top" align="center">0.576</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">ypN stage</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0.14</td>
<td valign="top" align="center">(0.01-2.46)</td>
<td valign="top" align="center">0.179</td>
</tr>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">0.51</td>
<td valign="top" align="center">(0.1-2.57)</td>
<td valign="top" align="center">0.415</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">0.27</td>
<td valign="top" align="center">(0.04-1.97)</td>
<td valign="top" align="center">0.195</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">Menopausal status</td>
<td valign="top" align="center">No</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">Yes</td>
<td valign="top" align="center">0.20</td>
<td valign="top" align="center">(0.03-1.13)</td>
<td valign="top" align="center">0.068</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">Family History</td>
<td valign="top" align="center">No</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">Yes</td>
<td valign="top" align="center">0.38</td>
<td valign="top" align="center">(0.11-1.31)</td>
<td valign="top" align="center">0.125</td>
</tr>
<tr>
<td valign="top" rowspan="4" align="center">BMI</td>
<td valign="top" align="center">&lt;18.4</td>
<td valign="top" align="center">0.00</td>
<td valign="top" align="center">(0-Inf)</td>
<td valign="top" align="center">0.999</td>
</tr>
<tr>
<td valign="top" align="center">18.5-24.9</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">25-29.9</td>
<td valign="top" align="center">1.40</td>
<td valign="top" align="center">(0.45-4.36)</td>
<td valign="top" align="center">0.564</td>
</tr>
<tr>
<td valign="top" align="center">&gt;30</td>
<td valign="top" align="center">0.75</td>
<td valign="top" align="center">(0.09-6.63)</td>
<td valign="top" align="center">0.799</td>
</tr>
<tr>
<td valign="top" rowspan="3" align="center">LDL-C</td>
<td valign="top" align="center">&lt;1.88</td>
<td valign="top" align="center">0.21</td>
<td valign="top" align="center">(0.01-5.99)</td>
<td valign="top" align="center">0.363</td>
</tr>
<tr>
<td valign="top" align="center">1.89-4.21</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">&gt;4.22</td>
<td valign="top" align="center">2.26</td>
<td valign="top" align="center">(0.41-12.63)</td>
<td valign="top" align="center">0.352</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">TG</td>
<td valign="top" align="center">0-1.7</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">&gt;1.8</td>
<td valign="top" align="center">0.70</td>
<td valign="top" align="center">(0.19-2.59)</td>
<td valign="top" align="center">0.599</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">Glucose</td>
<td valign="top" align="center">3.9-6.1</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">&gt;6.2</td>
<td valign="top" align="center">0.90</td>
<td valign="top" align="center">(0.18-4.54)</td>
<td valign="top" align="center">0.9</td>
</tr>
<tr>
<td valign="top" rowspan="5" align="center">MPgrade</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">12.35</td>
<td valign="top" align="center">(1.47-103.76)</td>
<td valign="top" align="center">0.021</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">11.82</td>
<td valign="top" align="center">(2.61-53.65)</td>
<td valign="top" align="center">0.001</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">1.25</td>
<td valign="top" align="center">(0.15-10.46)</td>
<td valign="top" align="center">0.836</td>
</tr>
<tr>
<td valign="top" align="center">5</td>
<td valign="top" align="center">0.03</td>
<td valign="top" align="center">(0-Inf)</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">PCR</td>
<td valign="top" align="center">No</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">Reference</td>
<td valign="top" align="center">Reference</td>
</tr>
<tr>
<td valign="top" align="center">Yes</td>
<td valign="top" align="center">3.31e+10</td>
<td valign="top" align="center">(0-Inf)</td>
<td valign="top" align="center">0.999</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>In this study, we developed and validated a machine learning model based on the CatBoost algorithm to predict the efficacy of neoadjuvant chemotherapy (NAC) in patients with HR-positive, HER2-negative breast cancer. Furthermore, we investigated prognostic risk factors and evaluated the model performance in predicting recurrence in this patient population. Our findings demonstrate that by integrating pathomic features from pre-NAC biopsy histopathological slides with clinical data, the model achieves high accuracy in both treatment response prediction and recurrence risk stratification, highlighting its promising potential for clinical application.</p>
<p>Given the substantial clinical importance of predicting the response to NAC, numerous previous studies have focused on this topic. Liu et&#xa0;al. (<xref ref-type="bibr" rid="B18">18</xref>) and Wang et&#xa0;al. (<xref ref-type="bibr" rid="B19">19</xref>) developed predictive models based on patients&#x2019; clinical characteristics combined with MRI-based radiomics features to estimate NAC efficacy in HR-positive/HER2-negative breast cancer, achieving favorable predictive performance, with AUCs of 0.787 and 0.810 in the validation cohorts respectively, slightly lower than that observed in the present study (AUC = 0.848). However, unlike the current pathomics based approach, most radiomics driven models rely on manual delineation of regions of interest (ROIs), a process that is labor intensive and time consuming, thereby limiting their feasibility and scalability in routine clinical practice. In addition, li et&#xa0;al. (<xref ref-type="bibr" rid="B16">16</xref>) constructed a machine learning model based on pathomics features to predict NAC response across all breast cancer subtypes, achieving an AUC of 0.830 in the validation set. However, that study used CellProfiler to extract pathology features, whereas our study used the UNI algorithm, which can automatically segment and extract feature information from pathology slides. CellProfiler requires pathologists to preselect screenshots with the highest tumor cell content from segmented WSIs for subsequent feature extraction, which increases labor costs. In addition, unlike li et&#xa0;al., who chose a single SVM as the predictive algorithm, our study compared five different machine learning algorithms and built ensemble models to further improve predictive performance; this may explain why our study, focusing on the HR-positive, HER2-negative subgroup, was still able to achieve a higher AUC.</p>
<p>Unlike HER2-overexpressing or triple-negative breast cancer (TNBC), HR-positive, HER2-negative breast cancer is less sensitive to neoadjuvant chemotherapy (NAC). Previous studies have reported that the pCR rate in this population ranges from approximately 0&#x2013;18% (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B21">21</xref>). Consistent with these findings, our cohort had a pCR rate of 8.6%, with only 14 out of 162 patients achieving pCR following NAC. The lower sensitivity to chemotherapy in this subtype may be attributed to hormone dependency, lower cellular proliferation rates, and distinctive mutational characteristics of tumor cells (<xref ref-type="bibr" rid="B22">22</xref>). One of the goals of NAC is to reduce tumor volume so that patients who would otherwise require mastectomy may become eligible for breast-conserving surgery (BCS), thereby minimizing surgical trauma and improving quality of life (<xref ref-type="bibr" rid="B23">23</xref>), for these patients, achieving pCR is not always necessary for surgical de-escalation (<xref ref-type="bibr" rid="B24">24</xref>). For this reason, we selected Miller&#x2013;Payne (MP) grade as the primary endpoint for model prediction, with grades 4 and 5 indicating substantial tumor regression (<xref ref-type="bibr" rid="B17">17</xref>). In our cohort, the proportion of patients who ultimately underwent BCS was significantly greater among those with MP grades 4 or 5 than among those with grades 1, 2, or 3 (20.6% vs. 4.7%, P = 0.007). Previous research has also demonstrated that NAC increases the rate of breast conservation in this subgroup of patients (<xref ref-type="bibr" rid="B25">25</xref>&#x2013;<xref ref-type="bibr" rid="B29">29</xref>). Despite this benefit, only a small percentage of HR-positive, HER2-negative patients achieve high MP grades after NAC, which highlights the need to identify patients who are unlikely to benefit from chemotherapy in advance and avoid subjecting them to unnecessary toxicity. Currently, there are few robust tools for predicting NAC response in this population. Most prior models focus primarily on conventional clinical and molecular pathological markers, including hormone receptor status, the Ki-67 index, clinical tumor stage, and histological grade (<xref ref-type="bibr" rid="B8">8</xref>, <xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B30">30</xref>). In our study, we observed significant differences in these features between NAC-sensitive and NAC-insensitive patients, with the sensitive group generally being younger, exhibiting lower expression of estrogen receptor (ER) and progesterone receptor (PR), and having higher values for Ki-67 and histological grade. Most of these differences are molecular pathological features, suggesting that additional discriminative information may be embedded within pathological images. This rationale led us to integrate both pathomic features and clinical variables into our predictive model. Pathomic features were extracted from hematoxylin and eosin (H&amp;E)-stained whole-slide images (WSIs) of core needle biopsy specimens obtained prior to NAC. These images are readily available in clinical practice, cost effective, and offer high potential for clinical translation (<xref ref-type="bibr" rid="B31">31</xref>). For feature extraction, we utilized the UNI model, which had been pretrained on large-scale cancer image databases containing more than 100,000 H&amp;E-stained diagnostic-grade whole-slide images across 20 major tissue types, exceeding 77 terabytes in total. Through self-supervised and multitask learning, the UNI model captures complex morphological patterns and features from cancer histopathology, enabling efficient and accurate feature extraction even on new datasets (<xref ref-type="bibr" rid="B32">32</xref>). During the model development stage, we tested five commonly used machine learning algorithms and reported that CatBoost provided the highest accuracy and sensitivity in predicting NAC response. In future clinical applications, false-positive predictions present a greater risk, as misclassifying chemotherapy-insensitive patients as sensitive could deprive them of the opportunity for surgery. Given this consideration, CatBoost was selected as the optimal modeling strategy. As a decision tree-based algorithm, CatBoost is well suited for handling categorical and heterogeneous data, offering both robust accuracy and generalizability in medical prediction tasks (<xref ref-type="bibr" rid="B33">33</xref>&#x2013;<xref ref-type="bibr" rid="B36">36</xref>). All the steps of model construction were performed exclusively within the training set to ensure that no information leakage into the validation set occurred, thereby maintaining the integrity and reliability of the prediction results. For the final prediction model, we applied SHapley Additive exPlanations (SHAP) to interpret feature importance. As anticipated, in addition to previously reported clinical predictors such as PR and Ki-67, pathomic features were predominant among the most important variables. These findings support our hypothesis and highlight the value of pathomic data in predicting NAC response in patients with breast cancer. The model development process, from biopsy slide scanning and feature extraction to variable selection and model training, is fully reproducible and presents significant promise for future clinical translation.</p>
<p>The relationship between the efficacy of neoadjuvant chemotherapy (NAC) and patient prognosis remains an important area of investigation. Previous studies have reported that achieving pathological complete response (pCR) after NAC is often associated with improved prognosis (<xref ref-type="bibr" rid="B37">37</xref>&#x2013;<xref ref-type="bibr" rid="B40">40</xref>). However, our results indicate that for patients with HR-positive, HER2-negative breast cancer, neither achieving pCR nor attaining Miller&#x2013;Payne (MP) grades 4 or 5 after NAC is associated with a reduced risk of recurrence or mortality. These findings align with reports from some previous studies, which have also shown conflicting results in this patient subgroup (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B42">42</xref>). Our further analyses provide a possible explanation for this phenomenon. Cox proportional hazards regression revealed risk factors for worse prognosis, including younger age at diagnosis, low progesterone receptor expression, and a high Ki-67 index. However, these factors are also associated with a better response to chemotherapy. Thus, the prognostic benefit conferred by the chemotherapy response is offset by the higher baseline risk associated with more aggressive tumor biology, leading to the observation that NAC responders and nonresponders have similar long-term outcomes in this patient population. In light of this, the identification of high-risk patients for intensified therapy is essential to reduce the risk of recurrence. Our results demonstrate that machine learning models integrating pathomics and clinical information strongly predict 1-year recurrence, but these models do not accurately predict 3- or 5-year recurrence. This may be because recurrence within 1 year represents a very high degree of malignancy of the tumor, with certain identifiable characteristics at the pathological level. However, recurrence after a longer period is influenced by more diverse factors, and relying solely on information from the tumor itself may not be sufficient for accurate prediction. We also investigated the application of our models for survival prediction. Owing to the low number of deaths within 1 year, we developed models to predict 3-year and 5-year survival. Although the 3-year survival prediction model achieved a favorable area under the curve (AUC) of 0.770 in the validation set, decision curve analysis revealed no clinical net benefit for patient management (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figures S2A, B, D</bold></xref>). Analysis of the confusion matrix suggested that this is attributable to the overall favorable prognosis of this subtype, with a 3-year mortality rate of only 6.7%; assigning the majority of patients to the &#x201c;survival&#x201d; category yields high specificity (0.952) but fails to provide meaningful risk stratification despite an apparently good AUC (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S2C</bold></xref>).</p>
<p>The novelty of the present study lies in the development of a subtype specific, fully automated model for predicting NAC response in HR-positive,HER2-negative breast cancer, based on a rigorous and reproducible analytical pipeline. In addition, we investigated prognostic risk factors in this patient subgroup and evaluated the performance of the proposed model in predicting disease recurrence, thereby extending previous machine learning&#x2013;based pathology research. Nevertheless, this study has several limitations: First, our data were collected from a single-center retrospective cohort and lack external validation. Despite strict inclusion criteria to ensure data quality and the use of ensemble modeling to increase model robustness and generalizability, larger prospective cohorts and the incorporation of external validation datasets will be needed in future work to improve the model reliability and predictive accuracy. Second, in this study, pathomic features were extracted using the UNI model. While UNI enables efficient and accurate feature extraction, as a patch-level feature extractor, it generates encoded feature vectors rather than manually engineered morphological features, such as nuclear shape or tissue architecture (<xref ref-type="bibr" rid="B43">43</xref>). Although this abstract representation can capture complex pathological patterns, it does not allow direct mapping back to the original image to form interpretable visual markers, for example, overlaying heatmaps for intuitive pathological localization. As a result, the model lacks straightforward pathological interpretability. In future research, building on our existing work, we will continue to develop interpretable predictive models to further improve the model&#x2019;s predictive performance.</p>
<p>In conclusion, we developed a CatBoost-based machine learning model that integrates pathomics and clinical information to predict the efficacy of NAC in HR-positive, HER2-negative breast cancer and demonstrated its robust predictive performance. Furthermore, our pathological model predicted early recurrence in HR-positive, HER2-negative breast cancer patients, thus could provide better guidance for clinical practice when deciding whether to perform surgery first or NAC.</p>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p></sec>
<sec id="s6" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Ethics Committee of National Cancer Center/Cancer Hospital, Chinese Academy of Medical Sciences and Peking Union Medical College. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p></sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>JYu: Visualization, Validation, Writing &#x2013; original draft, Formal Analysis. JL: Visualization, Formal analysis, Writing &#x2013; original draft. XK: Writing &#x2013; original draft, Formal analysis, Methodology. PY:&#xa0;Writing &#x2013; original draft, Data curation, Resources. WW:&#xa0;Writing &#x2013; original draft, Software. ZW: Writing &#x2013; original draft, Conceptualization. CS: Conceptualization, Writing &#x2013; original draft. QS: Writing &#x2013; original draft, Investigation. GL: Investigation, Writing &#x2013; original draft. XD: Investigation, Writing &#x2013; original draft. TW: Writing &#x2013; original draft, Investigation. DY: Investigation, Writing &#x2013; original draft. SW: Writing &#x2013; review &amp; editing, Software. CY: Writing &#x2013; review &amp; editing, Conceptualization, Funding acquisition. JYi: Supervision, Resources, Writing &#x2013; review &amp; editing. XW: Supervision, Writing &#x2013; review &amp; editing, Project administration, Funding acquisition.</p></sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>Author WW was employed by company Thorough Future.</p>
<p>The remaining author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fonc.2026.1770037/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fonc.2026.1770037/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Siegel</surname> <given-names>RL</given-names></name>
<name><surname>Kratzer</surname> <given-names>TB</given-names></name>
<name><surname>Giaquinto</surname> <given-names>AN</given-names></name>
<name><surname>Sung</surname> <given-names>H</given-names></name>
<name><surname>Jemal</surname> <given-names>A</given-names></name>
</person-group>. 
<article-title>Cancer statistics, 2025</article-title>. <source>CA A Cancer J Clin</source>. (<year>2025</year>) <volume>75</volume>:<fpage>10</fpage>&#x2013;<lpage>45</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21871</pub-id>, PMID: <pub-id pub-id-type="pmid">39817679</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<label>2</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Giaquinto</surname> <given-names>AN</given-names></name>
<name><surname>Sung</surname> <given-names>H</given-names></name>
<name><surname>Newman</surname> <given-names>LA</given-names></name>
<name><surname>Freedman</surname> <given-names>RA</given-names></name>
<name><surname>Smith</surname> <given-names>RA</given-names></name>
<name><surname>Star</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>Breast cancer statistics 2024</article-title>. <source>CA A Cancer J Clin</source>. (<year>2024</year>) <volume>74</volume>:<page-range>477&#x2013;95</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21863</pub-id>, PMID: <pub-id pub-id-type="pmid">39352042</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<label>3</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Huppert</surname> <given-names>LA</given-names></name>
<name><surname>Gumusay</surname> <given-names>O</given-names></name>
<name><surname>Idossa</surname> <given-names>D</given-names></name>
<name><surname>Rugo</surname> <given-names>HS</given-names></name>
</person-group>. 
<article-title>Systemic therapy for hormone receptor-positive/human epidermal growth factor receptor 2-negative early stage and metastatic breast cancer</article-title>. <source>CA A Cancer J Clin</source>. (<year>2023</year>) <volume>73</volume>:<fpage>480</fpage>&#x2013;<lpage>515</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21777</pub-id>, PMID: <pub-id pub-id-type="pmid">36939293</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<label>4</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Loi</surname> <given-names>S</given-names></name>
</person-group>. 
<article-title>The ESMO clinical practise guidelines for early breast cancer: diagnosis, treatment and follow-up: on the winding road to personalized medicine</article-title>. <source>Ann Oncol</source>. (<year>2019</year>) <volume>30</volume>:<page-range>1183&#x2013;4</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/annonc/mdz201</pub-id>, PMID: <pub-id pub-id-type="pmid">31287498</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<label>5</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Curigliano</surname> <given-names>G</given-names></name>
<name><surname>Burstein</surname> <given-names>HJ</given-names></name>
<name><surname>Winer</surname> <given-names>EP</given-names></name>
<name><surname>Gnant</surname> <given-names>M</given-names></name>
<name><surname>Dubsky</surname> <given-names>P</given-names></name>
<name><surname>Loibl</surname> <given-names>S</given-names></name>
<etal/>
</person-group>. 
<article-title>De-escalating and escalating treatments for early-stage breast cancer: the St. Gallen International Expert Consensus Conference on the Primary Therapy of Early Breast Cancer 2017</article-title>. <source>Ann Oncol</source>. (<year>2017</year>) <volume>28</volume>:<page-range>1700&#x2013;12</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/annonc/mdx308</pub-id>, PMID: <pub-id pub-id-type="pmid">28838210</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<label>6</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bhargava</surname> <given-names>R</given-names></name>
<name><surname>Beriwal</surname> <given-names>S</given-names></name>
<name><surname>Dabbs</surname> <given-names>DJ</given-names></name>
<name><surname>Ozbek</surname> <given-names>U</given-names></name>
<name><surname>Soran</surname> <given-names>A</given-names></name>
<name><surname>Johnson</surname> <given-names>RR</given-names></name>
<etal/>
</person-group>. 
<article-title>Immunohistochemical surrogate markers of breast cancer molecular classes predicts response to neoadjuvant chemotherapy: A single institutional experience with 359 cases</article-title>. <source>Cancer</source>. (<year>2010</year>) <volume>116</volume>:<page-range>1431&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cncr.24876</pub-id>, PMID: <pub-id pub-id-type="pmid">20131351</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<label>7</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lips</surname> <given-names>EH</given-names></name>
<name><surname>Mulder</surname> <given-names>L</given-names></name>
<name><surname>De Ronde</surname> <given-names>JJ</given-names></name>
<name><surname>Mandjes</surname> <given-names>IAM</given-names></name>
<name><surname>Vincent</surname> <given-names>A</given-names></name>
<name><surname>Vrancken Peeters</surname> <given-names>MTFD</given-names></name>
<etal/>
</person-group>. 
<article-title>Neoadjuvant chemotherapy in ER+ HER2&#x2013; breast cancer: response prediction based on immunohistochemical and molecular characteristics</article-title>. <source>Breast Cancer Res Treat</source>. (<year>2012</year>) <volume>131</volume>:<page-range>827&#x2013;36</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10549-011-1488-0</pub-id>, PMID: <pub-id pub-id-type="pmid">21472434</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<label>8</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>H&#xe4;berle</surname> <given-names>L</given-names></name>
<name><surname>Erber</surname> <given-names>R</given-names></name>
<name><surname>Gass</surname> <given-names>P</given-names></name>
<name><surname>Hein</surname> <given-names>A</given-names></name>
<name><surname>Niklos</surname> <given-names>M</given-names></name>
<name><surname>Volz</surname> <given-names>B</given-names></name>
<etal/>
</person-group>. 
<article-title>Prediction of pathological complete response after neoadjuvant chemotherapy for HER2-negative breast cancer patients with routine immunohistochemical markers</article-title>. <source>Breast Cancer Res</source>. (<year>2025</year>) <volume>27</volume>:<elocation-id>13</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13058-025-01960-8</pub-id>, PMID: <pub-id pub-id-type="pmid">39856787</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<label>9</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mastrantoni</surname> <given-names>L</given-names></name>
<name><surname>Garufi</surname> <given-names>G</given-names></name>
<name><surname>Giordano</surname> <given-names>G</given-names></name>
<name><surname>Maliziola</surname> <given-names>N</given-names></name>
<name><surname>Di Monte</surname> <given-names>E</given-names></name>
<name><surname>Arcuri</surname> <given-names>G</given-names></name>
<etal/>
</person-group>. 
<article-title>Accessible model predicts response in hormone receptor positive HER2 negative breast cancer receiving neoadjuvant chemotherapy</article-title>. <source>NPJ Breast Cancer</source>. (<year>2025</year>) <volume>11</volume>:<fpage>11</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41523-025-00727-w</pub-id>, PMID: <pub-id pub-id-type="pmid">39910103</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<label>10</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cortazar</surname> <given-names>P</given-names></name>
<name><surname>Zhang</surname> <given-names>L</given-names></name>
<name><surname>Untch</surname> <given-names>M</given-names></name>
<name><surname>Mehta</surname> <given-names>K</given-names></name>
<name><surname>Costantino</surname> <given-names>JP</given-names></name>
<name><surname>Wolmark</surname> <given-names>N</given-names></name>
<etal/>
</person-group>. 
<article-title>Pathological complete response and long-term clinical benefit in breast cancer: the CTNeoBC pooled analysis</article-title>. <source>Lancet</source>. (<year>2014</year>) <volume>384</volume>:<page-range>164&#x2013;72</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0140-6736(13)62422-8</pub-id>, PMID: <pub-id pub-id-type="pmid">24529560</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<label>11</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Conforti</surname> <given-names>F</given-names></name>
<name><surname>Pala</surname> <given-names>L</given-names></name>
<name><surname>Sala</surname> <given-names>I</given-names></name>
<name><surname>Oriecuia</surname> <given-names>C</given-names></name>
<name><surname>De Pas</surname> <given-names>T</given-names></name>
<name><surname>Specchia</surname> <given-names>C</given-names></name>
<etal/>
</person-group>. 
<article-title>Evaluation of pathological complete response as surrogate endpoint in neoadjuvant randomised clinical trials of early stage breast cancer: systematic review and meta-analysis</article-title>. <source>BMJ</source>. (<year>2021</year>) <volume>375</volume>:<fpage>e066381</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj-2021-066381</pub-id>, PMID: <pub-id pub-id-type="pmid">34933868</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<label>12</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fisher</surname> <given-names>TB</given-names></name>
<name><surname>Saini</surname> <given-names>G</given-names></name>
<name><surname>Rekha</surname> <given-names>TS</given-names></name>
<name><surname>Krishnamurthy</surname> <given-names>J</given-names></name>
<name><surname>Bhattarai</surname> <given-names>S</given-names></name>
<name><surname>Callagy</surname> <given-names>G</given-names></name>
<etal/>
</person-group>. 
<article-title>Digital image analysis and machine learning-assisted prediction of neoadjuvant chemotherapy response in triple-negative breast cancer</article-title>. <source>Breast Cancer Res</source>. (<year>2024</year>) <volume>26</volume>:<fpage>12</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13058-023-01752-y</pub-id>, PMID: <pub-id pub-id-type="pmid">38238771</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<label>13</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cao</surname> <given-names>R</given-names></name>
<name><surname>Yang</surname> <given-names>F</given-names></name>
<name><surname>Ma</surname> <given-names>S-C</given-names></name>
<name><surname>Liu</surname> <given-names>L</given-names></name>
<name><surname>Zhao</surname> <given-names>Y</given-names></name>
<name><surname>Li</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>Development and interpretation of a pathomics-based model for the prediction of microsatellite instability in Colorectal Cancer</article-title>. <source>Theranostics</source>. (<year>2020</year>) <volume>10</volume>:<page-range>11080&#x2013;91</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.7150/thno.49864</pub-id>, PMID: <pub-id pub-id-type="pmid">33042271</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<label>14</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>Q</given-names></name>
<name><surname>Jiang</surname> <given-names>N</given-names></name>
<name><surname>Hao</surname> <given-names>Y</given-names></name>
<name><surname>Hao</surname> <given-names>C</given-names></name>
<name><surname>Wang</surname> <given-names>W</given-names></name>
<name><surname>Bian</surname> <given-names>T</given-names></name>
<etal/>
</person-group>. 
<article-title>6.Identification of lymph node metastasis in pre-operation cervical cancer patients by weakly supervised deep learning from histopathological whole-slide biopsy images</article-title>. <source>Cancer Med</source>. (<year>2023</year>) <volume>12</volume>:<page-range>17952&#x2013;66</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cam4.6437</pub-id>, PMID: <pub-id pub-id-type="pmid">37559500</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<label>15</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Qu</surname> <given-names>L</given-names></name>
<name><surname>Zhu</surname> <given-names>J</given-names></name>
<name><surname>Mei</surname> <given-names>X</given-names></name>
<name><surname>Yi</surname> <given-names>Z</given-names></name>
<name><surname>Luo</surname> <given-names>N</given-names></name>
<name><surname>Yuan</surname> <given-names>S</given-names></name>
<etal/>
</person-group>. 
<article-title>Evaluating axillary lymph node metastasis risks in breast cancer patients via Semi-ALNP: a multicenter study</article-title>. <source>eClinicalMedicine</source>. (<year>2025</year>) <volume>85</volume>:<elocation-id>103311</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eclinm.2025.103311</pub-id>, PMID: <pub-id pub-id-type="pmid">40620610</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<label>16</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>H</given-names></name>
<name><surname>Ju</surname> <given-names>X</given-names></name>
<name><surname>Zeng</surname> <given-names>C</given-names></name>
<name><surname>Chen</surname> <given-names>Z</given-names></name>
<name><surname>Yu</surname> <given-names>L</given-names></name>
<name><surname>Ke</surname> <given-names>G</given-names></name>
<etal/>
</person-group>. 
<article-title>Development and validation of a pathological model predicting the efficacy of neoadjuvant therapy for breast cancer based on RCB scoring</article-title>. <source>Arch Med Sci</source>. (<year>2024</year>) <volume>21</volume>(<issue>1</issue>):<page-range>92&#x2013;101</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.5114/aoms/188006</pub-id>, PMID: <pub-id pub-id-type="pmid">40190325</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<label>17</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ogston</surname> <given-names>KN</given-names></name>
<name><surname>Miller</surname> <given-names>ID</given-names></name>
<name><surname>Payne</surname> <given-names>S</given-names></name>
<name><surname>Hutcheon</surname> <given-names>AW</given-names></name>
<name><surname>Sarkar</surname> <given-names>TK</given-names></name>
<name><surname>Smith</surname> <given-names>I</given-names></name>
<etal/>
</person-group>. 
<article-title>A new histological grading system to assess response of breast cancers to primary chemotherapy: prognostic significance and survival</article-title>. <source>Breast</source>. (<year>2003</year>) <volume>12</volume>:<page-range>320&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0960-9776(03)00106-1</pub-id>, PMID: <pub-id pub-id-type="pmid">14659147</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<label>18</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>Z</given-names></name>
<name><surname>Li</surname> <given-names>Z</given-names></name>
<name><surname>Qu</surname> <given-names>J</given-names></name>
<name><surname>Zhang</surname> <given-names>R</given-names></name>
<name><surname>Zhou</surname> <given-names>X</given-names></name>
<name><surname>Li</surname> <given-names>L</given-names></name>
<etal/>
</person-group>. 
<article-title>Radiomics of multiparametric MRI for pretreatment prediction of pathologic complete response to neoadjuvant chemotherapy in breast cancer: A multicenter study</article-title>. <source>Clin Can-cer Res</source>. (<year>2019</year>) <volume>25</volume>:<page-range>3538&#x2013;47</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1158/1078-0432.CCR-18-3190</pub-id>, PMID: <pub-id pub-id-type="pmid">30842125</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<label>19</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>L</given-names></name>
<name><surname>Wang</surname> <given-names>Y</given-names></name>
<name><surname>Yang</surname> <given-names>L</given-names></name>
<name><surname>Ren</surname> <given-names>J</given-names></name>
<name><surname>Xu</surname> <given-names>Q</given-names></name>
<name><surname>Zhai</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>Using baseline MRI radiomics to predict the tumor shrinkage patterns in HR-Positive, HER2-Negative Breast Cancer</article-title>. <source>Front Oncol</source>. (<year>2025</year>) <volume>15</volume>:<elocation-id>1539644</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2025.1539644</pub-id>, PMID: <pub-id pub-id-type="pmid">40809032</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<label>20</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Haque</surname> <given-names>W</given-names></name>
<name><surname>Verma</surname> <given-names>V</given-names></name>
<name><surname>Hatch</surname> <given-names>S</given-names></name>
<name><surname>Suzanne Klimberg</surname> <given-names>V</given-names></name>
<name><surname>Brian Butler</surname> <given-names>E</given-names></name>
<name><surname>Teh</surname> <given-names>BS</given-names></name>
</person-group>. 
<article-title>Response rates and pathologic complete response by breast cancer molecular subtype following neoadjuvant chemotherapy</article-title>. <source>Breast Cancer Res Treat</source>. (<year>2018</year>) <volume>170</volume>:<page-range>559&#x2013;67</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10549-018-4801-3</pub-id>, PMID: <pub-id pub-id-type="pmid">29693228</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<label>21</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Torrisi</surname> <given-names>R</given-names></name>
<name><surname>Marrazzo</surname> <given-names>E</given-names></name>
<name><surname>Agostinetto</surname> <given-names>E</given-names></name>
<name><surname>De Sanctis</surname> <given-names>R</given-names></name>
<name><surname>Losurdo</surname> <given-names>A</given-names></name>
<name><surname>Masci</surname> <given-names>G</given-names></name>
<etal/>
</person-group>. 
<article-title>Neoadjuvant chemotherapy in hormone receptor-positive/HER2-negative early breast cancer: When, why and what</article-title>? <source>Crit Rev Oncol/Hematol</source>. (<year>2021</year>) <volume>160</volume>:<elocation-id>103280</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.critrevonc.2021.103280</pub-id>, PMID: <pub-id pub-id-type="pmid">33667658</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<label>22</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Denkert</surname> <given-names>C</given-names></name>
<name><surname>Untch</surname> <given-names>M</given-names></name>
<name><surname>Benz</surname> <given-names>S</given-names></name>
<name><surname>Schneeweiss</surname> <given-names>A</given-names></name>
<name><surname>Weber</surname> <given-names>KE</given-names></name>
<name><surname>Schmatloch</surname> <given-names>S</given-names></name>
<etal/>
</person-group>. 
<article-title>Reconstructing tumor history in breast cancer: signatures of mutational processes and response to neoadjuvant chemotherapy&#x2606;</article-title>. <source>Ann Oncol</source>. (<year>2021</year>) <volume>32</volume>:<page-range>500&#x2013;11</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.annonc.2020.12.016</pub-id>, PMID: <pub-id pub-id-type="pmid">33418062</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<label>23</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cantini</surname> <given-names>L</given-names></name>
<name><surname>Trapani</surname> <given-names>D</given-names></name>
<name><surname>Guidi</surname> <given-names>L</given-names></name>
<name><surname>Boscolo Bielo</surname> <given-names>L</given-names></name>
<name><surname>Scafetta</surname> <given-names>R</given-names></name>
<name><surname>Koziej</surname> <given-names>M</given-names></name>
<etal/>
</person-group>. 
<article-title>Neoadjuvant therapy in hormone Receptor-Positive/HER2-Negative breast cancer</article-title>. <source>Cancer Treat Rev</source>. (<year>2024</year>) <volume>123</volume>:<elocation-id>102669</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ctrv.2023.102669</pub-id>, PMID: <pub-id pub-id-type="pmid">38141462</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<label>24</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rubio</surname> <given-names>IT</given-names></name>
<name><surname>Sobrido</surname> <given-names>C</given-names></name>
</person-group>. 
<article-title>Neoadjuvant approach in patients with early breast cancer: patient assessment, staging, and planning</article-title>. <source>Breast</source>. (<year>2022</year>) <volume>62</volume>:<page-range>S17&#x2013;24</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.breast.2021.12.019</pub-id>, PMID: <pub-id pub-id-type="pmid">34996668</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<label>25</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Straver</surname> <given-names>ME</given-names></name>
<name><surname>EJTh</surname> <given-names>R</given-names></name>
<name><surname>Rodenhuis</surname> <given-names>S</given-names></name>
<name><surname>SC</surname> <given-names>L</given-names></name>
<name><surname>CE</surname> <given-names>L</given-names></name>
<name><surname>Wesseling</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>The relevance of breast cancer subtypes in the outcome of neoadjuvant chemotherapy</article-title>. <source>Ann Surg Oncol</source>. (<year>2010</year>) <volume>17</volume>:<page-range>2411&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1245/s10434-010-1008-1</pub-id>, PMID: <pub-id pub-id-type="pmid">20373039</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<label>26</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Boughey</surname> <given-names>JC</given-names></name>
<name><surname>McCall</surname> <given-names>LM</given-names></name>
<name><surname>Ballman</surname> <given-names>KV</given-names></name>
<name><surname>Mittendorf</surname> <given-names>EA</given-names></name>
<name><surname>Ahrendt</surname> <given-names>GM</given-names></name>
<name><surname>Wilke</surname> <given-names>LG</given-names></name>
<etal/>
</person-group>. 
<article-title>Tumor biology correlates with rates of breast-conserving surgery and pathologic complete response after neoadjuvant chemotherapy for breast cancer: findings from the ACOSOG Z1071 (Alliance) prospective multicenter clinical trial</article-title>. <source>Ann Surg</source>. (<year>2014</year>) <volume>260</volume>:<page-range>608&#x2013;16</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/SLA.0000000000000924</pub-id>, PMID: <pub-id pub-id-type="pmid">25203877</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<label>27</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hage</surname> <given-names>AN</given-names></name>
<name><surname>Capriccioso</surname> <given-names>C</given-names></name>
<name><surname>Brennan</surname> <given-names>J</given-names></name>
<name><surname>Heiden</surname> <given-names>B</given-names></name>
<name><surname>Zheutlin</surname> <given-names>A</given-names></name>
<name><surname>Sabel</surname> <given-names>MS</given-names></name>
</person-group>. 
<article-title>Impact of neoadjuvant chemotherapy on surgical outcomes among patients with hormone receptor positive breast cancer</article-title>. <source>J Surg Oncol</source>. (<year>2017</year>) <volume>116</volume>:<page-range>665&#x2013;70</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/jso.24721</pub-id>, PMID: <pub-id pub-id-type="pmid">28672101</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<label>28</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Petruolo</surname> <given-names>OA</given-names></name>
<name><surname>Pilewskie</surname> <given-names>M</given-names></name>
<name><surname>Patil</surname> <given-names>S</given-names></name>
<name><surname>Barrio</surname> <given-names>AV</given-names></name>
<name><surname>Stempel</surname> <given-names>M</given-names></name>
<name><surname>Wen</surname> <given-names>HY</given-names></name>
<etal/>
</person-group>. 
<article-title>Standard pathologic features can be used to identify a subset of estrogen receptor-positive, HER2 negative patients likely to benefit from neoadjuvant chemotherapy</article-title>. <source>Ann Surg Oncol</source>. (<year>2017</year>) <volume>24</volume>:<page-range>2556&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1245/s10434-017-5898-z</pub-id>, PMID: <pub-id pub-id-type="pmid">28560596</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<label>29</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kim</surname> <given-names>HS</given-names></name>
<name><surname>Yoo</surname> <given-names>TK</given-names></name>
<name><surname>Park</surname> <given-names>WC</given-names></name>
<name><surname>Chae</surname> <given-names>BJ</given-names></name>
</person-group>. 
<article-title>Potential benefits of neoadjuvant chemotherapy in clinically node-positive luminal subtype<sup>&#x2013;</sup> breast cancer</article-title>. <source>J Breast Cancer</source>. (<year>2019</year>) <volume>22</volume>:<fpage>412</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4048/jbc.2019.22.e35</pub-id>, PMID: <pub-id pub-id-type="pmid">31598341</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<label>30</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lee</surname> <given-names>E-G</given-names></name>
<name><surname>Lee</surname> <given-names>D-E</given-names></name>
<name><surname>Kim</surname> <given-names>HH</given-names></name>
<name><surname>Han</surname> <given-names>JH</given-names></name>
<name><surname>Lee</surname> <given-names>S</given-names></name>
<name><surname>Kang</surname> <given-names>H-S</given-names></name>
<etal/>
</person-group>. 
<article-title>Androgen receptor as a predictive marker for pathologic complete response in hormone receptor&#x2013;positive and HER-2&#x2013;negative breast cancer with neoadjuvant chemotherapy</article-title>. <source>Cancer Res Treat</source>. (<year>2023</year>) <volume>55</volume>:<page-range>542&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.4143/crt.2022.834</pub-id>, PMID: <pub-id pub-id-type="pmid">36097802</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<label>31</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>J</given-names></name>
<name><surname>Wu</surname> <given-names>Q</given-names></name>
<name><surname>Yin</surname> <given-names>W</given-names></name>
<name><surname>Yang</surname> <given-names>L</given-names></name>
<name><surname>Xiao</surname> <given-names>B</given-names></name>
<name><surname>Wang</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>Development and validation of a radiopathomic model for predicting pathologic complete response to neoadjuvant chemotherapy in breast cancer patients</article-title>. <source>BMC Cancer</source>. (<year>2023</year>) <volume>23</volume>:<fpage>431</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12885-023-10817-2</pub-id>, PMID: <pub-id pub-id-type="pmid">37173635</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<label>32</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chen</surname> <given-names>RJ</given-names></name>
<name><surname>Ding</surname> <given-names>T</given-names></name>
<name><surname>Lu</surname> <given-names>MY</given-names></name>
<name><surname>Williamson</surname> <given-names>DFK</given-names></name>
<name><surname>Jaume</surname> <given-names>G</given-names></name>
<name><surname>Song</surname> <given-names>AH</given-names></name>
<etal/>
</person-group>. 
<article-title>Towards a general-purpose foundation model for computational pathology</article-title>. <source>Nat Med</source>. (<year>2024</year>) <volume>30</volume>:<page-range>850&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41591-024-02857-3</pub-id>, PMID: <pub-id pub-id-type="pmid">38504018</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<label>33</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hancock</surname> <given-names>JT</given-names></name>
<name><surname>Khoshgoftaar</surname> <given-names>TM</given-names></name>
</person-group>. 
<article-title>CatBoost for big data: an interdisciplinary review</article-title>. <source>J Big Data</source>. (<year>2020</year>) <volume>7</volume>:<fpage>94</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s40537-020-00369-8</pub-id>, PMID: <pub-id pub-id-type="pmid">33169094</pub-id>
</mixed-citation>
</ref>
<ref id="B34">
<label>34</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Freire-&#xc1;lvarez</surname> <given-names>E</given-names></name>
<name><surname>Ram&#xed;rez</surname> <given-names>IL</given-names></name>
<name><surname>Garc&#xed;a-Ramos</surname> <given-names>R</given-names></name>
<name><surname>Carrillo</surname> <given-names>F</given-names></name>
<name><surname>Santos-Garc&#xed;a</surname> <given-names>D</given-names></name>
<name><surname>G&#xf3;mez-Esteban</surname> <given-names>JC</given-names></name>
<etal/>
</person-group>. 
<article-title>Artificial intelligence for identification of candidates for device-aided therapy in Parkinson&#x2019;s disease: DELIST-PD study</article-title>. <source>Comput Biol Med</source>. (<year>2025</year>) <volume>185</volume>:<elocation-id>109504</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compbiomed.2024.109504</pub-id>, PMID: <pub-id pub-id-type="pmid">39637457</pub-id>
</mixed-citation>
</ref>
<ref id="B35">
<label>35</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shen</surname> <given-names>Z</given-names></name>
<name><surname>Chen</surname> <given-names>H</given-names></name>
<name><surname>Wang</surname> <given-names>W</given-names></name>
<name><surname>Xu</surname> <given-names>W</given-names></name>
<name><surname>Zhou</surname> <given-names>Y</given-names></name>
<name><surname>Weng</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>Machine learning algorithms as early diagnostic tools for pancreatic fistula following pancreaticoduodenectomy and guide drain removal: A retrospective cohort study</article-title>. <source>Int J Surg</source>. (<year>2022</year>) <volume>102</volume>:<elocation-id>106638</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ijsu.2022.106638</pub-id>, PMID: <pub-id pub-id-type="pmid">35500881</pub-id>
</mixed-citation>
</ref>
<ref id="B36">
<label>36</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>Y</given-names></name>
<name><surname>An</surname> <given-names>W</given-names></name>
<name><surname>Wang</surname> <given-names>C</given-names></name>
<name><surname>Liu</surname> <given-names>X</given-names></name>
<name><surname>Zhang</surname> <given-names>Q</given-names></name>
<name><surname>Zhang</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>Novel models based on machine learning to predict the prognosis of metaplastic breast cancer</article-title>. <source>Breast</source>. (<year>2025</year>) <volume>79</volume>:<elocation-id>103858</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.breast.2024.103858</pub-id>, PMID: <pub-id pub-id-type="pmid">39675092</pub-id>
</mixed-citation>
</ref>
<ref id="B37">
<label>37</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Czarnecka</surname> <given-names>AM</given-names></name>
<name><surname>Ostaszewski</surname> <given-names>K</given-names></name>
<name><surname>B&#x142;o&#x144;ski</surname> <given-names>PJ</given-names></name>
<name><surname>Szumera-Cie&#x107;kiewicz</surname> <given-names>A</given-names></name>
<name><surname>&#x15a;witaj</surname> <given-names>T</given-names></name>
<name><surname>Kozak</surname> <given-names>K</given-names></name>
<etal/>
</person-group>. 
<article-title>Long-term efficacy of neoadjuvant&#x2013;adjuvant targeted therapy in borderline resectable stage IIIB&#x2013;D and IV melanoma</article-title>. <source>Cancer</source>. (<year>2024</year>) <volume>130</volume>:<page-range>3463&#x2013;72</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cncr.35425</pub-id>, PMID: <pub-id pub-id-type="pmid">38843386</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<label>38</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rose</surname> <given-names>KM</given-names></name>
<name><surname>Pham</surname> <given-names>R</given-names></name>
<name><surname>Zacharias</surname> <given-names>NM</given-names></name>
<name><surname>Ionescu</surname> <given-names>F</given-names></name>
<name><surname>Paravathaneni</surname> <given-names>M</given-names></name>
<name><surname>Marchetti</surname> <given-names>KA</given-names></name>
<etal/>
</person-group>. 
<article-title>Neoadjuvant platinum-based chemotherapy and lymphadenectomy for penile cancer: an international, multi-institutional, real-world study</article-title>. <source>JNCI: J Natl Cancer Inst</source>. (<year>2024</year>) <volume>116</volume>:<page-range>966&#x2013;73</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/jnci/djae034</pub-id>, PMID: <pub-id pub-id-type="pmid">38366627</pub-id>
</mixed-citation>
</ref>
<ref id="B39">
<label>39</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Marm&#xe9;</surname> <given-names>F</given-names></name>
<name><surname>Solbach</surname> <given-names>C</given-names></name>
<name><surname>Michel</surname> <given-names>L</given-names></name>
<name><surname>Schneeweiss</surname> <given-names>A</given-names></name>
<name><surname>Blohmer</surname> <given-names>J-U</given-names></name>
<name><surname>Huober</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>Utility of the CPS + EG scoring system in triple-negative breast cancer treated with neoadjuvant chemotherapy</article-title>. <source>Eur J Cancer</source>. (<year>2021</year>) <volume>153</volume>:<page-range>203&#x2013;12</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ejca.2021.05.027</pub-id>, PMID: <pub-id pub-id-type="pmid">34186505</pub-id>
</mixed-citation>
</ref>
<ref id="B40">
<label>40</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kong</surname> <given-names>X</given-names></name>
<name><surname>Moran</surname> <given-names>MS</given-names></name>
<name><surname>Zhang</surname> <given-names>N</given-names></name>
<name><surname>Haffty</surname> <given-names>B</given-names></name>
<name><surname>Yang</surname> <given-names>Q</given-names></name>
</person-group>. 
<article-title>Meta-analysis confirms achieving pathological complete response after neoadjuvant chemotherapy predicts favourable prognosis for breast cancer patients</article-title>. <source>Eur J Cancer</source>. (<year>2011</year>) <volume>47</volume>:<page-range>2084&#x2013;90</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ejca.2011.06.014</pub-id>, PMID: <pub-id pub-id-type="pmid">21737257</pub-id>
</mixed-citation>
</ref>
<ref id="B41">
<label>41</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Collins</surname> <given-names>PM</given-names></name>
<name><surname>Brennan</surname> <given-names>MJ</given-names></name>
<name><surname>Elliott</surname> <given-names>JA</given-names></name>
<name><surname>Abd Elwahab</surname> <given-names>S</given-names></name>
<name><surname>Barry</surname> <given-names>K</given-names></name>
<name><surname>Sweeney</surname> <given-names>K</given-names></name>
<etal/>
</person-group>. 
<article-title>Neoadjuvant chemotherapy for luminal a breast cancer: Factors predictive of histopathologic response and oncologic outcome</article-title>. <source>Am J Surg</source>. (<year>2021</year>) <volume>222</volume>:<page-range>368&#x2013;76</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.amjsurg.2020.11.053</pub-id>, PMID: <pub-id pub-id-type="pmid">33334569</pub-id>
</mixed-citation>
</ref>
<ref id="B42">
<label>42</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hayashi</surname> <given-names>N</given-names></name>
<name><surname>Takahashi</surname> <given-names>Y</given-names></name>
<name><surname>Matsuda</surname> <given-names>N</given-names></name>
<name><surname>Tsunoda</surname> <given-names>H</given-names></name>
<name><surname>Yoshida</surname> <given-names>A</given-names></name>
<name><surname>Suzuki</surname> <given-names>K</given-names></name>
<etal/>
</person-group>. 
<article-title>The prognostic effect of changes in tumor stage and nodal status after neoadjuvant chemotherapy in each primary breast cancer subtype</article-title>. <source>Clin Breast Cancer</source>. (<year>2018</year>) <volume>18</volume>:<page-range>e219&#x2013;29</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.clbc.2017.09.013</pub-id>, PMID: <pub-id pub-id-type="pmid">29138067</pub-id>
</mixed-citation>
</ref>
<ref id="B43">
<label>43</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Xu</surname> <given-names>H</given-names></name>
<name><surname>Wang</surname> <given-names>M</given-names></name>
<name><surname>Shi</surname> <given-names>D</given-names></name>
<name><surname>Qin</surname> <given-names>H</given-names></name>
<name><surname>Zhang</surname> <given-names>Y</given-names></name>
<name><surname>Liu</surname> <given-names>Z</given-names></name>
<etal/>
</person-group>. 
<article-title>When multiple instance learning meets foundation models: Advancing histological whole slide image analysis</article-title>. <source>Med Img Anal</source>. (<year>2025</year>) <volume>101</volume>:<elocation-id>103456</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.media.2025.103456</pub-id>, PMID: <pub-id pub-id-type="pmid">39842326</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/154155">Sharon R Pine</ext-link>, University of Colorado Anschutz Medical Campus, United States</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/471979">Marko Radulovic</ext-link>, Institute of Oncology and Radiology of Serbia, Serbia</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2944074">Solmaz Sohrabei</ext-link>, Shahid Beheshti University of Medical Sciences, Iran</p></fn>
</fn-group>
</back>
</article>