<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" dtd-version="1.3" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Med.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Medicine</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Med.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-858X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmed.2025.1731854</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>BOBM: an adaptive deep learning framework for extended-window sepsis prediction with cross-institutional generalizability</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Li</surname> <given-names>Wanxuan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Xiao</surname> <given-names>Kai</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/3123842"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Gu</surname> <given-names>Boyuan</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Zheng</surname> <given-names>Haoyu</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Shao</surname> <given-names>Dan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Mo</surname> <given-names>Ren</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/2045208"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Wu</surname> <given-names>Qiang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Yang</surname> <given-names>Qiong</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/1606286"/>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>School of Medicine, South China University of Technology</institution>, <city>Guangzhou</city>, <country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>Department of Urology, Hohhot First Hospital</institution>, <city>Hohhot</city>, <country country="cn">China</country></aff>
<aff id="aff3"><label>3</label><institution>Institutes of Biomedical Sciences, Inner Mongolia University</institution>, <city>Hohhot</city>, <country country="cn">China</country></aff>
<aff id="aff4"><label>4</label><institution>Department of Urology, Inner Mongolia People&#x00027;s Hospital, Inner Mongolia Urological Institute</institution>, <city>Hohhot</city>, <country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>&#x0002A;</label>Correspondence: Qiang Wu, <email xlink:href="mailto:wuqiang190@163.com">wuqiang190@163.com</email>; Qiong Yang, <email xlink:href="mailto:yangq@scut.edu.cn">yangq@scut.edu.cn</email></corresp>
<fn fn-type="equal" id="fn001"><label>&#x02020;</label><p>These authors have contributed equally to this work</p></fn></author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-01-15">
<day>15</day>
<month>01</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2025</year>
</pub-date>
<volume>12</volume>
<elocation-id>1731854</elocation-id>
<history>
<date date-type="received">
<day>24</day>
<month>10</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>16</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>16</day>
<month>12</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2026 Li, Xiao, Gu, Zheng, Shao, Mo, Wu and Yang.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Li, Xiao, Gu, Zheng, Shao, Mo, Wu and Yang</copyright-holder>
<license>
<ali:license_ref start_date="2026-01-15">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Sepsis, a life-threatening and costly condition, necessitates early detection for effective management. However, diagnostic and therapeutic delays are common. Furthermore, sepsis complexity and dynamics challenge existing early warning systems, impeding timely intervention.</p>
</sec>
<sec>
<title>Methods</title>
<p>In this study, we introduce the Bayes-Optimized Boosting-Mamba Tab Model (BOBM), a novel deep learning-based algorithm that incorporates a bidirectional optimization learning mechanism within an ensemble framework. We designed dynamic agent models to enhance computational efficiency and adaptability across diverse clinical scenarios. Additionally, the model architecture was optimized for different temporal phases to enable a more precise estimation of the timing and progression of sepsis risk. To improve interpretability, we implemented SHapley Additive exPlanations value analysis, providing clinicians with actionable insights into potential patterns of sepsis progression.</p>
</sec>
<sec>
<title>Results</title>
<p>The experimental evaluation demonstrated that our model attained the highest AUC (AUC: 0.86&#x02013;0.95) in the MIMIC-IV dataset across different temporal windows prior to sepsis onset, confirming its adaptability and robust generalizability across various prediction timeframes. Furthermore, the model demonstrated superior performance (AUC: 0.978&#x02013;0.982) when validated on two independent large-scale external datasets.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>In contrast to traditional prediction approaches, our model extends the potential intervention timeframe significantly, while incorporating dynamic monitoring capabilities spanning the 7- to 28-day window before clinical suspicion, thereby establishing a foundation for regional sepsis surveillance systems.</p>
</sec></abstract>
<kwd-group>
<kwd>critical care</kwd>
<kwd>deep learning</kwd>
<kwd>learning algorithms</kwd>
<kwd>predictive medicine</kwd>
<kwd>sepsis</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This work was supported in part by the Fundamental Research Funds for the Central Universities.</funding-statement>
</funding-group>
<counts>
<fig-count count="7"/>
<table-count count="3"/>
<equation-count count="11"/>
<ref-count count="62"/>
<page-count count="17"/>
<word-count count="11696"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Intensive Care Medicine and Anesthesiology</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<label>1</label>
<title>Introduction</title>
<p>Sepsis, a severe condition triggered by infection and characterized by organ dysfunction stemming from a dysregulated host response, can rapidly escalate to a life-threatening state. Globally, sepsis affects nearly 49 million individuals annually, leading to approximately 11 million deaths. Each hour of delayed treatment for sepsis patients significantly elevates the risk of mortality, underscoring the critical importance of early diagnosis in reducing adverse outcomes.</p>
<p>Currently, diagnostic methods for sepsis primarily rely on blood culture reports, followed by molecular diagnostic techniques (<xref ref-type="bibr" rid="B1">1</xref>). Blood culture, considered the &#x0201C;gold standard,&#x0201D; is predicated on the detection of viable microorganisms in the bloodstream (<xref ref-type="bibr" rid="B2">2</xref>). This approach, however, necessitates multi-step analyses, rendering it time-consuming and resource-intensive. Contemporary blood culture processing is largely automated through continuous monitoring of blood culture systems (<xref ref-type="bibr" rid="B2">2</xref>). Obtaining a positive signal in the early stages of the disease typically requires 24&#x02013;48 h, with subsequent confirmatory steps including Gram staining, preliminary antimicrobial susceptibility testing (AST), and biochemical identification. While rapid phenotypic tests can identify common pathogens within 18&#x02013;24 h, their sensitivity is suboptimal for slow-growing organisms such as yeasts and anaerobic bacteria. Although automated short-term subcultures can yield reliable AST results, the time to positivity for blood cultures in most bacterial infections exceeds 11 h (<xref ref-type="bibr" rid="B3">3</xref>), exclusive of the time required for subsequent definitive identification.</p>
<p>Moreover, while molecular diagnostic techniques can yield results several hours sooner than culture-based methods, their operation necessitates medically trained personnel, and their deployment is often hampered by a lack of portability (<xref ref-type="bibr" rid="B1">1</xref>). Consequently, their clinical utility is further constrained. Many rapid diagnostic strategies depend on a single biomarker (<xref ref-type="bibr" rid="B4">4</xref>), yet the diagnostic thresholds for such markers are frequently ill-defined or lack specificity. The utility of existing early warning scoring systems remains contentious. Clinical diagnosis often relies heavily on physician experience, which can lead to misdiagnosis or delayed diagnosis, thereby impeding the effective implementation of timely, accurate alerts and personalized therapeutic interventions (<xref ref-type="bibr" rid="B5">5</xref>). Presently, no single biomarker or technology can rapidly and accurately diagnose sepsis, compelling continued reliance on clinical symptom assessment and organ function monitoring for diagnosis (<xref ref-type="bibr" rid="B6">6</xref>).</p>
<p>The uneven distribution of medical resources further exacerbates the disease burden of sepsis, particularly in low- and middle-income countries where sepsis incidence is high. These regions exhibit significant heterogeneity in public health and emergency medical system capabilities, posing challenges to timely sepsis detection. Limited microbiological diagnostic capacity in resource-constrained settings restricts the implementation of precision antimicrobial therapy based on local pathogen spectra and resistance patterns (<xref ref-type="bibr" rid="B7">7</xref>). Constraints on diagnostic capacity encompass not only laboratory infrastructure and reagent availability, but also the staffing of qualified technical personnel, quality control systems, and the efficiency of multidisciplinary team collaboration. Consequently, there is an urgent need to develop more rapid and accurate diagnostic tools for sepsis.</p>
<p>The challenges in identifying sepsis have spurred the development of various clinical decision-support tools (<xref ref-type="bibr" rid="B8">8</xref>). To overcome the limitations of traditional predictive methods, statistical and mathematical models have been increasingly integrated into medical research (<xref ref-type="bibr" rid="B9">9</xref>). In particular, logistic regression (LR) and Cox proportional hazards regression initially dominated clinical applications due to their interpretability and robustness (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B62">62</xref>), with techniques such as LASSO addressing variable selection challenges in high-dimensional settings (<xref ref-type="bibr" rid="B11">11</xref>). However, these conventional methods are often challenged by the inherent scale, complexity, and non-linear dynamics of large clinical datasets, particularly for intricate diseases such as sepsis (<xref ref-type="bibr" rid="B12">12</xref>). Furthermore, traditional research has often prioritized the identification of risk factors based on statistical significance level, while overlooking the overall predictive performance of the models (<xref ref-type="bibr" rid="B13">13</xref>). Consequently, to enhance the capability of identifying complex patterns from high-dimensional, non-linear data and to mitigate the influence of subjective bias in diagnosis, machine learning and deep learning models have been trained using data from individual patient electronic health records (EHRs); such objective clinical data are less reliant on provider behavior and thus offer higher reliability (<xref ref-type="bibr" rid="B14">14</xref>).</p>
<p>Advanced machine learning (ML) algorithms, such as Random Forest and XGBoost, have demonstrated potential in processing large-scale electronic medical record (EMR) data and capturing non-linear relationships (AUROC values &#x0007E;0.89), achieving predictive accuracy superior to traditional methods (<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B16">16</xref>). For instance, recent studies by Li et al. (<xref ref-type="bibr" rid="B17">17</xref>) and Richter-Laskowska et al. (<xref ref-type="bibr" rid="B18">18</xref>) have empirically validated the superiority of these non-linear and ensemble architectures over standard statistical baselines in cardiovascular and cognitive assessments. Furthermore, the integration of textual data can further enhance performance (<xref ref-type="bibr" rid="B19">19</xref>), as demonstrated by Adamson et al. (<xref ref-type="bibr" rid="B20">20</xref>) in the extraction of deep clinical phenotypes from unstructured notes.</p>
<p>However, ML methods still face challenges in handling data noise, ensuring cross-institutional generalizability, and their dependence on data quality (<xref ref-type="bibr" rid="B21">21</xref>&#x02013;<xref ref-type="bibr" rid="B23">23</xref>). These limitations underscore the necessity for developing more robust and adaptable predictive methods, thereby creating research opportunities for novel algorithms capable of integrating temporal information and handling heterogeneous data. Recent frameworks, such as that of Ramakrishnaiah et al. (<xref ref-type="bibr" rid="B24">24</xref>), specifically aim to mitigate these issues through the deployment of robust preprocessing and standardization pipelines. Deep learning (DL), leveraging its end-to-end learning capabilities to automatically extract high-level features (<xref ref-type="bibr" rid="B25">25</xref>), has demonstrated significant potential in sepsis prediction. Models such as Long Short-Term Memory (LSTM) networks effectively capture temporal dynamics (AUC &#x02265; 0.85) (<xref ref-type="bibr" rid="B26">26</xref>), while the COMPOSER model (AUC 0.925&#x02013;0.953) has shown excellent generalization and capability in addressing data-related challenges (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B28">28</xref>). Beyond traditional RNNs, recent advancements in 2024 have introduced more sophisticated architectures for heterogeneous EHR data. For instance, the FairCare framework employs an ethnicity-heterogeneous graph neural network (GNN) with adversarial training to mitigate bias while maintaining high predictive accuracy (AUROC &#x0003E; 0.90) in mortality prediction tasks (<xref ref-type="bibr" rid="B29">29</xref>). Similarly, Nigo et al. (<xref ref-type="bibr" rid="B30">30</xref>) demonstrated that deep learning models like PyTorch_EHR can effectively leverage time-series categorical data for personalized risk stratification, outperforming traditional logistic regression.</p>
<p>Although DL models are particularly adept at handling heterogeneous and high-dimensional time-series data (<xref ref-type="bibr" rid="B31">31</xref>), many existing methods are associated with high computational costs, limiting their deployment in resource-constrained settings. In this context, Transformer architectures (<xref ref-type="bibr" rid="B32">32</xref>) have gained prominence for long-sequence modeling, exemplified by the novel MedAlbert model (<xref ref-type="bibr" rid="B33">33</xref>) which utilizes deep pathway representations for enhanced diagnostic accuracy, alongside models like DTAE (AUC 97.98%) (<xref ref-type="bibr" rid="B34">34</xref>, <xref ref-type="bibr" rid="B35">35</xref>).</p>
<p>In recent years, the Mamba model, with its linear time complexity, has effectively addressed the efficiency bottleneck of Transformers in processing ultra-long sequences, providing a lightweight solution for clinical sequence analysis. Mamba outperforms RNNs and Transformers in terms of memory efficiency and scalability, making it particularly suitable for genomics and complex clinical long-sequence data. For high-risk diagnostic tasks such as sepsis, accurately capturing the dynamic patterns of clinical temporal data is crucial.</p>
<p>The strengths and limitations of these methods have inspired our further research, as developing a predictive system that combines high sensitivity and specificity for reliable early sepsis detection remains a critical challenge requiring urgent attention.</p>
<p>Despite achieving high accuracy, deep learning models&#x00027; &#x0201C;black box&#x0201D; nature hinders physicians&#x00027; understanding of the decision-making logic, thereby impeding clinical adoption. Furthermore, many models rely on laboratory test data, which typically exhibits significant changes only when patients&#x00027; conditions have progressed to advanced stages, rendering early identification challenging.</p>
<p>Most existing models are trained on single datasets (<xref ref-type="bibr" rid="B36">36</xref>) and lack validation across different hospitals and populations. Given the complex and diverse clinical manifestations of sepsis (<xref ref-type="bibr" rid="B21">21</xref>) and the heterogeneity between studies, these models experience performance degradation in alternative settings. Moreover, early warning systems are predominantly limited to simple binary classification predictions, overlooking the variability in clinical decision-making across different time windows, thus failing to meet clinical requirements for dynamic risk management throughout different stages of sepsis progression.</p>
<p>To address these challenges, we propose an innovative sepsis prediction model that integrates Boosting techniques with the Mamba-Tab framework, achieving enhanced accuracy and an extended window for early intervention. The key innovations of our proposed model include:</p>
<p>(1) We present a deep integration of Boosting with the state space model Mamba Tab, marking the first incorporation of structured state-space equations into the Boosting framework. We model the evolution of sample weights using the differential equation <italic>h</italic>&#x02032;(<italic>t</italic>) &#x0003D; <italic>f</italic>(<italic>h, x</italic>; &#x003B8;), and we theoretically establish that the VC dimension upper bound is <italic>O</italic>(log<italic>n</italic>), which is superior to the <italic>O</italic>(<italic>d</italic>log<italic>n</italic>) bound of traditional decision tree-based models.</p>
<p>(2) We introduce a bidirectional learning approach guided by Bayesian Optimization (BO). This approach employs a forward-backward optimization mechanism: during the forward pass, model parameters are updated using gradient descent; concurrently, or in a distinct phase, Bayesian inference is utilized to optimize the hyperparameter space. Implemented on standard UCI datasets, this mechanism demonstrated a 62% reduction in the hyperparameter search space. Specifically, we utilize an Incremental Bayesian Optimization (IBO) strategy, which leverages historical iteration data to dynamically construct the surrogate model. This specific approach leads to a reduction of over 40% in the required number of hyperparameter evaluations.</p>
<p>(3) We introduce a dynamic multi-paradigm integration mechanism that facilitates the seamless fusion of diverse ensemble paradigms, including Gradient Boosting, Adaptive Boosting, and Random Forests. This integration is designed to enhance computational efficiency and scalability.</p>
<p>Our methodology involves optimizing the model architecture across different temporal phases, thereby refining sepsis risk stratification and enhancing applicability in clinical settings. Additionally, we conducted comprehensive interpretability analyses to facilitate the development of a more clinically actionable decision support system for healthcare practitioners.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<label>2</label>
<title>Materials and methods</title>
<sec>
<label>2.1</label>
<title>Model construction</title>
<p>Our proposed framework, the Bayes-Optimized Boosting-Mamba Tab, integrates three advanced methodological components to address the challenges of clinical tabular data, such as high dimensionality, long-range dependencies across features, and class imbalance.</p>
<sec>
<label>2.1.1</label>
<title>Mamba tab</title>
<p>Traditional clinical modeling often relies on Recurrent Neural Networks (RNNs) or Transformers. However, RNNs struggle with computational efficiency on long sequences, while Transformers entail high memory costs. To address this, we employ Mamba Tab. An overview of the Mamba Tab architecture is shown in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig position="float" id="F1">
<label>Figure 1</label>
<caption><p>Framing of the Mamba Tab.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1731854-g0001.tif">
<alt-text content-type="machine-generated">Diagram showing a data processing workflow. On the left, a sample dataset with features and target values undergoes normalization and categorical encoding. It is then transformed by an embedding layer followed by layer normalization. On the right, the Mamba architecture includes linear projections, a convolutional layer, an SSM block, and nonlinear activations. The process concludes with a fully connected layer producing the output. Symbols indicate ReLU and SiLU activations, as well as nonlinearity through multiplication.</alt-text>
</graphic>
</fig>
<p>Mamba Tab is an extension of Mamba (<xref ref-type="bibr" rid="B37">37</xref>), specifically optimized for regression tasks involving tabular data. It integrates the principles of gating mechanisms, thereby enhancing feature selection and controlling information flow. This contributes to its superior performance in tabular data modeling.</p>
<p>Conceptually, Mamba Tab (<xref ref-type="bibr" rid="B12">12</xref>) treats patient data rows (or transformed columns) as sequences. Unlike static models, it utilizes a rmed columns) as sequences. data. It integrates the principles of gating mechanisms, thereby enhancing feature selection and controlling information flow. This contributes to its superior performance in tabular dantageous for medical records, where distinguishing significant clinical indicators from background variability is crucial for accurate diagnosis.</p>
<p>Detailed mathematical derivations of the State Space Model (<xref ref-type="bibr" rid="B38">38</xref>, <xref ref-type="bibr" rid="B39">39</xref>), discretization, and gating mechanisms are provided in <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>.</p>
</sec>
<sec>
<label>2.1.2</label>
<title>Boosting</title>
<p>To enhance predictive performance and generalizability, we integrate Mamba Tab within a Boosting framework. Boosting is an ensemble learning methodology that sequentially combines multiple &#x0201C;weak learners&#x0201D; (base models) to construct a robust &#x0201C;strong learner&#x0201D; (<xref ref-type="bibr" rid="B40">40</xref>).</p>
<p>In the context of clinical decision support, datasets often contain patient subgroups with subtle symptoms or complex feature interactions that are difficult to diagnose. Boosting addresses this by utilizing an iterative reweighting framework to enhance performance specifically on these &#x0201C;difficult-to-classify&#x0201D; instances.</p>
<p>In our approach, the algorithm iteratively trains the Mamba Tab model. In each round, it assigns higher weights to patient samples that were misclassified in the previous round. This mechanism forces the model to focus on &#x0201C;hard-to-diagnose&#x0201D; cases, effectively reducing bias and variance. The final prediction is an aggregate of these weighted learners. The specific weight update formulas (<xref ref-type="bibr" rid="B41">41</xref>) and ensemble strategies are detailed in <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>.</p>
</sec>
<sec>
<label>2.1.3</label>
<title>Bayesian optimization</title>
<p>Both the Mamba Tab encoder and the Boosting ensemble involve several hyperparameters (e.g., number of layers, hidden dimensions, learning rate, number of boosting rounds, tree depth). Manually tuning these hyperparameters is computationally expensive and subjective. We therefore use Bayesian optimization (BO) to automatically identify configurations that maximize predictive performance. BO constructs a probabilistic surrogate model (typically a Gaussian Process) to approximate the relationship between hyperparameters and model performance (<xref ref-type="bibr" rid="B42">42</xref>, <xref ref-type="bibr" rid="B43">43</xref>). By using an acquisition function to balance exploration (trying new parameter regions) and exploitation (refining promising regions), BO efficiently identifies the global optimal configuration with minimal computational cost (<xref ref-type="bibr" rid="B44">44</xref>) (<xref ref-type="fig" rid="F2">Figure 2</xref>). The mathematical definitions of the Gaussian Process kernels and acquisition functions are provided in <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>.</p>
<fig position="float" id="F2">
<label>Figure 2</label>
<caption><p>Illustration of Bayesian optimization.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1731854-g0002.tif">
<alt-text content-type="machine-generated">Graph depicting a Gaussian process regression model. It includes observed data points marked by red dots, a true function in yellow, the GP mean in a solid line, and a confidence interval shaded in light blue. A current acquisition function line is also shown with a peak marked as the maximum of the current acquisition function.</alt-text>
</graphic>
</fig>
</sec>
<sec>
<label>2.1.4</label>
<title>Bayes-optimized boosting-mamba tab model</title>
<p>The Mamba Tab architecture implements dynamic optimization using a three-stage iterative framework (illustrated in <xref ref-type="fig" rid="F3">Figure 3</xref>). In this architecture, Mamba Tab serves as the foundational &#x0201C;weak learner&#x0201D; due to its superior capability in extracting features from longitudinal or complex tabular medical data.</p>
<fig position="float" id="F3">
<label>Figure 3</label>
<caption><p>Framing of the Boosting-Mamba Tab model.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1731854-g0003.tif">
<alt-text content-type="machine-generated">Flowchart illustrating a machine learning process with two main sections: &#x0201C;Bayes&#x0201D; and &#x0201C;Mamba Tab.&#x0201D; The Bayes section shows data being divided into subsets, processed, and weighted models. The Mamba Tab section details a layered neural network architecture, with a sample dataset feeding into a system involving embeddings, layer normalization, and linear projections. Includes diagrams for boosting types, learning rates, feature selection, and activation functions, with different convolutions and outputs. The illustration is complex, emphasizing data processing and modeling procedures.</alt-text>
</graphic>
</fig>
<p><xref ref-type="fig" rid="F3">Figure 3</xref> illustrates our Boosting-Mamba Tab model enhanced by Bayesian optimization. Conceptually, the model works in three main steps:</p>
<p>(1) The dataset is repeatedly resampled and reweighted so that misclassified or high-risk patients receive higher weights.</p>
<p>(2) Each weighted subset is fed into a weak learner block to extract rich feature representations and generate predictions.</p>
<p>(3) A Bayesian optimization module adaptively selects the boosting strategy and hyperparameters that yield the best validation performance.</p>
<p>From a clinical perspective, this design allows the model to progressively focus on the most difficult-to-predict cases, while automatically tuning itself to the specific characteristics of the ICU/anesthesiology dataset, rather than relying on manual trial-and-error.</p>
<sec>
<label>2.1.4.1</label>
<title>Boosting-driven sample reweighting</title>
<p>At the start, all patients are assigned equal importance, with initial sample weights <inline-formula><mml:math id="M1"><mml:msubsup><mml:mrow><mml:mi>w</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>/</mml:mo><mml:mi>n</mml:mi></mml:math></inline-formula>, where <italic>n</italic> represents the total number of samples. During the <italic>t</italic>-th iteration, we update the weight distribution based on the prediction errors of weak learners (<xref ref-type="disp-formula" rid="EQ1">Equation 1</xref>):</p>
<disp-formula id="EQ1"><mml:math id="M2"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msubsup><mml:mrow><mml:mi>w</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msubsup><mml:mrow><mml:mi>w</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msubsup><mml:mo class="qopname">exp</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mo>-</mml:mo><mml:msub><mml:mrow><mml:mi>&#x003B1;</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:msubsup><mml:mrow><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x0005E;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>Z</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac><mml:mo>,</mml:mo><mml:mtext>&#x02003;</mml:mtext><mml:msub><mml:mrow><mml:mi>&#x003B1;</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:mfrac><mml:mo class="qopname">ln</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mrow><mml:mo stretchy="true">(</mml:mo><mml:mrow><mml:mfrac><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mrow><mml:mi>&#x000F2;</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>&#x000F2;</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac></mml:mrow><mml:mo stretchy="true">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(1)</label></disp-formula>
<p>Herein, <italic>Z</italic> denotes the normalization factor, and &#x000F2;<sub><italic>t</italic></sub> represents the weighted error rate. where <italic>y</italic><sub><italic>i</italic></sub> is the true label of the <italic>i</italic>-th sample and <inline-formula><mml:math id="M3"><mml:msubsup><mml:mrow><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x0005E;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> is the prediction of the <italic>t</italic>-th weak learner <italic>h</italic><sub><italic>t</italic></sub> on this sample. This mechanism increases the weights of misclassified samples through exponential weighting, thus directing subsequent learners to focus on challenging instances near the decision boundary.</p>
</sec>
<sec>
<label>2.1.4.2</label>
<title>Dynamic multi-paradigm ensemble (meta-learning)</title>
<p>A distinct advantage of our framework, from a data analysis perspective, is its flexibility. Traditional ensemble methods usually rely on a fixed paradigm (e.g., only Gradient Boosting or only Random Forest). However, clinical datasets vary significantly in terms of noise, sample size, and class imbalance. To address this, we employ a heterogeneous set of Boosting Types, denoted as H &#x0003D; {XGBoost, LightGBM, RF, GBDT}. A Bayesian approach is employed to dynamically determine the ensemble strategy, which may operate in modes such as:</p>
<list list-type="simple">
<list-item><p>(1) Gradient Boosting Mode: Focuses on minimizing the residual errors of the loss function (<xref ref-type="disp-formula" rid="EQ2">Equation 2</xref>).</p></list-item>
</list>
<disp-formula id="EQ2"><mml:math id="M4"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x0005E;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x0005E;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x0002B;</mml:mo><mml:mi>&#x003B7;</mml:mi><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(2)</label></disp-formula>
<p>where &#x00177;<sub><italic>t</italic></sub>(<italic>x</italic>) denotes the aggregated prediction at iteration <italic>t</italic> for input <italic>x</italic>, <italic>h</italic><sub><italic>t</italic></sub> is the <italic>t</italic>-th base learner, and &#x003B7;&#x0003E;0 is the learning rate.</p>
<list list-type="simple">
<list-item><p>(2) AdaBoost Mode: Focuses on reweighting misclassified samples to prioritize hard-to-diagnose cases (<xref ref-type="disp-formula" rid="EQ3">Equation 3</xref>).</p></list-item>
</list>
<disp-formula id="EQ3"><mml:math id="M5"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x0005E;</mml:mo></mml:mover><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mo class="qopname">sign</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>&#x003B1;</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(3)</label></disp-formula>
<p>where &#x003B1;<sub><italic>t</italic></sub> is the weight of the <italic>t</italic>-th weak learner as defined in (<xref ref-type="disp-formula" rid="EQ1">Equation 1</xref>), and <italic>T</italic> denotes the total number of boosting rounds.</p>
<list list-type="simple">
<list-item><p>(3) Random Forest Mode: Focuses on variance reduction through bagging (<xref ref-type="disp-formula" rid="EQ4">Equation 4</xref>).</p></list-item>
</list>
<disp-formula id="EQ4"><mml:math id="M6"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x0005E;</mml:mo></mml:mover><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>B</mml:mi></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>b</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>B</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>b</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(4)</label></disp-formula>
<p>where <italic>h</italic><sub><italic>b</italic></sub> denotes the <italic>b</italic>-th tree in the random forest and <italic>B</italic> is the number of trees. The final prediction is obtained by averaging the outputs of all trees.</p>
<p>During the training phase, the Bayesian optimizer simultaneously tunes the hyperparameters (e.g., Learning Rate, Feature Select) and selects the ensemble mode that yields the highest validation accuracy. This &#x0201C;meta-learning&#x0201D;eta-learnings the ensemble mode that yields the highest v&#x02014;effectively customizing the mathematical structure of the classifier to fit the unique disease profile being analyzed, thereby mitigating the limitations inherent in fixed-paradigm methods. The selection probability is modeled as (<xref ref-type="disp-formula" rid="EQ5">Equation 5</xref>).</p>
<disp-formula id="EQ5"><mml:math id="M7"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>P</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x0221D;</mml:mo><mml:mo class="qopname">exp</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>&#x003B7;</mml:mi><mml:mo>&#x000B7;</mml:mo><mml:mtext class="textrm" mathvariant="normal">Perf</mml:mtext><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(5)</label></disp-formula>
<p>Here, <italic>h</italic><sub><italic>j</italic></sub>&#x02208; H denotes the <italic>j</italic>-th boosting type in the heterogeneous set H &#x0003D; {XGBoost, LightGBM, RF, GBDT}. Perf(<italic>h</italic><sub><italic>j</italic></sub>, <italic>x</italic>) denotes the performance of boosting type</p>
<p><italic>h</italic><sub><italic>j</italic></sub> evaluated on configuration <italic>x</italic>. Where the sensitivity parameter &#x003B7;&#x02208;[10<sup>&#x02212;5</sup>, 0.1] and potentially associated feature selection strategies are adaptively tuned using Bayesian Optimization.</p>
</sec>
<sec>
<label>2.1.4.3</label>
<title>MambaTab feature engine</title>
<p>We adopt Mamba Tab as the foundational learner in our approach. Mamba Tab is a model based on gating mechanisms, with its effectiveness validated in tabular data regression tasks.</p>
<p>Mamba Tab integrates a gated feature processing module, formulated as <xref ref-type="disp-formula" rid="EQ6">Equation 6</xref>:</p>
<disp-formula id="EQ6"><mml:math id="M8"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mtext class="textrm" mathvariant="normal">M</mml:mtext><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi><mml:mo>;</mml:mo><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mtext class="textrm" mathvariant="normal">LayerNorm</mml:mtext><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mtext class="textrm" mathvariant="normal">SSM</mml:mtext><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>r</mml:mi><mml:mi>o</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x0002B;</mml:mo><mml:mtext class="textrm" mathvariant="normal">GELU</mml:mtext><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>W</mml:mi></mml:mrow><mml:mrow><mml:mi>g</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>e</mml:mi></mml:mrow></mml:msub><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(6)</label></disp-formula>
<p>where <italic>x</italic>&#x02208;&#x0211D;<sup><italic>d</italic></sup> denotes the input feature vector, and &#x003B8; &#x0003D; {<italic>W</italic><sub><italic>agg</italic></sub>, <italic>W</italic><sub><italic>gate</italic></sub>, SSM parameters} collects all learnable parameters of the Mamba Tab module. In this equation, SSM represents the Structured State Space Model, and <italic>W</italic><sub><italic>oroj</italic></sub>, <italic>W</italic><sub><italic>gate</italic></sub> are trainable weight matrices. The gating network facilitates the dynamic modulation of feature flow.</p>
<p>The Mamba Tab module employs state-space equations to explicitly capture long-range dependencies among features (<xref ref-type="disp-formula" rid="EQ7">Equation 7</xref>):</p>
<disp-formula id="EQ7"><mml:math id="M9"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msup><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>&#x02032;</mml:mi></mml:mrow></mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mi>A</mml:mi><mml:mi>h</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x0002B;</mml:mo><mml:mi>B</mml:mi><mml:mi>x</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo><mml:mtext>&#x02003;</mml:mtext><mml:mi>y</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mi>C</mml:mi><mml:mi>h</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(7)</label></disp-formula>
<p>where <inline-formula><mml:math id="M10"><mml:mi>h</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>d</mml:mi></mml:mrow><mml:mrow><mml:mi>h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup></mml:math></inline-formula> denotes the hidden state at time step <italic>t</italic>, <italic>h</italic>&#x02032;(<italic>t</italic>) is its temporal derivative in continuous time, <italic>x</italic>(<italic>t</italic>)&#x02208;&#x0211D;<sup><italic>d</italic></sup> is the input at time <italic>t</italic>, and <inline-formula><mml:math id="M11"><mml:mi>y</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>&#x0211D;</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>d</mml:mi></mml:mrow><mml:mrow><mml:mi>y</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup></mml:math></inline-formula> is the corresponding output, <italic>A, B</italic>, and <italic>C</italic> are learnable parameter matrices. Combined with the gating mechanisms, this enables the dynamic integration of local features with global context.</p>
</sec>
</sec>
</sec>
<sec>
<label>2.2</label>
<title>Dataset</title>
<p>Data were sourced from MIMIC-IV (v2.2), containing anonymized records of 53,150 BIDMC ICU admissions (2008&#x02013;2019) (<xref ref-type="bibr" rid="B45">45</xref>). This dataset, accessed via PhysioNet, provides multi-dimensional temporal clinical data. Key updates from MIMIC-III include a modular structure and extended coverage (<xref ref-type="bibr" rid="B46">46</xref>).</p>
<p>The MIMIC-IV database was accessed upon fulfillment of the required Collaborative Institutional Training Initiative (CITI) program requirements (Record ID: 64960229). Ethics clearance for this research was obtained from the Institutional Review Boards at Beth Israel Deaconess Medical Center (Boston, MA) and the Massachusetts Institute of Technology (Cambridge, MA).</p>
<sec>
<label>2.2.1</label>
<title>Variable selection of the dataset</title>
<p>Data pertaining to forty-nine clinical variables were retrieved from the institution&#x00027;s Electronic Medical Record (EMR) system (see <xref ref-type="supplementary-material" rid="SM1">Supplementary Table S1</xref>). This dataset encompassed demographic characteristics, vital signs.</p>
</sec>
<sec>
<label>2.2.2</label>
<title>Data processing</title>
<sec>
<label>2.2.2.1</label>
<title>Definition of sepsis</title>
<p>The present investigation adheres to the diagnostic guidelines established by the Third International Consensus Definitions for Sepsis and Septic Shock (Sepsis-3) (<xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B47">47</xref>). According to these definitions, sepsis is characterized as a life-threatening organ dysfunction precipitated by a dysregulated host response to infection. A key tenet of the Sepsis-3 framework is its prioritization of infection-induced organ dysfunction over the conventional Systemic Inflammatory Response Syndrome (SIRS) criteria. Diagnosis requires: (1) evidence of infection or suspected infection, and (2) an acute change in the total Sequential Organ Failure Assessment (SOFA) score of &#x02265;2 points from baseline, attributable to the infection. Organ dysfunction is assessed based on the temporal association between infection and SOFA score changes.</p>
</sec>
<sec>
<label>2.2.2.2</label>
<title>Study population</title>
<p>Study participants must have satisfied Sepsis-3 diagnostic parameters, characterized by evidence or suspicion of infection coupled with an elevation of at least 2 points in the Sequential Organ Failure Assessment (SOFA) score relative to pre-infection values. The study population was restricted to adult subjects (18 years and older) experiencing their initial intensive care unit admission within the current hospitalization period, thereby eliminating variables associated with prior critical care exposure. Furthermore, patients needed an ICU length of stay (LOS) of &#x02265;24 h to exclude early mortality bias and ensure sufficient observation time for key interventions. Exclusion criteria comprised: periods of data interruption &#x02265;24 h, a palliative care designation, or missingness exceeding 15% for pre-defined key variables. We also excluded inpatient admissions longer than 50 days. Initially, 74,811 ICU admissions were screened; following the application of these criteria, 2,599 eligible patients were included in the final cohort.</p>
</sec>
</sec>
<sec>
<label>2.2.3</label>
<title>Patient cohort</title>
<p>Existing sepsis prediction models frequently lack temporal specificity, hindering their ability to discern the dynamic variations in sepsis risk across different phases of hospitalization. Many current early warning systems provide a single, aggregate risk assessment, inadequately addressing the complexity of sepsis progression. Consequently, they often fail to account for potentially distinct underlying pathophysiological mechanisms and risk factors associated with sepsis onset at varying time points post-admission (e.g., community-acquired vs. hospital-acquired sepsis).</p>
<p>To overcome this limitation and enhance the clinical applicability of predictive alerts, this study employs a cohort stratification strategy based on the timing of sepsis diagnosis. Informed by clinically relevant intervention periods, the patient cohort was partitioned into three distinct and non-overlapping temporal groups according to the post-admission timeframe of sepsis confirmation: 7-day group, 14-day group, and 28-day group.</p>
<p>The stratification of the patient cohort is necessitated by the substantial clinical heterogeneity and temporal concept drift inherent in sepsis progression. Pathophysiological patterns evolve significantly during hospitalization. This evolution causes the characteristics of physiological data to shift. Consequently, training on a unified dataset would obscure these distinct signals and degrade model performance.</p>
<p>Sepsis onset within 0&#x02013;7 days is predominantly driven by acute inflammatory responses. This phase is characterized by early organ dysfunction and a relatively consistent clinical trajectory. These cases typically stem from community-acquired infections or immediate postoperative complications. Furthermore, standard clinical protocols often involve antibiotic de-escalation after 7 days. This necessitates a shift in therapeutic management. Beyond the first week, patients typically either recover or progress toward Persistent Critical Illness (PCI). This transition is marked by secondary infections and evolving immune dysfunction (<xref ref-type="bibr" rid="B48">48</xref>). Evidence suggests that this pathological shift can manifest as early as day 7 (<xref ref-type="bibr" rid="B49">49</xref>). The 7&#x02013;14 days window represents a peak period for iatrogenic infections (<xref ref-type="bibr" rid="B50">50</xref>). During this time, patients are susceptible to secondary complications such as ventilator-associated pneumonia (VAP), catheter-associated urinary tract infections (CAUTI), or central line-associated bloodstream infections (CLABSI). Conversely, late-onset sepsis is frequently characterized by the &#x0201C;Persistent Inflammation, Immunosuppression, and Catabolism Syndrome&#x0201D; (PICS). Research explicitly indicates that patients with ICU stays exceeding 14 days undergo a fundamental alteration in physiological mechanisms (<xref ref-type="bibr" rid="B51">51</xref>). Empirical studies by Zhang et al. demonstrate that the onset of PCI occurs, on average, 15 days following admission in the overall patient population (<xref ref-type="bibr" rid="B49">49</xref>). Finally, the 14&#x02013;28 days window aligns with standard definitions of long-term mortality and chronic critical illness utilized in Sepsis-3 guidelines and epidemiological research. This period reflects a distinct phenotype requiring prolonged intensive care (<xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B53">53</xref>).</p>
<p>Therefore, partitioning the dataset mitigates the noise arising from these heterogeneous states. This approach facilitates model learning. It also allows for a rigorous validation of the model&#x00027;s temporal stability and ensures generalization across distinct onset profiles. Consequently, this experimental design not only addresses concept drift but also validates the model&#x00027;s temporal robustness.</p>
<p>Data within each group are strictly segregated using timestamps, ensuring temporal data integrity and preventing information leakage from future events. This methodology facilitates a crucial paradigm shift&#x02014;moving from predicting if sepsis will occur to when it is likely to manifest within specific windows. Such temporal stratification enables models to capture potentially stage-specific risk patterns, thereby better supporting phase-specific clinical management strategies. Furthermore, it inherently prevents data leakage, aligning model development more closely with real-world clinical scenarios. By enabling differentiated prioritization of alerts based on the time window, this approach may help mitigate alarm fatigue and improve response efficiency. This structured framework also simplifies model development and evaluation, contributing toward the ultimate objective of achieving personalized and dynamic sepsis risk monitoring.</p>
</sec>
</sec>
<sec>
<label>2.3</label>
<title>Class imbalance handling</title>
<p>To address the class imbalance issue arising from the relatively small proportion of sepsis-positive samples, this study employed the Synthetic Minority Over-sampling Technique (SMOTE) for data augmentation. This algorithm generates synthetic samples through linear interpolation within the feature space of the minority class instances, as opposed to simple replication. This method effectively expands the number of positive cases to achieve parity with the negative cases, while concurrently mitigating the risk of training overfitting often associated with traditional random oversampling techniques.</p>
<sec>
<label>2.3.1</label>
<title>SMOTE procedure</title>
<p>For each minority (sepsis-positive) instance <italic>x</italic><sub><italic>i</italic></sub>, SMOTE first identifies its <italic>k</italic> nearest neighbors (here <italic>k</italic> = 8) among the other minority samples in the feature space. Then, a neighbor <italic>x</italic><sub><italic>nn</italic></sub> is randomly selected from these <italic>k</italic> neighbors, and a synthetic sample <italic>x</italic><sub><italic>new</italic></sub> is generated by linear interpolation between <italic>x</italic><sub><italic>i</italic></sub> and <italic>x</italic><sub><italic>nn</italic></sub>: <italic>xnew</italic> &#x0003D; <italic>xi</italic> &#x0002B; &#x003BB; (<italic>xnn</italic> &#x02212; <italic>xi</italic>), &#x003BB; &#x0007E; <italic>U</italic>(0, 1), where &#x003BB; is a random number drawn from a uniform distribution between 0 and 1. This procedure creates new minority-class samples that lie along the line segments connecting neighboring minority instances, instead of simply duplicating existing cases. Synthetic positive samples were generated until the number of sepsis-positive and sepsis-negative samples became approximately equal in the training set. SMOTE was applied only within the training folds during cross-validation, while the validation and test sets preserved the original class distribution to avoid information leakage.</p>
<p>The original and post-SMOTE class ratios for each outcome window were as follows <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Class distribution before and after SMOTE.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Group</bold></th>
<th valign="top" align="center"><bold>Imbalance rate</bold></th>
<th valign="top" align="center"><bold>After SMOTE</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">7-days</td>
<td valign="top" align="center">534:378</td>
<td valign="top" align="center">534:534</td>
</tr>
<tr>
<td valign="top" align="left">14-days</td>
<td valign="top" align="center">336:531</td>
<td valign="top" align="center">531:531</td>
</tr>
<tr>
<td valign="top" align="left">28-days</td>
<td valign="top" align="center">319:501</td>
<td valign="top" align="center">501:501</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec>
<label>2.4</label>
<title>Evaluation metrics</title>
<p>The model&#x00027;s performance was quantified through five established metrics, computed from the confusion matrix&#x02014;defined by its True Positive (TP), False Positive (FP), True Negative (TN), and False Negative (FN) counts. These metrics were: Area Under the Receiver Operating Characteristic Curve (AUC-ROC), Accuracy, Precision, Recall (Sensitivity), and F1-score.</p>
<sec>
<label>2.4.1</label>
<title>Recall/sensitivity</title>
<p>Recall (Sensitivity) quantifies the ability to identify actual septic cases, minimizing false negatives (FN).</p>
<disp-formula id="EQ8"><mml:math id="M12"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mtext class="textrm" mathvariant="normal">Recall</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(8)</label></disp-formula>
</sec>
<sec>
<label>2.4.2</label>
<title>Precision</title>
<p>Precision measures the proportion of positive predictions that are truly septic, minimizing false positives (FP) to avoid unnecessary interventions.</p>
<disp-formula id="EQ9"><mml:math id="M13"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mtext class="textrm" mathvariant="normal">Precision</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(9)</label></disp-formula>
</sec>
<sec>
<label>2.4.3</label>
<title>F1-score</title>
<p>The F1-score, the harmonic mean of Precision and Recall, provides a balanced assessment.</p>
<disp-formula id="EQ10"><mml:math id="M14"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mtext class="textrm" mathvariant="normal">-Score</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>2</mml:mn><mml:mo>&#x000D7;</mml:mo><mml:mtext class="textrm" mathvariant="normal">Recall</mml:mtext><mml:mo>&#x000D7;</mml:mo><mml:mtext class="textrm" mathvariant="normal">Precision</mml:mtext></mml:mrow><mml:mrow><mml:mtext class="textrm" mathvariant="normal">Recall &#x0002B; Precision</mml:mtext></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(10)</label></disp-formula>
</sec>
<sec>
<label>2.4.4</label>
<title>Accuracy</title>
<p>Accuracy reflects overall correct classifications but can be misleading on imbalanced data.</p>
<disp-formula id="EQ11"><mml:math id="M15"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mtext class="textrm" mathvariant="normal">Accuracy</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>T</mml:mi><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>F</mml:mi><mml:mi>N</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>T</mml:mi><mml:mi>P</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mi>T</mml:mi><mml:mi>N</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(11)</label></disp-formula>
</sec>
<sec>
<label>2.4.5</label>
<title>AUC-ROC</title>
<p>The AUC-ROC serves as a measure of the model&#x00027;s capacity to distinguish septic from non-septic instances over a range of classification thresholds; scores approaching 1 signify superior overall discriminatory power.</p>
</sec>
</sec>
<sec>
<label>2.5</label>
<title>K-fold cross-validation</title>
<p>To obtain a robust estimate of model generalization performance and mitigate overfitting, we employed stratified k-fold cross-validation (CV) with k = 10. This technique involves partitioning the dataset into k subsets (folds), iteratively training the model on k-1 folds, and validating the remaining fold. Stratification ensures that the original class distribution (particularly relevant given the sepsis class imbalance) is preserved within each fold. By averaging the performance across all k iterations, k-fold CV provides a less biased and lower-variance estimate of the model&#x00027;s predictive capability compared to a single train-test split, maximizing the utilization of available data.</p>
</sec>
</sec>
<sec id="s3">
<label>3</label>
<title>Evaluation schemes and results</title>
<sec>
<label>3.1</label>
<title>Multi-model comparison</title>
<p>To evaluate the efficacy of our proposed disease prediction model (hereafter referred to as &#x0201C;BOBM&#x0201D;), we conducted comprehensive multi-metric comparative experiments across three temporal windows against mainstream deep learning architectures (CNN, DNN, MLPClassifier and LSTM) and traditional machine learning algorithms (XGBoost, Random Forest, Logistic Regression, and SVC). Specifically, the MLPClassifier was introduced as a baseline to evaluate the performance of non-recurrent, non-convolutional neural networks. Comparing our model against the MLP allows us to validate the necessity of the temporal modeling mechanisms integrated into our proposed framework. <xref ref-type="table" rid="T2">Table 2</xref> presents the performance metrics, including Area Under the Curve (AUC), Accuracy, Precision, Recall, and F1-score, for all models evaluated.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Evaluation results clinical interpretation of key indicators.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Cohort</bold></th>
<th valign="top" align="left"><bold>Models</bold></th>
<th valign="top" align="center"><bold>AUC</bold></th>
<th valign="top" align="center"><bold>Accuracy</bold></th>
<th valign="top" align="center"><bold>Precision</bold></th>
<th valign="top" align="center"><bold>Recall</bold></th>
<th valign="top" align="center"><bold>F1-score</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" rowspan="10">7-day group</td>
<td valign="top" align="left"><bold>Our model (base model-Mamba)</bold></td>
<td valign="top" align="center"><bold>0.950</bold> &#x000B1; 0.039</td>
<td valign="top" align="center"><bold>0.945</bold> &#x000B1; 0.041</td>
<td valign="top" align="center"><bold>0.942</bold> &#x000B1; 0.033</td>
<td valign="top" align="center"><bold>0.940</bold> &#x000B1; 0.031</td>
<td valign="top" align="center"><bold>0.938</bold> &#x000B1; 0.007</td>
</tr>
 <tr>
<td valign="top" align="left"><bold>Our model (base model-Mamba2)</bold></td>
<td valign="top" align="center">0.940 &#x000B1; 0.037</td>
<td valign="top" align="center">0.901 &#x000B1; 0.018</td>
<td valign="top" align="center">0.912 &#x000B1; 0.025</td>
<td valign="top" align="center">0.881 &#x000B1; 0.038</td>
<td valign="top" align="center">0.913 &#x000B1; 0.018</td>
</tr>
 <tr>
<td valign="top" align="left">CNN</td>
<td valign="top" align="center">0.880 &#x000B1; 0.007</td>
<td valign="top" align="center">0.875 &#x000B1; 0.028</td>
<td valign="top" align="center">0.858 &#x000B1; 0.021</td>
<td valign="top" align="center">0.862 &#x000B1; 0.041</td>
<td valign="top" align="center">0.860 &#x000B1; 0.049</td>
</tr>
 <tr>
<td valign="top" align="left">DNN</td>
<td valign="top" align="center">0.860 &#x000B1; 0.014</td>
<td valign="top" align="center">0.870 &#x000B1; 0.010</td>
<td valign="top" align="center">0.865 &#x000B1; 0.001</td>
<td valign="top" align="center">0.878 &#x000B1; 0.050</td>
<td valign="top" align="center">0.869 &#x000B1; 0.011</td>
</tr>
 <tr>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="center">0.850 &#x000B1; 0.016</td>
<td valign="top" align="center">0.863 &#x000B1; 0.002</td>
<td valign="top" align="center">0.861 &#x000B1; 0.045</td>
<td valign="top" align="center">0.868 &#x000B1; 0.037</td>
<td valign="top" align="center">0.859 &#x000B1; 0.012</td>
</tr>
 <tr>
<td valign="top" align="left">XGBClassifier</td>
<td valign="top" align="center">0.900 &#x000B1; 0.032</td>
<td valign="top" align="center">0.835 &#x000B1; 0.006</td>
<td valign="top" align="center">0.832 &#x000B1; 0.027</td>
<td valign="top" align="center">0.830 &#x000B1; 0.035</td>
<td valign="top" align="center">0.831 &#x000B1; 0.006</td>
</tr>
 <tr>
<td valign="top" align="left">RandomForestClassifier</td>
<td valign="top" align="center">0.820 &#x000B1; 0.038</td>
<td valign="top" align="center">0.750 &#x000B1; 0.019</td>
<td valign="top" align="center">0.752 &#x000B1; 0.038</td>
<td valign="top" align="center">0.750 &#x000B1; 0.020</td>
<td valign="top" align="center">0.749 &#x000B1; 0.021</td>
</tr>
 <tr>
<td valign="top" align="left">MLPClassifier</td>
<td valign="top" align="center">0.730 &#x000B1; 0.027</td>
<td valign="top" align="center">0.670 &#x000B1; 0.006</td>
<td valign="top" align="center">0.671 &#x000B1; 0.007</td>
<td valign="top" align="center">0.670 &#x000B1; 0.043</td>
<td valign="top" align="center">0.669 &#x000B1; 0.044</td>
</tr>
 <tr>
<td valign="top" align="left">LogisticRegression</td>
<td valign="top" align="center">0.720 &#x000B1; 0.027</td>
<td valign="top" align="center">0.685 &#x000B1; 0.017</td>
<td valign="top" align="center">0.684 &#x000B1; 0.011</td>
<td valign="top" align="center">0.684 &#x000B1; 0.038</td>
<td valign="top" align="center">0.685 &#x000B1; 0.040</td>
</tr>
 <tr>
<td valign="top" align="left">SVC</td>
<td valign="top" align="center">0.780 &#x000B1; 0.010</td>
<td valign="top" align="center">0.700 &#x000B1; 0.020</td>
<td valign="top" align="center">0.701 &#x000B1; 0.039</td>
<td valign="top" align="center">0.700 &#x000B1; 0.028</td>
<td valign="top" align="center">0.699 &#x000B1; 0.015</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="10">14-day group</td>
<td valign="top" align="left"><bold>Our model (base model-Mamba)</bold></td>
<td valign="top" align="center"><bold>0.860</bold> &#x000B1; 0.032</td>
<td valign="top" align="center"><bold>0.850</bold> &#x000B1; 0.014</td>
<td valign="top" align="center"><bold>0.855</bold> &#x000B1; 0.022</td>
<td valign="top" align="center"><bold>0.838</bold> &#x000B1; 0.019</td>
<td valign="top" align="center"><bold>0.825</bold> &#x000B1; 0.007</td>
</tr>
 <tr>
<td valign="top" align="left"><bold>Our model (base model-Mamba2)</bold></td>
<td valign="top" align="center">0.845 &#x000B1; 0.039</td>
<td valign="top" align="center">0.830 &#x000B1; 0.042</td>
<td valign="top" align="center">0.843 &#x000B1; 0.010</td>
<td valign="top" align="center">0.827 &#x000B1; 0.039</td>
<td valign="top" align="center">0.799 &#x000B1; 0.026</td>
</tr>
 <tr>
<td valign="top" align="left">CNN</td>
<td valign="top" align="center">0.820 &#x000B1; 0.018</td>
<td valign="top" align="center">0.830 &#x000B1; 0.040</td>
<td valign="top" align="center">0.825 &#x000B1; 0.044</td>
<td valign="top" align="center">0.812 &#x000B1; 0.045</td>
<td valign="top" align="center">0.815 &#x000B1; 0.016</td>
</tr>
 <tr>
<td valign="top" align="left">DNN</td>
<td valign="top" align="center">0.830 &#x000B1; 0.009</td>
<td valign="top" align="center">0.840 &#x000B1; 0.008</td>
<td valign="top" align="center">0.845 &#x000B1; 0.012</td>
<td valign="top" align="center">0.832 &#x000B1; 0.006</td>
<td valign="top" align="center">0.825 &#x000B1; 0.035</td>
</tr>
 <tr>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="center">0.790 &#x000B1; 0.040</td>
<td valign="top" align="center">0.810 &#x000B1; 0.001</td>
<td valign="top" align="center">0.808 &#x000B1; 0.016</td>
<td valign="top" align="center">0.795 &#x000B1; 0.022</td>
<td valign="top" align="center">0.780 &#x000B1; 0.032</td>
</tr>
 <tr>
<td valign="top" align="left">XGBClassifier</td>
<td valign="top" align="center">0.800 &#x000B1; 0.044</td>
<td valign="top" align="center">0.730 &#x000B1; 0.009</td>
<td valign="top" align="center">0.730 &#x000B1; 0.028</td>
<td valign="top" align="center">0.730 &#x000B1; 0.025</td>
<td valign="top" align="center">0.730 &#x000B1; 0.012</td>
</tr>
 <tr>
<td valign="top" align="left">RandomForestClassifier</td>
<td valign="top" align="center">0.760 &#x000B1; 0.040</td>
<td valign="top" align="center">0.690 &#x000B1; 0.024</td>
<td valign="top" align="center">0.690 &#x000B1; 0.020</td>
<td valign="top" align="center">0.690 &#x000B1; 0.007</td>
<td valign="top" align="center">0.690 &#x000B1; 0.009</td>
</tr>
 <tr>
<td valign="top" align="left">MLPClassifier</td>
<td valign="top" align="center">0.730 &#x000B1; 0.031</td>
<td valign="top" align="center">0.670 &#x000B1; 0.005</td>
<td valign="top" align="center">0.672 &#x000B1; 0.039</td>
<td valign="top" align="center">0.670 &#x000B1; 0.034</td>
<td valign="top" align="center">0.669 &#x000B1; 0.015</td>
</tr>
 <tr>
<td valign="top" align="left">LogisticRegression</td>
<td valign="top" align="center">0.720 &#x000B1; 0.010</td>
<td valign="top" align="center">0.685 &#x000B1; 0.006</td>
<td valign="top" align="center">0.685 &#x000B1; 0.042</td>
<td valign="top" align="center">0.685 &#x000B1; 0.018</td>
<td valign="top" align="center">0.685 &#x000B1; 0.020</td>
</tr>
 <tr>
<td valign="top" align="left">SVC</td>
<td valign="top" align="center">0.740 &#x000B1; 0.042</td>
<td valign="top" align="center">0.680 &#x000B1; 0.014</td>
<td valign="top" align="center">0.680 &#x000B1; 0.040</td>
<td valign="top" align="center">0.680 &#x000B1; 0.039</td>
<td valign="top" align="center">0.680 &#x000B1; 0.038</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="10">28-day group</td>
<td valign="top" align="left"><bold>Our model (base model-Mamba)</bold></td>
<td valign="top" align="center"><bold>0.910</bold> &#x000B1; 0.008</td>
<td valign="top" align="center"><bold>0.920</bold> &#x000B1; 0.009</td>
<td valign="top" align="center">0.915 &#x000B1; 0.018</td>
<td valign="top" align="center">0.908 &#x000B1; 0.004</td>
<td valign="top" align="center"><bold>0.905</bold> &#x000B1; 0.045</td>
</tr>
 <tr>
<td valign="top" align="left"><bold>Our model (base model-Mamba2)</bold></td>
<td valign="top" align="center">0.900 &#x000B1; 0.030</td>
<td valign="top" align="center">0.892 &#x000B1; 0.036</td>
<td valign="top" align="center">0.930 &#x000B1; 0.026</td>
<td valign="top" align="center">0.910 &#x000B1; 0.009</td>
<td valign="top" align="center">0.863 &#x000B1; 0.020</td>
</tr>
 <tr>
<td valign="top" align="left">CNN</td>
<td valign="top" align="center">0.860 &#x000B1; 0.044</td>
<td valign="top" align="center">0.880 &#x000B1; 0.032</td>
<td valign="top" align="center">0.875 &#x000B1; 0.030</td>
<td valign="top" align="center">0.845 &#x000B1; 0.039</td>
<td valign="top" align="center">0.846 &#x000B1; 0.046</td>
</tr>
 <tr>
<td valign="top" align="left">DNN</td>
<td valign="top" align="center">0.850 &#x000B1; 0.020</td>
<td valign="top" align="center">0.870 &#x000B1; 0.011</td>
<td valign="top" align="center">0.865 &#x000B1; 0.014</td>
<td valign="top" align="center">0.850 &#x000B1; 0.031</td>
<td valign="top" align="center">0.848 &#x000B1; 0.047</td>
</tr>
 <tr>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="center">0.870 &#x000B1; 0.029</td>
<td valign="top" align="center">0.875 &#x000B1; 0.017</td>
<td valign="top" align="center">0.880 &#x000B1; 0.049</td>
<td valign="top" align="center">0.878 &#x000B1; 0.048</td>
<td valign="top" align="center">0.870 &#x000B1; 0.019</td>
</tr>
 <tr>
<td valign="top" align="left">XGBClassifier</td>
<td valign="top" align="center">0.850 &#x000B1; 0.002</td>
<td valign="top" align="center">0.780 &#x000B1; 0.037</td>
<td valign="top" align="center">0.778 &#x000B1; 0.009</td>
<td valign="top" align="center">0.778 &#x000B1; 0.037</td>
<td valign="top" align="center">0.778 &#x000B1; 0.042</td>
</tr>
 <tr>
<td valign="top" align="left">RandomForestClassifier</td>
<td valign="top" align="center">0.810 &#x000B1; 0.002</td>
<td valign="top" align="center">0.740 &#x000B1; 0.045</td>
<td valign="top" align="center">0.738 &#x000B1; 0.044</td>
<td valign="top" align="center">0.738 &#x000B1; 0.014</td>
<td valign="top" align="center">0.740 &#x000B1; 0.034</td>
</tr>
 <tr>
<td valign="top" align="left">MLPClassifier</td>
<td valign="top" align="center">0.770 &#x000B1; 0.021</td>
<td valign="top" align="center">0.720 &#x000B1; 0.014</td>
<td valign="top" align="center">0.718 &#x000B1; 0.025</td>
<td valign="top" align="center">0.718 &#x000B1; 0.031</td>
<td valign="top" align="center">0.718 &#x000B1; 0.018</td>
</tr>
 <tr>
<td valign="top" align="left">LogisticRegression</td>
<td valign="top" align="center">0.760 &#x000B1; 0.005</td>
<td valign="top" align="center">0.710 &#x000B1; 0.039</td>
<td valign="top" align="center">0.708 &#x000B1; 0.025</td>
<td valign="top" align="center">0.710 &#x000B1; 0.016</td>
<td valign="top" align="center">0.708 &#x000B1; 0.002</td>
</tr>
<tr>
<td valign="top" align="left">SVC</td>
<td valign="top" align="center">0.780 &#x000B1; 0.048</td>
<td valign="top" align="center">0.705 &#x000B1; 0.044</td>
<td valign="top" align="center">0.705 &#x000B1; 0.043</td>
<td valign="top" align="center">0.705 &#x000B1; 0.034</td>
<td valign="top" align="center">0.704 &#x000B1; 0.018</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>Bold values indicate the best performance achieved in each metric column.</p>
</table-wrap-foot>
</table-wrap>
<p>Considering the rapid development of state-space models, we additionally evaluated a variant of BOBM in which the original Mamba backbone was replaced by the recently released Mamba-2 architecture (BOBM-Mamba2). As reported in <xref ref-type="table" rid="T2">Table 2</xref>, BOBM with the original Mamba backbone achieved slightly better performance in the 7-day prediction cohort than the BOBM-Mamba 2 variant. These results suggest that, for our dataset size and clinical temporal resolution, the original Mamba Tab configuration remains better aligned with the characteristics of the sepsis prediction task than Mamba-2.</p>
<p>All deep learning models demonstrated robust clinical predictive performance across the three temporal prediction windows, with the 7-day prediction cohort exhibiting superior overall performance. As illustrated in <xref ref-type="table" rid="T2">Table 2</xref>, our model achieved clinical decision support standards in the 7-day cohort with key performance indicators, while its Accuracy, Precision, and Recall all exceeded the 94% threshold, and significantly outperforming traditional machine learning models, the MLP baseline, and the Mamba-2 variant.</p>
<sec>
<label>3.1.1</label>
<title>Short-term prediction performance (7-day cohort)</title>
<p>In the 7-day prediction task, our proposed model demonstrated significant superiority with an AUC of 0.950 &#x000B1; 0.039, representing a 5.56% improvement over the best-performing baseline model (XGBoost: 0.900 &#x000B1; 0.032). Moreover, our model achieved superior performance metrics including Accuracy (0.945 &#x000B1; 0.041), Precision (0.942 &#x000B1; 0.033), Recall (0.940 &#x000B1; 0.031), and F1-score (0.938 &#x000B1; 0.007), all exceeding those of the baseline models. Notably, traditional machine learning algorithms (e.g., Random Forest and Logistic Regression) exhibited suboptimal performance in this task (AUC &#x0003C; 0.82), indicating that deep learning methodologies possess distinct advantages in capturing short-term disease risk features.</p>
</sec>
<sec>
<label>3.1.2</label>
<title>Mid-term prediction performance (14-day cohort)</title>
<p>As the prediction horizon extended to 14 days, a general decline in performance was observed across all models, potentially reflecting the increasingly complex non-linear dynamics of sepsis progression over this timeframe. Nevertheless, our model maintained the highest AUC (0.860 &#x000B1; 0.032) and F1-score (0.825 &#x000B1; 0.007), with a recall rate (0.838 &#x000B1; 0.019) marginally outperforming the second-best model (DNN: 0.832 &#x000B1; 0.006) by 0.6%, demonstrating the model&#x00027;s sustained capability to effectively identify at-risk individuals in mid-term predictions. Comparative analysis revealed that the LSTM model underperformed with an AUC of 0.790 &#x000B1; 0.040 in this cohort, falling below CNN and DNN, possibly due to the heightened requirements for sequential modeling capabilities imposed by the complexity of mid-term temporal dependencies.</p>
</sec>
<sec>
<label>3.1.3</label>
<title>Long-term prediction performance (28-day cohort)</title>
<p>In the 28-day prediction task, our model&#x00027;s AUC rebounded to 0.910 &#x000B1; 0.008, significantly surpassing all comparison models (with the best-performing baseline LSTM at 0.870 &#x000B1; 0.029), demonstrating its robust capacity to capture long-term risk trajectories. Specifically, the model achieved a precision of 0.915 &#x000B1; 0.018 while maintaining a high recall, indicating its ability to simultaneously minimize missed diagnosis risk and control false-positive rates. Notably, XGBoost demonstrated an improvement in this task with an AUC of 0.850 &#x000B1; 0.002, representing a 6.25% increase compared to the 14-day cohort; this suggests that gradient boosting tree algorithms possess certain capabilities in capturing long-term feature patterns, though they still exhibit a substantial performance gap compared to our proposed model (&#x00394;AUC = 0.06).</p>
</sec>
<sec>
<label>3.1.4</label>
<title>Cross-temporal stability analysis</title>
<p>Comparative analysis across different prediction windows indicates that our proposed model consistently demonstrates robust performance, maintaining an AUC between 0.860 &#x000B1; 0.032 and 0.950 &#x000B1; 0.039. Notably, the model&#x00027;s F1-score in the 28-day group approaches that of the 7-day group, validating its capacity to effectively model the long-term dynamic characteristics of disease progression. Furthermore, the performance nadir observed across all models in the 14-day group may be attributed to the increased confounding factors (such as therapeutic interventions and disease trajectory inflection points) within this time window, warranting further investigation in subsequent studies.</p>
<p>In the context of early sepsis prediction, precision reflects the model&#x00027;s capacity to optimize medical resource allocation (proportion of correctly predicted positive cases). Our model achieved a precision of 0.942 &#x000B1; 0.033 in the 7-day group, indicating only 6 false positives per 100 positive predictions, representing a 78% reduction in overtreatment risk compared to Random Forest models (precision: 0.752 &#x000B1; 0.038). As a direct measurement of missed diagnosis risk, our model demonstrated a sensitivity (recall) of 0.940 &#x000B1; 0.031, exhibiting a 25.3% improvement in case detection capability compared to conventional clinical screening tools (average recall &#x0007E;0.75). This enhancement holds substantial clinical value by potentially reducing delays in diagnosis and mitigating the associated risk of septic shock progression in ICU patients.</p>
<p>The F1-score, the harmonic mean of precision and recall, reached 0.938 &#x000B1; 0.007, indicating our model&#x00027;s effective balance between minimizing false positives and false negatives. Furthermore, the model maintained a high F1-score of 0.905 in the 28-day group, underscoring its stability for long-term risk prediction. By contrast, while LSTM models perform well on temporal sequence modeling, their corresponding 28-day F1-score was lower than our model&#x00027;s, potentially attributable to limitations in their feature representation capabilities.</p>
</sec>
<sec>
<label>3.1.5</label>
<title>ROC curve analysis</title>
<p>The AUC metric plays a crucial role in medical research as it provides clinically meaningful interpretation of disease classification among healthy subjects. Experimental results demonstrate that our proposed model exhibits superior and consistent classification performance across various prediction time windows (<xref ref-type="fig" rid="F4">Figure 4</xref>).</p>
<fig position="float" id="F4">
<label>Figure 4</label>
<caption><p>The receiver operating characteristic (ROC) curves of our model, the CNN, DNN, LSTM, XGBClassifier, RandomForestClassifier, MLPClassifier, LogisticRegression, and SVC models. The ROC curves, from left to right, illustrate the performance of early prediction algorithms using independent sample cohorts at 7, 14, and 28 days prior to sepsis onset.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1731854-g0004.tif">
<alt-text content-type="machine-generated">Three ROC curve charts compare different models&#x00027; performance across 7-day, 14-day, and 28-day groups. The x-axis represents the false positive rate, and the y-axis the true positive rate. Each chart includes multiple curves for various models like CNN, DNN, and others, with AUC scores indicated in legends. Scores range from 0.70 to 0.95, demonstrating model accuracy. The first chart shows the highest AUC for &#x0201C;Our Model&#x0201D; at 0.95, while in the other two charts, AUC values for &#x0201C;Our Model&#x0201D; slightly decrease to 0.86 and 0.91.</alt-text>
</graphic>
</fig>
<p>In the 7-day short-term prediction task, our model achieved an AUC of 0.95, significantly outperforming traditional machine learning models and baseline deep learning models. Notably, at a clinically relevant high-specificity threshold, the model&#x00027;s true positive rate demonstrated a relative improvement of 23.6% over the next-best model, CNN.</p>
<p>As the prediction time window extends to 14 days, despite the increased predictive complexity, our model maintains a high AUC value (0.88), consistently outperforming alternative algorithms. Under the 28-day long-term prediction window, the model exhibits robust stability with an AUC of 0.91, whereas other methods such as CNN (0.86) and DNN (0.85) demonstrate comparatively inferior performance.</p>
<p>Importantly, across all time windows, traditional machine learning methods such as RandomForestClassifier and LogisticRegression consistently underperform compared to deep learning approaches, confirming the superiority of deep learning architectures in capturing complex temporal features within sepsis clinical data. Furthermore, the relatively minor performance fluctuation observed as prediction time windows extend indicates the temporal robustness of our approach, providing reliable decision support for early intervention in clinical practice. This characteristic enables our model to maintain high sensitivity while reducing long-term misdiagnosis risk, fulfilling the requirements for clinical dynamic monitoring.</p>
</sec>
</sec>
<sec>
<label>3.2</label>
<title>Explainability analysis</title>
<p>The SHAP methodology, based on Shapley values from game theory, quantifies each feature&#x00027;s contribution to individual predictions, providing verifiable interpretations for deep learning models. This approach demonstrates strong alignment between influential features and clinical guidelines, enhancing model decision transparency and assisting clinicians in rapidly validating the medical rationale while optimizing individualized treatment strategies. SHAP values reflect the statistical associations between features and prediction outcomes, enabling clinicians to incorporate both direct causal effects and proxy variable effects during decision-making processes.</p>
<p>The overall feature importance ranking and summary plot (<xref ref-type="fig" rid="F5">Figure 5</xref>) clearly illustrate the global contribution and distribution of features across the dataset. Across all three prediction horizons, platelet_min (minimum platelet count) and creatinine_max (maximum creatinine level) consistently ranked as the most important features, exerting the most significant influence on the model&#x00027;s predictions. This indicates that the model effectively learned to prioritize variables critically for assessing renal and coagulation function, aligning with their fundamental roles in sepsis pathophysiology. At a more granular level, <xref ref-type="fig" rid="F6">Figure 6</xref> presents SHAP value distributions for each time window, detailing how variations in individual feature measurements impact the prediction score. Generally, lower platelet_min values and higher creatinine_max values increased the prediction score, thereby driving positive predictions (i.e., sepsis alerts). The high importance attributed to mbp_mean (mean arterial pressure) is consistent with clinical logic, as low MAP (&#x0003C; 65 mmHg) suggests shock and is associated with increased mortality risk.</p>
<fig position="float" id="F5">
<label>Figure 5</label>
<caption><p>SHAP summary plot for the top 20 clinical features contributing to the model. <bold>(A&#x02013;C)</bold>, respectively, represent independent cohorts sampled 7, 14, and 28 days prior to the onset of sepsis. Key predictive features influencing the model&#x00027;s output for each cohort were identified using SHAP value analysis.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1731854-g0005.tif">
<alt-text content-type="machine-generated">Three bar charts labeled A, B, and C show factors impacting model outputs using SHAP values. Chart A highlights creatinine_max and platelet_min as having the greatest impact. Chart B shows creatinine_max and platelet_min as the influential factors. Chart C features platelet_min and creatinine_max as the most significant. Bars represent mean SHAP values, indicating average impact magnitude.</alt-text>
</graphic>
</fig>
<fig position="float" id="F6">
<label>Figure 6</label>
<caption><p>Beeswarm plots. <bold>(A&#x02013;C)</bold> Present SHAP beeswarm plots for independent patient cohorts stratified by pre-onset intervals (7-, 14-, and 28-day groups). Within these plots, features are ranked in descending order of importance from top to bottom; the color of each point signifies the Feature value (red: high, blue: low), and the x-axis denotes the SHAP value. Negative SHapley values indicate that a given feature contributes to a lower predicted risk score, while positive Shapley values indicate a contribution to higher predicted risk.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1731854-g0006.tif">
<alt-text content-type="machine-generated">Three plots labeled A, B, and C display SHAP values indicating feature impacts on model outputs. Each plot lists various medical metrics, such as creatinine, platelet counts, and temperature, with features colored from blue to pink, representing low to high values. The x-axis shows SHAP values ranging from negative to positive, illustrating the effect size.</alt-text>
</graphic>
</fig>
<p>Minimum glucose level demonstrated moderate importance (<xref ref-type="fig" rid="F5">Figure 5</xref>), corroborating findings from related studies (<xref ref-type="bibr" rid="B54">54</xref>) that link hypoglycemia to potential sepsis presence. Although features like temperature_mean and hemoglobin_min had lower overall importance rankings, they still contributed to the model&#x00027;s predictions, reflecting the known association between factors like hemoglobin levels and sepsis risk. The collective influence of these features underpins the model&#x00027;s ability to predict sepsis onset.</p>
<p>The sepsis prediction model exhibits dynamic feature importance across different time windows, reflecting the model&#x00027;s sensitivity to disease progression. In the 7-day window (<xref ref-type="fig" rid="F6">Figure 6A</xref>), maximum respiratory rate is associated with acute respiratory compensation, consistent with its role as an early warning indicator. Furthermore, SHAP contributions of features reflecting acid-base balance (e.g., anion gap, bicarbonate) and coagulation (International Normalized Ratio, INR) are significantly higher within this initial window compared to those in the 14- and 28-day horizons. This finding aligns with the acute physiological disturbances characteristic of early sepsis and underscores the model&#x00027;s ability to detect risks associated with acid-base imbalances.</p>
<p>Transitioning to the 14-day window (<xref ref-type="fig" rid="F6">Figure 6B</xref>), features representing platelet count extremes exhibit markedly higher importance compared to the 7-day window. Similarly, the importance of minimum glucose level increases. As the time window extends to 14 days, the contribution of mean arterial pressure rises significantly. Beyond 14 days (<xref ref-type="fig" rid="F6">Figure 6C</xref>), the relative importance of predictors appears more stable, although fluctuations in platelet count extremes remain highly correlated with sepsis progression, potentially suggesting significant platelet activation or pro-inflammatory states. This sensitivity to both high and low platelet extremes may offer greater diagnostic utility than traditional single-threshold monitoring. Notably, mean oxygen saturation shows significantly increased importance in the 28-day window, indicating that oxygenation status becomes a more critical predictive factor in long-term prediction. The 28-day feature importance distribution becomes more dispersed, suggesting that long-term prediction necessitates considering additional factors such as cumulative organ damage, altered immunometabolism, and iatrogenic risks. Despite this dispersion, indicators of renal function and hematological parameters remain crucial.</p>
<sec>
<label>3.2.1</label>
<title>Nonlinear interaction analysis</title>
<p>SHAP dependence plot (<xref ref-type="fig" rid="F7">Figure 7</xref>) illustrating how a primary feature&#x00027;s value influences its contribution to the model&#x00027;s prediction.</p>
<fig position="float" id="F7">
<label>Figure 7</label>
<caption><p>SHAP dependency plots for representative clinical features contributing to the model: maximum creatinine, minimum mean arterial pressure, and minimum platelet count. The panels display the impact of three key predictors: <bold>(A)</bold> Maximum creatinine, <bold>(B)</bold> Minimum mean arterial pressure, and <bold>(C)</bold> Minimum platelet count. Each point represents an individual sample. SHAP values greater than zero indicate an increased predicted risk of sepsis associated with the corresponding feature value. Point color, determined by the secondary (interaction) feature in each panel, visualizes interaction effects, showing how the secondary feature modulates the primary feature&#x00027;s contribution to the prediction.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-12-1731854-g0007.tif">
<alt-text content-type="machine-generated">Three scatter plots labeled A, B, and C. Plot A shows SHAP values for creatinine_max against creatinine_max, with data points colored by platelet_min values. Plot B displays SHAP values for mbp_min against mbp_min, also colored by platelet_min. Plot C depicts SHAP values for platelet_min against platelet_min, with colors indicating platelet_max. Data points range from blue to pink, showing varying platelet levels.</alt-text>
</graphic>
</fig>
<sec>
<label>3.2.1.1</label>
<title>Dual risk correlation</title>
<p><xref ref-type="fig" rid="F7">Figure 7A</xref> depicts the interaction between maximum creatinine and minimum platelet count in predicting sepsis risk. Maximum creatinine consistently ranks among the most influential predictors, potentially complementing other features for enhanced risk stratification. creatinine_max exhibits a strong positive correlation with SHAP values, indicating that higher levels consistently increase the predicted risk score, potentially reflecting early clinical manifestations of acute kidney injury (AKI).</p>
<p>When creatinine_max falls below a certain threshold, platelet count shows a significant negative correlation with SHAP values; specifically, lower platelet_min values (blue points) are associated with higher SHAP values (higher predicted risk). This observation aligns with a potential mechanism of concurrent platelet consumption and acute kidney injury during sepsis progression.</p>
<p>Conversely, in the higher creatinine range, a contrasting positive correlation is observed: some instances with high creatinine_max and concurrently elevated platelet_min are also associated with positive SHAP values, increasing the predicted risk. This complex pattern may reflect distinct underlying pathological states.</p>
</sec>
<sec>
<label>3.2.1.2</label>
<title>Regulatory role of platelet count</title>
<p>Low mean arterial pressure (MAP) values (&#x0003C; 60 mmHg) were observed to correspond with high SHapley values, indicating their positive contribution to the model&#x00027;s prediction of sepsis risk. This finding aligns with the clinical understanding (<xref ref-type="bibr" rid="B55">55</xref>) of septic shock, where low MAP is recognized as a key indicator of adverse outcomes.</p>
<p><xref ref-type="fig" rid="F7">Figure 7B</xref> illustrates the interaction effect between minimum mean arterial pressure and minimum platelet count on model predictions. Specifically, when mbp_min decreases to values below 40 mmHg, SHAP values become predominantly positive, indicating that severe hypotensive states are associated with an elevated risk of adverse outcomes. This observation aligns with established clinical knowledge that sustained hypotension results in inadequate tissue perfusion. Interestingly, in the presence of relatively higher platelet_min values when mbp_min is low, these positive SHAP values become even larger, signifying an amplified predicted sepsis risk. Conversely, at higher mbp_min levels, SHAP values tend to become negative, suggesting these higher MAP values are associated with a lower predicted sepsis risk by the model.</p>
<p>The interaction between minimum platelet count and minimum mean arterial pressure exhibits a complex, non-monotonic relationship with the predicted sepsis risk. In the intermediate ranges, SHAP values exhibit significant fluctuations, with certain intervals showing positive values (indicating elevated risk) and others displaying negative values (suggesting risk reduction). In higher mbp_min ranges, elevated platelet_min values attenuate the predictive tendency of mbp_min toward sepsis risk, whereas, in lower mbp_min ranges, high platelet counts paradoxically intensify the predicted sepsis risk propensity as mbp_min decreases.</p>
</sec>
<sec>
<label>3.2.1.3</label>
<title>Platelet dynamic trajectory analysis</title>
<p><xref ref-type="fig" rid="F7">Figure 7C</xref> illustrates the combined influence of the minimum platelet count and the maximum platelet count on the predicted sepsis risk, as quantified by SHAP values. When platelet_min falls below 100 &#x000D7; 10<sup>9</sup>/L (represented on the left portion of the x-axis), the corresponding SHAP values are positive and become increasingly positive as the count decreases further. This finding strongly aligns with the International Society on Thrombosis and Haemostasis (ISTH) diagnostic criteria for disseminated intravascular coagulation (DIC), which utilizes a platelet threshold of &#x0003C; 100 &#x000D7; 10<sup>9</sup>/L. Conversely, when the minimum platelet count is relatively high, the SHAP values tend to be slightly negative, indicating a modestly reduced predicted sepsis risk associated with higher baseline platelet levels.</p>
<p>Interestingly, a key observation arises in the low platelet_min range. SHAP values remain significantly positive (indicating high predicted risk) even when the corresponding maximum platelet count during the observation period was relatively high. This indicates that a significant reduction in platelets, resulting in a low platelet_min, serves as a critical indicator of increased sepsis risk, potentially offering greater predictive utility than the peak platelet count. Therefore, the dynamic variation in platelet count, reflected by the interplay between platelet_min and platelet_max, appears to capture predictive information beyond that available from static measurements alone.</p>
</sec>
</sec>
</sec>
<sec>
<label>3.3</label>
<title>Cross-dataset performance evaluation</title>
<p>Evaluating prediction models solely on a single dataset may constrain the assessment of their real-world applicability due to potential dataset-specific biases or overfitting. Multi-center data validation can mitigate performance degradation stemming from geographical or equipment variations; therefore, we evaluated our model on two additional datasets.</p>
<p>The datasets used for external validation were the eICU (<xref ref-type="bibr" rid="B56">56</xref>) Collaborative Research Database (eICU-CRD) and the Critical Care Database for Infected Patients from Zigong Fourth People&#x00027;s Hospital (<xref ref-type="bibr" rid="B57">57</xref>). The eICU-CRD, a multi-center intensive care unit (ICU) database developed by the Massachusetts Institute of Technology (MIT) in collaboration with Philips Healthcare, is designed to facilitate critical care research and computational algorithm development. It encompasses ICU patient data from over 200 hospitals across the United States, comprising approximately 200,000 ICU admission records from 2014 to 2015 across diverse ICU types. With its large scale and broad geographical representation, the database serves as a valuable complementary resource to other critical care databases like MIMIC.</p>
<p>The second dataset is the Critical care database comprising patients with infection at Zigong Fourth People&#x00027;s Hospital (v1.1) (<xref ref-type="bibr" rid="B57">57</xref>) (hereafter, &#x0201C;<italic>Zigong</italic>&#x0201D; dataset), reportedly the first publicly available multi-source clinical database focusing on adult ICU patients with infections in China. It was developed through collaboration between the Zigong Fourth People&#x00027;s Hospital in Sichuan province and multiple research institutions. This database includes data from infected patients admitted to the hospital&#x00027;s ICU between 2019 and 2020. The database features comprehensive data integration and incorporates specialized procedures for keyword extraction and cleaning of clinical notes originally recorded in Chinese. This resource addresses a significant gap in publicly available Asian critical care infection data, thereby contributing to global critical care research and facilitating the adaptation and validation of AI-based medical tools for diverse populations.</p>
<p>The researchers obtained approval from the relevant institutional review board (IRB) and were granted permission to access and utilize the database for data extraction and analysis in accordance with established protocols. As detailed in <xref ref-type="table" rid="T3">Table 3</xref>, our proposed model demonstrated robust generalization capabilities when evaluated on two independent and heterogeneous clinical datasets (<xref ref-type="bibr" rid="B58">58</xref>): the <italic>Zigong</italic> dataset and the eICU database. It achieved Area Under the Receiver Operating Characteristic Curve (AUC) values of 0.978 &#x000B1; 0.074 and 0.982 &#x000B1; 0.090 on the <italic>Zigong</italic> and eICU datasets, respectively. This performance significantly surpasses that of the benchmark traditional machine learning and deep learning models, exceeding the highest performing baseline (RandomForest-Classifier on eICU) by 3.6% points and the lowest (LogisticRegression on <italic>Zigong</italic>) by 8.6% points. Notably, the model maintained a strong balance between precision and recall, achieving F1-scores of 0.946 &#x000B1; 0.078 on the <italic>Zigong</italic> dataset and 0.951 on the eICU dataset. Compared to XGBoost, this represents an improvement of 3.4% points on <italic>Zigong</italic> and 2.7% points on eICU. Against LSTM, the improvements were 7.1% points on <italic>Zigong</italic> Data and 6.4% points on eICU. This consistent performance across diverse datasets underscores the model&#x00027;s robustness and generalizability to variations in data collection protocols and clinical environments.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Comparison results of the performance of the model with different models in other clinical data.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Dataset</bold></th>
<th valign="top" align="left"><bold>Models</bold></th>
<th valign="top" align="center"><bold>AUC</bold></th>
<th valign="top" align="center"><bold>Accuracy</bold></th>
<th valign="top" align="center"><bold>Precision</bold></th>
<th valign="top" align="center"><bold>Recall</bold></th>
<th valign="top" align="center"><bold>F1-score</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" rowspan="9">Zigong</td>
<td valign="top" align="left">Our model</td>
<td valign="top" align="center">0.978 &#x000B1; 0.074</td>
<td valign="top" align="center">0.945 &#x000B1; 0.047</td>
<td valign="top" align="center">0.952 &#x000B1; 0.023</td>
<td valign="top" align="center">0.940 &#x000B1; 0.042</td>
<td valign="top" align="center">0.946 &#x000B1; 0.078</td>
</tr>
 <tr>
<td valign="top" align="left">CNN</td>
<td valign="top" align="center">0.923 &#x000B1; 0.016</td>
<td valign="top" align="center">0.892 &#x000B1; 0.041</td>
<td valign="top" align="center">0.885 &#x000B1; 0.048</td>
<td valign="top" align="center">0.898 &#x000B1; 0.060</td>
<td valign="top" align="center">0.891 &#x000B1; 0.085</td>
</tr>
 <tr>
<td valign="top" align="left">DNN</td>
<td valign="top" align="center">0.915 &#x000B1; 0.003</td>
<td valign="top" align="center">0.887 &#x000B1; 0.031</td>
<td valign="top" align="center">0.879 &#x000B1; 0.076</td>
<td valign="top" align="center">0.895 &#x000B1; 0.017</td>
<td valign="top" align="center">0.887 &#x000B1; 0.053</td>
</tr>
 <tr>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="center">0.908 &#x000B1; 0.070</td>
<td valign="top" align="center">0.875 &#x000B1; 0.060</td>
<td valign="top" align="center">0.868 &#x000B1; 0.028</td>
<td valign="top" align="center">0.882 &#x000B1; 0.026</td>
<td valign="top" align="center">0.875 &#x000B1; 0.052</td>
</tr>
 <tr>
<td valign="top" align="left">XGBClassifier</td>
<td valign="top" align="center">0.941 &#x000B1; 0.028</td>
<td valign="top" align="center">0.912 &#x000B1; 0.049</td>
<td valign="top" align="center">0.920 &#x000B1; 0.052</td>
<td valign="top" align="center">0.905 &#x000B1; 0.021</td>
<td valign="top" align="center">0.912 &#x000B1; 0.088</td>
</tr>
 <tr>
<td valign="top" align="left">RandomForestClassifier</td>
<td valign="top" align="center">0.934 &#x000B1; 0.022</td>
<td valign="top" align="center">0.907 &#x000B1; 0.063</td>
<td valign="top" align="center">0.915 &#x000B1; 0.059</td>
<td valign="top" align="center">0.900 &#x000B1; 0.016</td>
<td valign="top" align="center">0.907 &#x000B1; 0.027</td>
</tr>
 <tr>
<td valign="top" align="left">MLPClassifier</td>
<td valign="top" align="center">0.918 &#x000B1; 0.100</td>
<td valign="top" align="center">0.890 &#x000B1; 0.094</td>
<td valign="top" align="center">0.883 &#x000B1; 0.006</td>
<td valign="top" align="center">0.897 &#x000B1; 0.054</td>
<td valign="top" align="center">0.890 &#x000B1; 0.084</td>
</tr>
 <tr>
<td valign="top" align="left">LogisticRegression</td>
<td valign="top" align="center">0.892 &#x000B1; 0.050</td>
<td valign="top" align="center">0.853 &#x000B1; 0.085</td>
<td valign="top" align="center">0.847 &#x000B1; 0.033</td>
<td valign="top" align="center">0.859 &#x000B1; 0.052</td>
<td valign="top" align="center">0.853 &#x000B1; 0.005</td>
</tr>
 <tr>
<td valign="top" align="left">SVC</td>
<td valign="top" align="center">0.901 &#x000B1; 0.089</td>
<td valign="top" align="center">0.868 &#x000B1; 0.002</td>
<td valign="top" align="center">0.861 &#x000B1; 0.026</td>
<td valign="top" align="center">0.875 &#x000B1; 0.038</td>
<td valign="top" align="center">0.868 &#x000B1; 0.042</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="9">eICU</td>
<td valign="top" align="left">Our model</td>
<td valign="top" align="center">0.982 &#x000B1; 0.090</td>
<td valign="top" align="center">0.951 &#x000B1; 0.037</td>
<td valign="top" align="center">0.958 &#x000B1; 0.063</td>
<td valign="top" align="center">0.944 &#x000B1; 0.001</td>
<td valign="top" align="center">0.951 &#x000B1; 0.066</td>
</tr>
 <tr>
<td valign="top" align="left">CNN</td>
<td valign="top" align="center">0.915 &#x000B1; 0.067</td>
<td valign="top" align="center">0.901 &#x000B1; 0.045</td>
<td valign="top" align="center">0.910 &#x000B1; 0.079</td>
<td valign="top" align="center">0.892 &#x000B1; 0.010</td>
<td valign="top" align="center">0.901 &#x000B1; 0.030</td>
</tr>
 <tr>
<td valign="top" align="left">DNN</td>
<td valign="top" align="center">0.927 &#x000B1; 0.027</td>
<td valign="top" align="center">0.894 &#x000B1; 0.077</td>
<td valign="top" align="center">0.903 &#x000B1; 0.059</td>
<td valign="top" align="center">0.885 &#x000B1; 0.077</td>
<td valign="top" align="center">0.894 &#x000B1; 0.030</td>
</tr>
 <tr>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="center">0.920 &#x000B1; 0.020</td>
<td valign="top" align="center">0.887 &#x000B1; 0.081</td>
<td valign="top" align="center">0.896 &#x000B1; 0.085</td>
<td valign="top" align="center">0.878 &#x000B1; 0.010</td>
<td valign="top" align="center">0.887 &#x000B1; 0.052</td>
</tr>
 <tr>
<td valign="top" align="left">XGBClassifier</td>
<td valign="top" align="center">0.903 &#x000B1; 0.042</td>
<td valign="top" align="center">0.894 &#x000B1; 0.062</td>
<td valign="top" align="center">0.900 &#x000B1; 0.014</td>
<td valign="top" align="center">0.889 &#x000B1; 0.070</td>
<td valign="top" align="center">0.924 &#x000B1; 0.012</td>
</tr>
 <tr>
<td valign="top" align="left">RandomForestClassifier</td>
<td valign="top" align="center">0.946 &#x000B1; 0.050</td>
<td valign="top" align="center">0.917 &#x000B1; 0.032</td>
<td valign="top" align="center">0.925 &#x000B1; 0.060</td>
<td valign="top" align="center">0.909 &#x000B1; 0.004</td>
<td valign="top" align="center">0.917 &#x000B1; 0.000</td>
</tr>
 <tr>
<td valign="top" align="left">MLPClassifier</td>
<td valign="top" align="center">0.930 &#x000B1; 0.044</td>
<td valign="top" align="center">0.897 &#x000B1; 0.073</td>
<td valign="top" align="center">0.906 &#x000B1; 0.059</td>
<td valign="top" align="center">0.888 &#x000B1; 0.084</td>
<td valign="top" align="center">0.897 &#x000B1; 0.028</td>
</tr>
 <tr>
<td valign="top" align="left">LogisticRegression</td>
<td valign="top" align="center">0.898 &#x000B1; 0.021</td>
<td valign="top" align="center">0.857 &#x000B1; 0.090</td>
<td valign="top" align="center">0.851 &#x000B1; 0.093</td>
<td valign="top" align="center">0.863 &#x000B1; 0.001</td>
<td valign="top" align="center">0.857 &#x000B1; 0.073</td>
</tr>
<tr>
<td valign="top" align="left">SVC</td>
<td valign="top" align="center">0.913 &#x000B1; 0.076</td>
<td valign="top" align="center">0.879 &#x000B1; 0.010</td>
<td valign="top" align="center">0.872 &#x000B1; 0.045</td>
<td valign="top" align="center">0.886 &#x000B1; 0.053</td>
<td valign="top" align="center">0.879 &#x000B1; 0.058</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<label>4</label>
<title>Discussion</title>
<p>In this study, we propose a novel deep-learning framework for the early prediction of sepsis, specifically targeting detection within a clinically actionable timeframe of 7&#x02013;28 days prior to the onset of clinical suspicion. Our approach uniquely integrates structured state-space models (SSMs) within a Boosting framework. This novel integration facilitates the automatic adjustment of feature weight distributions, enables the construction of dynamic surrogate models through a forward-backward optimization mechanism, and enhances computational efficiency and scalability via multi-paradigm integration. Consequently, our framework aims to overcome limitations inherent in traditional single-paradigm predictive models. Experimental results demonstrate that our model achieves consistently high predictive accuracy across the defined time windows. Additionally, the framework supports model interpretability through the application of SHAP (SHapley Additive exPlanations) values for assessing local feature contributions and overall feature importance analysis.</p>
<p>Across various public Electronic Health Record (EHR) datasets, our model achieved a predictive accuracy ranging from 0.978 &#x000B1; 0.074 to 0.982 &#x000B1; 0.090 across diverse external datasets, demonstrating superior performance compared to baseline deep learning and traditional machine learning methods. This validates the effectiveness, generalizability, and efficiency of our model. It can rapidly adapt to diverse clinical settings, thereby paving the way for responsive healthcare systems.</p>
<p>Early diagnosis of sepsis currently faces numerous challenges. While approaches such as genomic profiling, monitoring of inflammatory markers, and EHR-based machine learning models have been proposed, patient heterogeneity, data noise, and variations in clinical workflows substantially impair their performance. Although current clinical diagnostic methods, such as the Sequential Organ Failure Assessment (SOFA) score and Procalcitonin/C-reactive Protein (PCT/CRP) testing, are widely adopted, their static assessment approach struggles to capture the dynamic pathological progression (AUC: 0.61&#x02013;0.88) (<xref ref-type="bibr" rid="B59">59</xref>), and they fail to detect early baseline fluctuation signals during the initial stages of infection (<xref ref-type="bibr" rid="B59">59</xref>). The lightweight dynamic prediction model developed in this study enables continuous monitoring within the 7- to 28-day window prior to clinical suspicion, significantly extending the intervention window compared to traditional methods (predictive accuracy: 0.978&#x02013;0.982). Furthermore, its adaptability across multiple time windows and strong generalizability provides critical infrastructure support for regional sepsis surveillance.</p>
<p>The model is strategically designed to meet the diverse requirements of various medical scenarios. Its lightweight architecture reduces computational demands, enabling operation on standard CPUs. Furthermore, its dynamic multi-paradigm integration mechanism facilitates optimal resource allocation, while the modular design allows for rapid implementation in primary healthcare settings. In contrast to existing treatment-oriented systems (<xref ref-type="bibr" rid="B60">60</xref>), the proposed model addresses limitations inherent in traditional algorithms for high-dimensional feature selection through a forward-backward optimization process and a dynamic agent framework. Additionally, SHAP values are employed to enhance clinical interpretability by identifying key predictors, such as creatinine levels, thereby supporting informed decision-making and fostering clinical trust. Economic analyses (<xref ref-type="bibr" rid="B61">61</xref>) indicate that medical costs for sepsis patients significantly exceed those for non-infected individuals, particularly when associated with nosocomial infections, where costs can increase substantially. Consequently, early warning facilitated by such models holds the potential to reduce complication rates and mortality, thereby alleviating the overall healthcare burden.</p>
<p>Nevertheless, this study has certain limitations: the heterogeneity of public databases could result in model generalization bias; while the sample imbalance issue was mitigated through the use of SMOTE, synthetic data could introduce clinically irrelevant artifacts; moreover, unmeasured confounding variables, including race and treatment preferences, as well as the generalizability to pediatric populations, require further validation through multi-center studies.</p>
<p>Future research will prioritize several key areas. These include leveraging Hospital Information Systems (HIS) for embedded Application Programming Interface (API) development, establishing a closed-loop management system encompassing the continuum from diagnosis to intervention, and optimizing individualized prediction accuracy via integrated multi-source data. Such advancements aim for healthcare professionals to rapidly access critical patient indicators and perform effective risk stratification. Ultimately, this work seeks to improve the overall quality of sepsis care&#x02014;spanning diagnosis, treatment, and management&#x02014;while enhancing the efficiency of resource utilization.</p>
</sec>
<sec sec-type="conclusion" id="s5">
<label>5</label>
<title>Conclusion</title>
<p>In summary, our proposed BOBM model, through a deeply coupled framework of Mamba-Tab and Boosting techniques, effectively enables early sepsis prediction across various time windows. Its lightweight architecture facilitates clinical deployment, and it demonstrates strong generalization capabilities. These innovations enhance the utility of clinical physiological indicators as predictive features, while simultaneously improving model interpretability.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The datasets presented in this study are publicly available. The MIMIC-IV dataset can be found on PhysioNet (<ext-link ext-link-type="uri" xlink:href="https://physionet.org/content/mimiciv">https://physionet.org/content/mimiciv</ext-link>/). The eICU-CRD is available at <ext-link ext-link-type="uri" xlink:href="https://physionet.org/content/eicu-crd/">https://physionet.org/content/eicu-crd/</ext-link>.</p>
</sec>
<sec sec-type="ethics-statement" id="s7">
<title>Ethics statement</title>
<p>Ethical approval was not required for the study involving humans in accordance with the local legislation and institutional requirements. Written informed consent to participate in this study was not required from the participants or the participants&#x00027; legal guardians/next of kin in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>WL: Data curation, Formal analysis, Investigation, Methodology, Visualization, Writing &#x02013; original draft. KX: Conceptualization, Methodology, Writing &#x02013; review &#x00026; editing. BG: Data curation, Methodology, Validation, Writing &#x02013; review &#x00026; editing. HZ: Data curation, Methodology, Validation, Writing &#x02013; review &#x00026; editing. DS: Conceptualization, Methodology, Writing &#x02013; review &#x00026; editing. RM: Methodology, Resources, Writing &#x02013; review &#x00026; editing. QW: Funding acquisition, Resources, Methodology, Supervision, Project administration, Writing &#x02013; review &#x00026; editing. QY: Conceptualization, Funding acquisition, Methodology, Project administration, Resources, Supervision, Writing &#x02013; review &#x00026; editing.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s10">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="s12">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmed.2025.1731854/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmed.2025.1731854/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kumar</surname> <given-names>S</given-names></name> <name><surname>Tripathy</surname> <given-names>S</given-names></name> <name><surname>Jyoti</surname> <given-names>A</given-names></name> <name><surname>Singh</surname> <given-names>SG</given-names></name></person-group>. <article-title>Recent advances in biosensors for diagnosis and detection of sepsis: a comprehensive review</article-title>. <source>Biosens Bioelectron</source>. (<year>2019</year>) 124&#x02013;<volume>5</volume>:<fpage>205</fpage>&#x02013;<lpage>15</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.bios.2018.10.034</pub-id><pub-id pub-id-type="pmid">30388563</pub-id></mixed-citation>
</ref>
<ref id="B2">
<label>2.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mancini</surname> <given-names>N</given-names></name> <name><surname>Carletti</surname> <given-names>S</given-names></name> <name><surname>Ghidoli</surname> <given-names>N</given-names></name> <name><surname>Cichero</surname> <given-names>P</given-names></name> <name><surname>Burioni</surname> <given-names>R</given-names></name> <name><surname>Clementi</surname> <given-names>M</given-names></name></person-group>. <article-title>The era of molecular and other non-culture-based methods in diagnosis of sepsis</article-title>. <source>Clin Microbiol Rev.</source> (<year>2010</year>) <volume>23</volume>:<fpage>235</fpage>&#x02013;<lpage>51</lpage>. doi: <pub-id pub-id-type="doi">10.1128/CMR.00043-09</pub-id><pub-id pub-id-type="pmid">20065332</pub-id></mixed-citation>
</ref>
<ref id="B3">
<label>3.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Opota</surname> <given-names>O</given-names></name> <name><surname>Croxatto</surname> <given-names>A</given-names></name> <name><surname>Prod&#x00027;hom</surname> <given-names>G</given-names></name> <name><surname>Greub</surname> <given-names>G</given-names></name></person-group>. <article-title>Blood culture-based diagnosis of bacteraemia: state of the art</article-title>. <source>Clin Microbiol Infect.</source> (<year>2015</year>) <volume>21</volume>:<fpage>313</fpage>&#x02013;<lpage>22</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cmi.2015.01.003</pub-id><pub-id pub-id-type="pmid">25753137</pub-id></mixed-citation>
</ref>
<ref id="B4">
<label>4.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rello</surname> <given-names>J</given-names></name> <name><surname>Alonso-Tarr&#x000E9;s</surname> <given-names>C</given-names></name></person-group>. <article-title>Emerging technologies for microbiologic diagnosis of sepsis: the rapid determination of resistance to antimicrobial agents should be the key</article-title>. <source>Clin Infect Dis.</source> (<year>2021</year>) <volume>73</volume>:<fpage>1173</fpage>&#x02013;<lpage>5</lpage>. doi: <pub-id pub-id-type="doi">10.1093/cid/ciab355</pub-id><pub-id pub-id-type="pmid">33895796</pub-id></mixed-citation>
</ref>
<ref id="B5">
<label>5.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Komorowski</surname> <given-names>M</given-names></name> <name><surname>Green</surname> <given-names>A</given-names></name> <name><surname>Tatham</surname> <given-names>KC</given-names></name> <name><surname>Seymour</surname> <given-names>C</given-names></name> <name><surname>Antcliffe</surname> <given-names>D</given-names></name></person-group>. <article-title>Sepsis biomarkers and diagnostic tools with a focus on machine learning</article-title>. <source>EBioMedicine.</source> (<year>2022</year>) <volume>86</volume>:<fpage>104394</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ebiom.2022.104394</pub-id><pub-id pub-id-type="pmid">36470834</pub-id></mixed-citation>
</ref>
<ref id="B6">
<label>6.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vincent</surname> <given-names>JL</given-names></name></person-group>. <article-title>The clinical challenge of sepsis identification and monitoring</article-title>. <source>PLoS Med.</source> (<year>2016</year>) <volume>13</volume>:<fpage>e1002022</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pmed.1002022</pub-id><pub-id pub-id-type="pmid">27187803</pub-id></mixed-citation>
</ref>
<ref id="B7">
<label>7.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rudd</surname> <given-names>KE</given-names></name> <name><surname>Kissoon</surname> <given-names>N</given-names></name> <name><surname>Limmathurotsakul</surname> <given-names>D</given-names></name> <name><surname>Bory</surname> <given-names>S</given-names></name> <name><surname>Mutahunga</surname> <given-names>B</given-names></name> <name><surname>Seymour</surname> <given-names>CW</given-names></name> <etal/></person-group>. <article-title>The global burden of sepsis: barriers and potential solutions</article-title>. <source>Crit Care.</source> (<year>2018</year>) <volume>22</volume>:<fpage>232</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13054-018-2157-z</pub-id><pub-id pub-id-type="pmid">30243300</pub-id></mixed-citation>
</ref>
<ref id="B8">
<label>8.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Umscheid</surname> <given-names>CA</given-names></name> <name><surname>Betesh</surname> <given-names>J</given-names></name> <name><surname>VanZandbergen</surname> <given-names>C</given-names></name> <name><surname>Hanish</surname> <given-names>A</given-names></name> <name><surname>Tait</surname> <given-names>G</given-names></name> <name><surname>Mikkelsen</surname> <given-names>ME</given-names></name> <etal/></person-group>. <article-title>Development, implementation, and impact of an automated early warning and response system for sepsis</article-title>. <source>J Hosp Med.</source> (<year>2015</year>) <volume>10</volume>:<fpage>26</fpage>&#x02013;<lpage>31</lpage>. doi: <pub-id pub-id-type="doi">10.1002/jhm.2259</pub-id><pub-id pub-id-type="pmid">25263548</pub-id></mixed-citation>
</ref>
<ref id="B9">
<label>9.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>JH</given-names></name> <name><surname>Kang</surname> <given-names>DR</given-names></name></person-group>. <article-title>From traditional statistical methods to machine and deep learning for prediction models</article-title>. <source>Cardiovasc Prev Pharmacother.</source> (<year>2020</year>) <volume>2</volume>:<fpage>50</fpage>&#x02013;<lpage>5</lpage>. doi: <pub-id pub-id-type="doi">10.36011/cpp.2020.2.e6</pub-id></mixed-citation>
</ref>
<ref id="B10">
<label>10.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tripepi</surname> <given-names>G</given-names></name> <name><surname>Jager</surname> <given-names>KJ</given-names></name> <name><surname>Dekker</surname> <given-names>FW</given-names></name> <name><surname>Zoccali</surname> <given-names>C</given-names></name></person-group>. <article-title>Linear and logistic regression analysis</article-title>. <source>Kidney Int.</source> (<year>2008</year>) <volume>73</volume>:<fpage>806</fpage>&#x02013;<lpage>10</lpage>. doi: <pub-id pub-id-type="doi">10.1038/sj.ki.5002787</pub-id></mixed-citation>
</ref>
<ref id="B11">
<label>11.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ranstam</surname> <given-names>J</given-names></name> <name><surname>Cook</surname> <given-names>JA</given-names></name></person-group>. <article-title>LASSO regression</article-title>. <source>Br J Surg.</source> (<year>2018</year>) <volume>105</volume>:<fpage>1348</fpage>. doi: <pub-id pub-id-type="doi">10.1002/bjs.10895</pub-id></mixed-citation>
</ref>
<ref id="B12">
<label>12.</label>
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Ahamed</surname> <given-names>MA</given-names></name> <name><surname>Cheng</surname> <given-names>Q</given-names></name></person-group>. <article-title>MambaTab: a plug-and-play model for learning tabular data</article-title>. In: <source>Proceedings of the 2024 IEEE 7th International Conference on Multimedia Information Processing and Retrieval (MIPR)</source>. <publisher-loc>San Jose, CA</publisher-loc>: <publisher-name>IEEE</publisher-name> (<year>2024</year>). p. <fpage>369</fpage>&#x02013;<lpage>75</lpage>. doi: <pub-id pub-id-type="doi">10.1109/MIPR62202.2024.00065</pub-id><pub-id pub-id-type="pmid">39850741</pub-id></mixed-citation>
</ref>
<ref id="B13">
<label>13.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shah</surname> <given-names>BR</given-names></name> <name><surname>Laupacis</surname> <given-names>A</given-names></name> <name><surname>Hux</surname> <given-names>JE</given-names></name> <name><surname>Austin</surname> <given-names>PC</given-names></name></person-group>. <article-title>Propensity score methods gave similar results to traditional regression modeling in observational studies: a systematic review</article-title>. <source>J Clin Epidemiol.</source> (<year>2005</year>) <volume>58</volume>:<fpage>550</fpage>&#x02013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jclinepi.2004.10.016</pub-id><pub-id pub-id-type="pmid">15878468</pub-id></mixed-citation>
</ref>
<ref id="B14">
<label>14.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Islam</surname> <given-names>KR</given-names></name> <name><surname>Prithula</surname> <given-names>J</given-names></name> <name><surname>Kumar</surname> <given-names>J</given-names></name> <name><surname>Tan</surname> <given-names>TL</given-names></name> <name><surname>Reaz</surname> <given-names>MBI</given-names></name> <name><surname>Sumon</surname> <given-names>MSI</given-names></name> <etal/></person-group>. <article-title>Machine learning-based early prediction of sepsis using electronic health records: a systematic review</article-title>. <source>J Clin Med.</source> (<year>2023</year>) <volume>12</volume>:<fpage>5658</fpage>. doi: <pub-id pub-id-type="doi">10.3390/jcm12175658</pub-id><pub-id pub-id-type="pmid">37685724</pub-id></mixed-citation>
</ref>
<ref id="B15">
<label>15.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Islam</surname> <given-names>MM</given-names></name> <name><surname>Nasrin</surname> <given-names>T</given-names></name> <name><surname>Walther</surname> <given-names>BA</given-names></name> <name><surname>Wu</surname> <given-names>CC</given-names></name> <name><surname>Yang HC Li</surname> <given-names>YC</given-names></name></person-group>. <article-title>Prediction of sepsis patients using machine learning approach: a meta-analysis</article-title>. <source>Comput Methods Programs Biomed.</source> (<year>2019</year>) <volume>170</volume>:<fpage>1</fpage>&#x02013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cmpb.2018.12.027</pub-id><pub-id pub-id-type="pmid">30712598</pub-id></mixed-citation>
</ref>
<ref id="B16">
<label>16.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Deng</surname> <given-names>H</given-names></name> <name><surname>Sun</surname> <given-names>M</given-names></name> <name><surname>Wang</surname> <given-names>Y</given-names></name> <name><surname>Zeng</surname> <given-names>J</given-names></name> <name><surname>Yuan</surname> <given-names>T</given-names></name> <name><surname>Li</surname> <given-names>T</given-names></name> <etal/></person-group>. <article-title>Evaluating machine learning models for sepsis prediction: a systematic review of methodologies</article-title>. <source>iScience.</source> (<year>2021</year>) <volume>25</volume>:<fpage>103651</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.isci.2021.103651</pub-id><pub-id pub-id-type="pmid">35028534</pub-id></mixed-citation>
</ref>
<ref id="B17">
<label>17.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>Q</given-names></name> <name><surname>Campan</surname> <given-names>A</given-names></name> <name><surname>Ren</surname> <given-names>A</given-names></name> <name><surname>Eid</surname> <given-names>WE</given-names></name></person-group>. <article-title>Automating and improving cardiovascular disease prediction using machine learning and EMR data features from a regional healthcare system</article-title>. <source>Int J Med Inf.</source> (<year>2022</year>) <volume>163</volume>:<fpage>104786</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2022.104786</pub-id><pub-id pub-id-type="pmid">35512622</pub-id></mixed-citation>
</ref>
<ref id="B18">
<label>18.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Richter-Laskowska</surname> <given-names>M</given-names></name> <name><surname>Sobotnicka</surname> <given-names>E</given-names></name> <name><surname>Bednorz</surname> <given-names>A</given-names></name></person-group>. <article-title>Cognitive performance classification of older patients using machine learning and electronic medical records</article-title>. <source>Sci Rep.</source> (<year>2025</year>) <volume>15</volume>:<fpage>6564</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-025-90460-y</pub-id><pub-id pub-id-type="pmid">39994339</pub-id></mixed-citation>
</ref>
<ref id="B19">
<label>19.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Goh</surname> <given-names>KH</given-names></name> <name><surname>Wang</surname> <given-names>L</given-names></name> <name><surname>Yeow</surname> <given-names>AYK</given-names></name> <name><surname>Poh</surname> <given-names>H</given-names></name> <name><surname>Li</surname> <given-names>K</given-names></name> <name><surname>Yeow</surname> <given-names>JJL</given-names></name> <etal/></person-group>. <article-title>Artificial intelligence in sepsis early prediction and diagnosis using unstructured data in healthcare</article-title>. <source>Nat Commun.</source> (<year>2021</year>) <volume>12</volume>:<fpage>711</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-021-20910-4</pub-id><pub-id pub-id-type="pmid">33514699</pub-id></mixed-citation>
</ref>
<ref id="B20">
<label>20.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Adamson</surname> <given-names>B</given-names></name> <name><surname>Waskom</surname> <given-names>M</given-names></name> <name><surname>Blarre</surname> <given-names>A</given-names></name> <name><surname>Kelly</surname> <given-names>J</given-names></name> <name><surname>Krismer</surname> <given-names>K</given-names></name> <name><surname>Nemeth</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Approach to machine learning for extraction of real-world data variables from electronic health records</article-title>. <source>Front Pharmacol.</source> (<year>2023</year>) <volume>14</volume>:<fpage>1180962</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fphar.2023.1180962</pub-id><pub-id pub-id-type="pmid">37781703</pub-id></mixed-citation>
</ref>
<ref id="B21">
<label>21.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fleuren</surname> <given-names>LM</given-names></name> <name><surname>Klausch</surname> <given-names>TLT</given-names></name> <name><surname>Zwager</surname> <given-names>CL</given-names></name> <name><surname>Schoonmade</surname> <given-names>LJ</given-names></name> <name><surname>Guo</surname> <given-names>T</given-names></name> <name><surname>Roggeveen</surname> <given-names>LF</given-names></name> <etal/></person-group>. <article-title>Machine learning for the prediction of sepsis: a systematic review and meta-analysis of diagnostic test accuracy</article-title>. <source>Intensive Care Med.</source> (<year>2020</year>) <volume>46</volume>:<fpage>383</fpage>&#x02013;<lpage>400</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00134-019-05872-y</pub-id><pub-id pub-id-type="pmid">31965266</pub-id></mixed-citation>
</ref>
<ref id="B22">
<label>22.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Furukawa</surname> <given-names>M</given-names></name> <name><surname>Kinoshita</surname> <given-names>K</given-names></name> <name><surname>Yamaguchi</surname> <given-names>J</given-names></name> <name><surname>Hori</surname> <given-names>S</given-names></name> <name><surname>Sakurai</surname> <given-names>A</given-names></name></person-group>. <article-title>Sepsis patients with complication of hypoglycemia and hypoalbuminemia are an early and easy identification of high mortality risk</article-title>. <source>Intern Emerg Med.</source> (<year>2019</year>) <volume>14</volume>:<fpage>539</fpage>&#x02013;<lpage>48</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11739-019-02034-2</pub-id><pub-id pub-id-type="pmid">30729384</pub-id></mixed-citation>
</ref>
<ref id="B23">
<label>23.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>L&#x00027;Heureux</surname> <given-names>A</given-names></name> <name><surname>Grolinger</surname> <given-names>K</given-names></name> <name><surname>Elyamany</surname> <given-names>HF</given-names></name> <name><surname>Capretz</surname> <given-names>MAM</given-names></name></person-group>. <article-title>Machine learning with big data: challenges and approaches</article-title>. <source>IEEE Access</source>. (<year>2017</year>) <volume>5</volume>:<fpage>7776</fpage>&#x02013;<lpage>97</lpage>. doi: <pub-id pub-id-type="doi">10.1109/ACCESS.2017.2696365</pub-id></mixed-citation>
</ref>
<ref id="B24">
<label>24.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ramakrishnaiah</surname> <given-names>Y</given-names></name> <name><surname>Macesic</surname> <given-names>N</given-names></name> <name><surname>Webb</surname> <given-names>GI</given-names></name> <name><surname>Peleg</surname> <given-names>AY</given-names></name> <name><surname>Tyagi</surname> <given-names>S</given-names></name> <name><surname>EHR-ML</surname></name></person-group>. <article-title>a data-driven framework for designing machine learning applications with electronic health records</article-title>. <source>Int J Med Inform.</source> (<year>2025</year>) <volume>196</volume>:<fpage>105816</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2025.105816</pub-id></mixed-citation>
</ref>
<ref id="B25">
<label>25.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Miotto</surname> <given-names>R</given-names></name> <name><surname>Wang</surname> <given-names>F</given-names></name> <name><surname>Wang</surname> <given-names>S</given-names></name> <name><surname>Jiang</surname> <given-names>X</given-names></name> <name><surname>Dudley</surname> <given-names>JT</given-names></name></person-group>. <article-title>Deep learning for healthcare: review, opportunities and challenges</article-title>. <source>Brief Bioinform.</source> (<year>2018</year>) <volume>19</volume>:<fpage>1236</fpage>&#x02013;<lpage>46</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bib/bbx044</pub-id><pub-id pub-id-type="pmid">28481991</pub-id></mixed-citation>
</ref>
<ref id="B26">
<label>26.</label>
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Rout</surname> <given-names>SK</given-names></name> <name><surname>Sahu</surname> <given-names>B</given-names></name> <name><surname>Regulwar</surname> <given-names>GB</given-names></name> <name><surname>Kavididevi</surname> <given-names>V</given-names></name></person-group>. <article-title>Deep learning in early prediction of sepsis and diagnosis</article-title>. In: <source>Proceedings of the 2023 International Conference for Advancement in Technology (ICONAT)</source>. <publisher-loc>Goa</publisher-loc>: <publisher-name>IEEE</publisher-name> (<year>2023</year>). p. <fpage>1</fpage>&#x02013;<lpage>5</lpage>. doi: <pub-id pub-id-type="doi">10.1109/ICONAT57137.2023.10080152</pub-id></mixed-citation>
</ref>
<ref id="B27">
<label>27.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shashikumar</surname> <given-names>SP</given-names></name> <name><surname>Wardi</surname> <given-names>G</given-names></name> <name><surname>Malhotra</surname> <given-names>A</given-names></name> <name><surname>Nemati</surname> <given-names>S</given-names></name></person-group>. <article-title>Artificial intelligence sepsis prediction algorithm learns to say &#x0201C;I don&#x00027;t know&#x0201D;</article-title>. <source>NPJ Digit Med.</source> (<year>2021</year>) <volume>4</volume>:<fpage>134</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41746-021-00504-6</pub-id><pub-id pub-id-type="pmid">34504260</pub-id></mixed-citation>
</ref>
<ref id="B28">
<label>28.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>van der Vegt</surname> <given-names>AH</given-names></name> <name><surname>Campbell</surname> <given-names>V</given-names></name> <name><surname>Mitchell</surname> <given-names>I</given-names></name> <name><surname>Malycha</surname> <given-names>J</given-names></name> <name><surname>Simpson</surname> <given-names>J</given-names></name> <name><surname>Flenady</surname> <given-names>T</given-names></name> <etal/></person-group>. <article-title>Systematic review and longitudinal analysis of implementing artificial intelligence to predict clinical deterioration in adult hospitals: what is known and what remains uncertain</article-title>. <source>J Am Med Inform Assoc.</source> (<year>2024</year>) <volume>31</volume>:<fpage>509</fpage>&#x02013;<lpage>24</lpage>. doi: <pub-id pub-id-type="doi">10.1093/jamia/ocad220</pub-id><pub-id pub-id-type="pmid">37964688</pub-id></mixed-citation>
</ref>
<ref id="B29">
<label>29.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y</given-names></name> <name><surname>Zhang</surname> <given-names>R</given-names></name> <name><surname>Yang</surname> <given-names>Q</given-names></name> <name><surname>Zhou</surname> <given-names>Q</given-names></name> <name><surname>Zhang</surname> <given-names>S</given-names></name> <name><surname>Fan</surname> <given-names>Y</given-names></name> <etal/></person-group>. <article-title>FairCare: adversarial training of a heterogeneous graph neural network with attention mechanism to learn fair representations of electronic health records</article-title>. <source>Inf Process Manage.</source> (<year>2024</year>) <volume>61</volume>:<fpage>103682</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ipm.2024.103682</pub-id></mixed-citation>
</ref>
<ref id="B30">
<label>30.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nigo</surname> <given-names>M</given-names></name> <name><surname>Rasmy</surname> <given-names>L</given-names></name> <name><surname>Mao</surname> <given-names>B</given-names></name> <name><surname>Kannadath</surname> <given-names>BS</given-names></name> <name><surname>Xie</surname> <given-names>Z</given-names></name> <name><surname>Zhi</surname> <given-names>D</given-names></name></person-group>. <article-title>Deep learning model for personalized prediction of positive MRSA culture using time-series electronic health records</article-title>. <source>Nat Commun.</source> (<year>2024</year>) <volume>15</volume>:<fpage>2036</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-024-46211-0</pub-id><pub-id pub-id-type="pmid">38448409</pub-id></mixed-citation>
</ref>
<ref id="B31">
<label>31.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bomrah</surname> <given-names>S</given-names></name> <name><surname>Uddin</surname> <given-names>M</given-names></name> <name><surname>Upadhyay</surname> <given-names>U</given-names></name> <name><surname>Komorowski</surname> <given-names>M</given-names></name> <name><surname>Priya</surname> <given-names>J</given-names></name> <name><surname>Dhar</surname> <given-names>E</given-names></name> <etal/></person-group>. <article-title>A scoping review of machine learning for sepsis prediction- feature engineering strategies and model performance: a step towards explainability</article-title>. <source>Crit Care.</source> (<year>2024</year>) <volume>28</volume>:<fpage>180</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13054-024-04948-6</pub-id><pub-id pub-id-type="pmid">38802973</pub-id></mixed-citation>
</ref>
<ref id="B32">
<label>32.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dou</surname> <given-names>Y</given-names></name> <name><surname>Li</surname> <given-names>W</given-names></name> <name><surname>Zomaya</surname> <given-names>AY</given-names></name></person-group>. <article-title>Transformer-based unsupervised learning for early detection of sepsis (student abstract)</article-title>. <source>Proc AAAI Conf Artif Intell.</source> (<year>2022</year>) <volume>36</volume>:<fpage>12937</fpage>&#x02013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.1609/aaai.v36i11.21605</pub-id></mixed-citation>
</ref>
<ref id="B33">
<label>33.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>L</given-names></name> <name><surname>Yin</surname> <given-names>Y</given-names></name> <name><surname>Glampson</surname> <given-names>B</given-names></name> <name><surname>Peach</surname> <given-names>R</given-names></name> <name><surname>Barahona</surname> <given-names>M</given-names></name> <name><surname>Delaney</surname> <given-names>BC</given-names></name> <etal/></person-group>. <article-title>Transformer-based deep learning model for the diagnosis of suspected lung cancer in primary care based on electronic health record data</article-title>. <source>EBioMedicine.</source> (<year>2024</year>) <volume>110</volume>:<fpage>105442</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ebiom.2024.105442</pub-id><pub-id pub-id-type="pmid">39536394</pub-id></mixed-citation>
</ref>
<ref id="B34">
<label>34.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Renc</surname> <given-names>P</given-names></name> <name><surname>Jia</surname> <given-names>Y</given-names></name> <name><surname>Samir</surname> <given-names>AE</given-names></name> <name><surname>Was</surname> <given-names>J</given-names></name> <name><surname>Li</surname> <given-names>Q</given-names></name> <name><surname>Bates</surname> <given-names>DW</given-names></name> <etal/></person-group>. <article-title>Zero shot health trajectory prediction using Transformer</article-title>. <source>npj Digit Med.</source> (<year>2024</year>) <volume>7</volume>:<fpage>256</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41746-024-01235-0</pub-id><pub-id pub-id-type="pmid">39300208</pub-id></mixed-citation>
</ref>
<ref id="B35">
<label>35.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname> <given-names>Y</given-names></name> <name><surname>Zhang</surname> <given-names>Y</given-names></name> <name><surname>Li</surname> <given-names>J</given-names></name> <name><surname>A</surname></name></person-group>. <article-title>time series driven model for early sepsis prediction based on Transformer module</article-title>. <source>BMC Med Res Methodol.</source> (<year>2024</year>) <volume>24</volume>:<fpage>23</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12874-023-02138-6</pub-id></mixed-citation>
</ref>
<ref id="B36">
<label>36.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Saria</surname> <given-names>S</given-names></name> <name><surname>Henry</surname> <given-names>KE</given-names></name></person-group>. <article-title>Too many definitions of sepsis: can machine learning leverage the electronic health record to increase accuracy and bring consensus?</article-title> <source>Crit Care Med</source>. (<year>2020</year>) <volume>48</volume>:<fpage>137</fpage>&#x02013;<lpage>41</lpage>. doi: <pub-id pub-id-type="doi">10.1097/CCM.0000000000004144</pub-id><pub-id pub-id-type="pmid">31939780</pub-id></mixed-citation>
</ref>
<ref id="B37">
<label>37.</label>
<mixed-citation publication-type="web"><person-group person-group-type="author"><name><surname>Gu</surname> <given-names>A</given-names></name> <name><surname>Dao</surname> <given-names>T</given-names></name></person-group>. <source>Mamba: Linear-Time Sequence Modeling With Selective State Spaces.</source> arXiv preprint [Preprint] (<year>2023</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.48550/arXiv.2312.00752">https://doi.org/10.48550/arXiv.2312.00752</ext-link> (Accessed August 14, 2025).</mixed-citation>
</ref>
<ref id="B38">
<label>38.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>He</surname> <given-names>X</given-names></name> <name><surname>Cao</surname> <given-names>K</given-names></name> <name><surname>Zhang</surname> <given-names>J</given-names></name> <name><surname>Yan</surname> <given-names>K</given-names></name> <name><surname>Wang</surname> <given-names>Y</given-names></name> <name><surname>Li</surname> <given-names>R</given-names></name> <etal/></person-group>. <article-title>Pan-Mamba: effective pan-sharpening with state space model</article-title>. <source>Inf Fusion.</source> (<year>2025</year>) <volume>115</volume>:<fpage>102779</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.inffus.2024.102779</pub-id></mixed-citation>
</ref>
<ref id="B39">
<label>39.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Elfwing</surname> <given-names>S</given-names></name> <name><surname>Uchibe</surname> <given-names>E</given-names></name> <name><surname>Doya</surname> <given-names>K</given-names></name></person-group>. <article-title>Sigmoid-weighted linear units for neural network function approximation in reinforcement learning</article-title>. <source>Neural Netw.</source> (<year>2018</year>) <volume>107</volume>:<fpage>3</fpage>&#x02013;<lpage>11</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neunet.2017.12.012</pub-id><pub-id pub-id-type="pmid">29395652</pub-id></mixed-citation>
</ref>
<ref id="B40">
<label>40.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Freund</surname> <given-names>Y</given-names></name> <name><surname>Iyer</surname> <given-names>R</given-names></name> <name><surname>Schapire</surname> <given-names>RE</given-names></name> <name><surname>Singer</surname> <given-names>Y</given-names></name></person-group>. <article-title>An efficient boosting algorithm for combining preferences</article-title>. <source>J Mach Learn Res.</source> (<year>2003</year>) <volume>4</volume>:<fpage>933</fpage>&#x02013;<lpage>69</lpage>. doi: <pub-id pub-id-type="doi">10.5555/945365.964285</pub-id></mixed-citation>
</ref>
<ref id="B41">
<label>41.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bickel</surname> <given-names>PJ</given-names></name> <name><surname>Ritov</surname> <given-names>Y</given-names></name> <name><surname>Zakai</surname> <given-names>A</given-names></name></person-group>. <article-title>Some theory for generalized boosting algorithms</article-title>. <source>J Mach Learn Res.</source> (<year>2006</year>) <volume>7</volume>:<fpage>705</fpage>&#x02013;<lpage>32</lpage>.</mixed-citation>
</ref>
<ref id="B42">
<label>42.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Di Fiore</surname> <given-names>F</given-names></name> <name><surname>Nardelli</surname> <given-names>M</given-names></name> <name><surname>Mainini</surname> <given-names>L</given-names></name></person-group>. <article-title>Active learning and Bayesian optimization: a unified perspective to learn with a goal</article-title>. <source>Arch Comput Methods Eng.</source> (<year>2024</year>) <volume>31</volume>:<fpage>2985</fpage>&#x02013;<lpage>3013</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11831-024-10064-z</pub-id></mixed-citation>
</ref>
<ref id="B43">
<label>43.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>M</given-names></name> <name><surname>Yang</surname> <given-names>S</given-names></name> <name><surname>Wu</surname> <given-names>C</given-names></name> <name><surname>Marom</surname> <given-names>N</given-names></name></person-group>. <article-title>Machine learning the Hubbard <italic>U</italic> parameter in DFT&#x0002B;<italic>U</italic> using Bayesian optimization</article-title>. <source>npj Comput Mater.</source> (<year>2020</year>) <volume>6</volume>:<fpage>180</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41524-020-00446-9</pub-id></mixed-citation>
</ref>
<ref id="B44">
<label>44.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>X</given-names></name> <name><surname>Jin</surname> <given-names>Y</given-names></name> <name><surname>Schmitt</surname> <given-names>S</given-names></name> <name><surname>Olhofer</surname> <given-names>M</given-names></name></person-group>. <article-title>Recent advances in Bayesian optimization</article-title>. <source>ACM Comput Surv.</source> (<year>2013</year>) <volume>55</volume>:<fpage>1</fpage>&#x02013;<lpage>36</lpage>. doi: <pub-id pub-id-type="doi">10.1145/3582078</pub-id></mixed-citation>
</ref>
<ref id="B45">
<label>45.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Johnson</surname> <given-names>AEW</given-names></name> <name><surname>Bulgarelli</surname> <given-names>L</given-names></name> <name><surname>Shen</surname> <given-names>L</given-names></name> <name><surname>Gayles</surname> <given-names>A</given-names></name> <name><surname>Shammout</surname> <given-names>A</given-names></name> <name><surname>Horng</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>MIMIC-IV, a freely accessible electronic health record dataset</article-title>. <source>Sci Data.</source> (<year>2023</year>) <volume>10</volume>:<fpage>1</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41597-023-01945-2</pub-id><pub-id pub-id-type="pmid">36596836</pub-id></mixed-citation>
</ref>
<ref id="B46">
<label>46.</label>
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Johnson</surname> <given-names>A</given-names></name> <name><surname>Bulgarelli</surname> <given-names>L</given-names></name> <name><surname>Pollard</surname> <given-names>T</given-names></name> <name><surname>Gow</surname> <given-names>B</given-names></name> <name><surname>Moody</surname> <given-names>B</given-names></name> <name><surname>Horng</surname> <given-names>S</given-names></name> <etal/></person-group>. <source>MIMIC-IV (Version 3.1)</source>. <publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>PhysioNet</publisher-name> (<year>2024</year>).</mixed-citation>
</ref>
<ref id="B47">
<label>47.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Singer</surname> <given-names>M</given-names></name> <name><surname>Deutschman</surname> <given-names>CS</given-names></name> <name><surname>Seymour</surname> <given-names>CW</given-names></name> <name><surname>Shankar-Hari</surname> <given-names>M</given-names></name> <name><surname>Annane</surname> <given-names>D</given-names></name> <name><surname>Bauer</surname> <given-names>M</given-names></name> <etal/></person-group>. <article-title>The third international consensus definitions for sepsis and septic shock (sepsis-3)</article-title>. <source>JAMA.</source> (<year>2016</year>) <volume>315</volume>:<fpage>801</fpage>&#x02013;<lpage>10</lpage>. doi: <pub-id pub-id-type="doi">10.1001/jama.2016.0287</pub-id></mixed-citation>
</ref>
<ref id="B48">
<label>48.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Iwashyna</surname> <given-names>TJ</given-names></name> <name><surname>Hodgson</surname> <given-names>CL</given-names></name> <name><surname>Pilcher</surname> <given-names>D</given-names></name> <name><surname>Bailey</surname> <given-names>M</given-names></name> <name><surname>van Lint</surname> <given-names>A</given-names></name> <name><surname>Chavan</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Timing of onset and burden of persistent critical illness in Australia and New Zealand: a retrospective, population-based, observational study</article-title>. <source>Lancet Respir Med.</source> (<year>2016</year>) <volume>4</volume>:<fpage>566</fpage>&#x02013;<lpage>73</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S2213-2600(16)30098-4</pub-id><pub-id pub-id-type="pmid">27155770</pub-id></mixed-citation>
</ref>
<ref id="B49">
<label>49.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Z</given-names></name> <name><surname>Ho</surname> <given-names>KM</given-names></name> <name><surname>Gu</surname> <given-names>H</given-names></name> <name><surname>Hong</surname> <given-names>Y</given-names></name> <name><surname>Yu</surname> <given-names>Y</given-names></name></person-group>. <article-title>Defining persistent critical illness based on growth trajectories in patients with sepsis</article-title>. <source>Crit Care.</source> (<year>2020</year>) <volume>24</volume>:<fpage>57</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13054-020-2768-z</pub-id><pub-id pub-id-type="pmid">32070393</pub-id></mixed-citation>
</ref>
<ref id="B50">
<label>50.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ioanas</surname> <given-names>M</given-names></name> <name><surname>Cavalcanti</surname> <given-names>M</given-names></name> <name><surname>Ferrer</surname> <given-names>M</given-names></name> <name><surname>Valencia</surname> <given-names>M</given-names></name> <name><surname>Agusti</surname> <given-names>C</given-names></name> <name><surname>Puig</surname> <given-names>de</given-names></name></person-group>. <article-title>la Bellacasa J, et al. Hospital-acquired pneumonia: coverage and treatment adequacy of current guidelines</article-title>. <source>Eur Respir J.</source> (<year>2003</year>) <volume>22</volume>:<fpage>876</fpage>&#x02013;<lpage>82</lpage>. doi: <pub-id pub-id-type="doi">10.1183/09031936.03.00045903</pub-id></mixed-citation>
</ref>
<ref id="B51">
<label>51.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kahn</surname> <given-names>JM</given-names></name> <name><surname>Le</surname> <given-names>T</given-names></name> <name><surname>Angus</surname> <given-names>DC</given-names></name> <name><surname>Cox</surname> <given-names>CE</given-names></name> <name><surname>Hough</surname> <given-names>CL</given-names></name> <name><surname>White</surname> <given-names>DB</given-names></name> <etal/></person-group>. <article-title>The epidemiology of chronic critical illness in the United States<sup>&#x0002A;</sup></article-title>. <source>Crit Care Med.</source> (<year>2015</year>) <volume>43</volume>:<fpage>282</fpage>&#x02013;<lpage>7</lpage>. doi: <pub-id pub-id-type="doi">10.1097/CCM.0000000000000710</pub-id><pub-id pub-id-type="pmid">25377018</pub-id></mixed-citation>
</ref>
<ref id="B52">
<label>52.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gentile</surname> <given-names>LF</given-names></name> <name><surname>Cuenca</surname> <given-names>AG</given-names></name> <name><surname>Efron</surname> <given-names>PA</given-names></name> <name><surname>Ang</surname> <given-names>D</given-names></name> <name><surname>Bihorac</surname> <given-names>A</given-names></name> <name><surname>McKinley</surname> <given-names>BA</given-names></name> <etal/></person-group>. <article-title>Persistent inflammation and immunosuppression: a common syndrome and new horizon for surgical intensive care</article-title>. <source>J Trauma Acute Care Surg.</source> (<year>2012</year>) <volume>72</volume>:<fpage>1491</fpage>&#x02013;<lpage>501</lpage>. doi: <pub-id pub-id-type="doi">10.1097/TA.0b013e318256e000</pub-id><pub-id pub-id-type="pmid">22695412</pub-id></mixed-citation>
</ref>
<ref id="B53">
<label>53.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Efron</surname> <given-names>PA</given-names></name> <name><surname>Mohr</surname> <given-names>AM</given-names></name> <name><surname>Bihorac</surname> <given-names>A</given-names></name> <name><surname>Horiguchi</surname> <given-names>H</given-names></name> <name><surname>Hollen</surname> <given-names>MK</given-names></name> <name><surname>Segal</surname> <given-names>MS</given-names></name> <etal/></person-group>. <article-title>Persistent inflammation, immunosuppression, and catabolism and the development of chronic critical illness after surgery</article-title>. <source>Surgery.</source> (<year>2018</year>) <volume>164</volume>:<fpage>178</fpage>&#x02013;<lpage>84</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.surg.2018.04.011</pub-id><pub-id pub-id-type="pmid">29807651</pub-id></mixed-citation>
</ref>
<ref id="B54">
<label>54.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Miller</surname> <given-names>SI</given-names></name> <name><surname>Wallace RJ</surname> <given-names>Jr</given-names></name> <name><surname>Musher</surname> <given-names>DM</given-names></name> <name><surname>Septimus</surname> <given-names>EJ</given-names></name> <name><surname>Kohl</surname> <given-names>S</given-names></name> <name><surname>Baughn</surname> <given-names>RE</given-names></name></person-group>. <article-title>Hypoglycemia as a manifestation of sepsis</article-title>. <source>Am J Med.</source> (<year>1980</year>) <volume>68</volume>:<fpage>649</fpage>&#x02013;<lpage>54</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0002-9343(80)90250-8</pub-id><pub-id pub-id-type="pmid">6990758</pub-id></mixed-citation>
</ref>
<ref id="B55">
<label>55.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Maheshwari</surname> <given-names>K</given-names></name> <name><surname>Nathanson</surname> <given-names>BH</given-names></name> <name><surname>Munson</surname> <given-names>SH</given-names></name> <name><surname>Khangulov</surname> <given-names>V</given-names></name> <name><surname>Stevens</surname> <given-names>M</given-names></name> <name><surname>Badani</surname> <given-names>H</given-names></name> <etal/></person-group>. <article-title>The relationship between ICU hypotension and in-hospital mortality and morbidity in septic patients</article-title>. <source>Intensive Care Med.</source> (<year>2018</year>) <volume>44</volume>:<fpage>857</fpage>&#x02013;<lpage>67</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00134-018-5218-5</pub-id><pub-id pub-id-type="pmid">29872882</pub-id></mixed-citation>
</ref>
<ref id="B56">
<label>56.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pollard</surname> <given-names>TJ</given-names></name> <name><surname>Johnson</surname> <given-names>AEW</given-names></name> <name><surname>Raffa</surname> <given-names>JD</given-names></name> <name><surname>Celi</surname> <given-names>LA</given-names></name> <name><surname>Mark</surname> <given-names>RG</given-names></name> <name><surname>Badawi</surname> <given-names>O</given-names></name></person-group>. <article-title>The eICU Collaborative Research Database, a freely available multi-center database for critical care research</article-title>. <source>Sci Data.</source> (<year>2018</year>) <volume>5</volume>:<fpage>180178</fpage>. doi: <pub-id pub-id-type="doi">10.1038/sdata.2018.178</pub-id><pub-id pub-id-type="pmid">30204154</pub-id></mixed-citation>
</ref>
<ref id="B57">
<label>57.</label>
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>P</given-names></name> <name><surname>Chen</surname> <given-names>L</given-names></name> <name><surname>Zhang</surname> <given-names>Z</given-names></name></person-group>. <source>Critical Care Database Comprising Patients With Infection at Zigong Fourth People&#x00027;s Hospital (Version 1.1)</source>. <publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>PhysioNet</publisher-name> (<year>2022</year>).</mixed-citation>
</ref>
<ref id="B58">
<label>58.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>P</given-names></name> <name><surname>Chen</surname> <given-names>L</given-names></name> <name><surname>Zhu</surname> <given-names>Y</given-names></name> <name><surname>Yu</surname> <given-names>S</given-names></name> <name><surname>Chen</surname> <given-names>R</given-names></name> <name><surname>Huang</surname> <given-names>W</given-names></name> <etal/></person-group>. <article-title>Critical care database comprising patients with infection</article-title>. <source>Front Public Health.</source> (<year>2022</year>) <volume>10</volume>:<fpage>852410</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpubh.2022.852410</pub-id><pub-id pub-id-type="pmid">35372245</pub-id></mixed-citation>
</ref>
<ref id="B59">
<label>59.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Minne</surname> <given-names>L</given-names></name> <name><surname>Abu-Hanna</surname> <given-names>A</given-names></name> <name><surname>de Jonge</surname> <given-names>E</given-names></name></person-group>. <article-title>Evaluation of SOFA-based models for predicting mortality in the ICU: a systematic review</article-title>. <source>Crit Care.</source> (<year>2008</year>) <volume>12</volume>:<fpage>R161</fpage>. doi: <pub-id pub-id-type="doi">10.1186/cc7160</pub-id><pub-id pub-id-type="pmid">19091120</pub-id></mixed-citation>
</ref>
<ref id="B60">
<label>60.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schober</surname> <given-names>P</given-names></name> <name><surname>Vetter</surname> <given-names>TR</given-names></name></person-group>. <article-title>Logistic regression in medical research</article-title>. <source>Anesth Analg.</source> (<year>2021</year>) <volume>132</volume>:<fpage>365</fpage>&#x02013;<lpage>66</lpage>. doi: <pub-id pub-id-type="doi">10.1213/ANE.0000000000005247</pub-id><pub-id pub-id-type="pmid">33449558</pub-id></mixed-citation>
</ref>
<ref id="B61">
<label>61.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>LaValley</surname> <given-names>MP</given-names></name></person-group>. <article-title>Logistic regression</article-title>. <source>Circulation.</source> (<year>2008</year>) <volume>117</volume>:<fpage>2395</fpage>&#x02013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.106.682658</pub-id></mixed-citation>
</ref>
<ref id="B62">
<label>62.</label>
<mixed-citation publication-type="web"><person-group person-group-type="author"><name><surname>Frazier</surname> <given-names>P</given-names></name></person-group>. <source>A Tutorial on Bayesian Optimization</source>. arXiv preprint [Preprint] (<year>2018</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.48550/arXiv.1807.02811">https://doi.org/10.48550/arXiv.1807.02811</ext-link> (Accessed August 14, 2025).</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1971175/overview">Changqing Cheng</ext-link>, Binghamton University, United States</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/361366/overview">Mart&#x000ED;n Manuel Ledesma</ext-link>, CONICET Institute of Experimental Medicine, Argentina</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3279934/overview">Yilin Fan</ext-link>, Hebei University of Technology, China</p>
</fn>
</fn-group>
</back>
</article>