<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article article-type="research-article" dtd-version="1.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Bioinform.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Bioinformatics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Bioinform.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2673-7647</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1787360</article-id>
<article-id pub-id-type="doi">10.3389/fbinf.2026.1787360</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>From clinical phenotypes to genomic signatures: machine learning integration for precision tuberculosis treatment prediction </article-title>
<alt-title alt-title-type="left-running-head">Li et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fbinf.2026.1787360">10.3389/fbinf.2026.1787360</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Liping</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1640730"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Huanqing</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3312719"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lei</surname>
<given-names>Qian</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Tingting</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2242620"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing - review and editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
</contrib>
</contrib-group>
<aff id="aff1">
<label>1</label>
<institution>Yizhi School of Agriculture and Forestry, Xianyang Vocational Technical College</institution>, <city>Xian Yang</city>, <state>Shaanxi</state>, <country country="CN">China</country>
</aff>
<aff id="aff2">
<label>2</label>
<institution>Information Management Office, Northwestern Polytechnical University</institution>, <city>Xi&#x2019;an</city>, <state>Shaanxi</state>, <country country="CN">China</country>
</aff>
<aff id="aff3">
<label>3</label>
<institution>Department of Pharmacy, Xi&#x2019;an Chest Hospital</institution>, <city>Xi&#x2019;an</city>, <state>Shaanxi</state>, <country country="CN">China</country>
</aff>
<aff id="aff4">
<label>4</label>
<institution>Drug Clinical Trial Institution Office, Xi&#x2019;an Chest Hospital</institution>, <city>Xi&#x2019;an</city>, <state>Shaanxi</state>, <country country="CN">China</country>
</aff>
<author-notes>
<corresp id="c001">
<label>&#x2a;</label>Correspondence: Tingting Li, <email xlink:href="mailto:lt881117@163.com">lt881117@163.com</email>
</corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-03">
<day>03</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>6</volume>
<elocation-id>1787360</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>29</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Li, Liu, Lei and Li.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Li, Liu, Lei and Li</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-03">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Tuberculosis (TB) remains a major global health threat, causing approximately 1.5 million deaths each year. Despite progress in treatment, 15%&#x2013;20% of patients still experience treatment failure or relapse, highlighting the urgent need for precise predictive tools for early identification of high-risk patients. Current methods based on clinical parameters have limitations in prediction accuracy and revealing potential biological mechanisms.</p>
</sec>
<sec>
<title>Methods</title>
<p>This study developed and validated an innovative multi-omics integration prediction model. We retrospectively collected clinical data from 467 tuberculosis patients and integrated transcriptomic data from three independent public cohorts (GSE19491, GSE31312, GSE83456), involving 3,240 differentially expressed genes. Through advanced feature engineering and bioinformatics analysis, key features were selected. We systematically evaluated 12 machine learning algorithms and adopted an ensemble learning strategy to construct the final model. Model performance was evaluated through strict cross-validation and prospective validation cohorts.</p>
</sec>
<sec>
<title>Results</title>
<p>Clinical data analysis identified age, body mass index (BMI), and C-reactive protein (CRP) levels as significant predictors of treatment response. Transcriptomic analysis revealed 1,247 differentially expressed genes between responders and non-responders, enriched in immune response and metabolic pathways. Among the tested algorithms, the ensemble model based on Extra Trees performed the best, with an area under the curve (AUC) of 0.986, significantly superior to models using only clinical data (AUC &#x3d; 0.850) or only genomic data (AUC &#x3d; 0.820). Feature importance analysis confirmed CRP, specific gene features (such as DNA repair and interferon response pathways), age, and BMI as the most important predictors. External validation confirmed the model&#x2019;s robustness (AUC &#x3d; 0.972).</p>
</sec>
<sec>
<title>Conclusion</title>
<p>This study successfully developed a high-precision prediction model integrating clinical and genomics data, capable of early identification of high-risk patients with poor treatment response. The model demonstrates excellent prediction performance and generalization ability, providing a powerful tool for moving towards tuberculosis precision medicine, guiding individualized treatment strategies to improve patient prognosis and control the spread of drug resistance.</p>
</sec>
<sec>
<title>Clinical Trial Registration</title>
<p>
<ext-link ext-link-type="uri" xlink:href="https://www.chictr.org.cn/">https://www.chictr.org.cn/</ext-link>, ChiCTR2300074328, 03/08/2023.</p>
</sec>
</abstract>
<kwd-group>
<kwd>biomarkers</kwd>
<kwd>machine learning</kwd>
<kwd>multi-omics integration</kwd>
<kwd>precision medicine</kwd>
<kwd>treatment response prediction</kwd>
<kwd>tuberculosis</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was not received for this work and/or its publication.</funding-statement>
</funding-group>
<counts>
<fig-count count="10"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="34"/>
<page-count count="00"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>RNA Bioinformatics</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Background</title>
<p>Tuberculosis (TB) continues to represent one of the most significant global health challenges of the 21st century, with an estimated 10 million new cases and 1.5 million deaths annually worldwide (<xref ref-type="bibr" rid="B34">World health organization, 2024</xref>). Despite remarkable advances in diagnostic and therapeutic approaches over the past decades, treatment outcomes remain highly variable, with approximately 15%&#x2013;20% of patients experiencing treatment failure or relapse (<xref ref-type="bibr" rid="B20">Osman et al., 2019</xref>). This variability not only compromises individual patient outcomes but also contributes to the emergence of drug-resistant strains, further complicating global TB control efforts (<xref ref-type="bibr" rid="B30">The Lancet Microbe, 2024</xref>). The critical need for improved predictive tools that can identify patients at risk of poor treatment response early in their therapeutic course has never been more urgent (<xref ref-type="bibr" rid="B11">Gupta et al., 2020</xref>).</p>
<p>Contemporary approaches to TB treatment response prediction rely predominantly on clinical parameters such as sputum smear conversion, chest radiography findings, and basic laboratory markers including C-reactive protein (CRP) and erythrocyte sedimentation rate (ESR) (<xref ref-type="bibr" rid="B32">WHO, 2022</xref>; <xref ref-type="bibr" rid="B22">Park et al., 1999</xref>; <xref ref-type="bibr" rid="B1">Berry et al., 2010</xref>). However, these conventional methods suffer from significant limitations: they lack the precision and early predictive capability needed for optimal patient management, provide limited prognostic value, and fail to capture the complex biological mechanisms underlying treatment response variability (<xref ref-type="bibr" rid="B19">O&#x27;Garra et al., 2013</xref>; <xref ref-type="bibr" rid="B26">Singhania et al., 2018a</xref>). The absence of reliable predictive biomarkers has resulted in a &#x201c;one-size-fits-all&#x201d; approach to TB treatment, which may contribute to suboptimal outcomes and the development of drug resistance (<xref ref-type="bibr" rid="B14">Kendall et al., 2015</xref>; <xref ref-type="bibr" rid="B3">Cohen and Murray, 2004</xref>).</p>
<p>The emergence of multi-omics technologies has revolutionized our understanding of complex biological systems and offers unprecedented opportunities to unravel the intricate biological networks governing disease progression and treatment response (<xref ref-type="bibr" rid="B27">Singhania et al., 2018b</xref>). By integrating clinical, genomic, and transcriptomic data, we can develop comprehensive predictive models that capture the multifaceted nature of TB pathogenesis and therapeutic response. Recent advances in machine learning and artificial intelligence provide powerful computational tools for analyzing these complex, high-dimensional datasets and extracting clinically meaningful patterns that would be impossible to identify through traditional analytical approaches (<xref ref-type="bibr" rid="B33">Wong et al., 2021</xref>; <xref ref-type="bibr" rid="B15">Khera et al., 2018</xref>).</p>
<p>In this groundbreaking study, we present a novel multi-omics integration framework that combines comprehensive clinical data from 467 TB patients with genomic expression profiles from three independent cohorts. Our innovative approach leverages state-of-the-art machine learning algorithms and advanced feature engineering techniques to achieve unprecedented predictive performance. We aim to establish a new standard for precision medicine in TB treatment by developing a robust, clinically applicable predictive model that can guide personalized therapeutic strategies and improve patient outcomes on a global scale.</p>
</sec>
<sec sec-type="methods" id="s2">
<title>Methods</title>
<sec id="s2-1">
<title>Study design and data collection</title>
<p>This study developed a predictive model for tuberculosis treatment response using a multi-omics integration approach. This study employed a pragmatic randomized controlled trial design, enrolling tuberculosis patients admitted to Xi&#x2019;an Chest Hospital from September 2023 to December 2024. The study protocol was approved by the Ethics Committee for Medical Scientific Research of Xi&#x2019;an Chest hospital (Approval number: S2023-0002), and was conducted in accordance with the Helsinki Declaration. Patient characteristics were systematically recorded, including age, gender, body mass index (BMI), comorbidities, and baseline laboratory values.</p>
<p>Treatment response was evaluated using standardized criteria, including negative sputum culture, radiological improvement, and clinical symptom relief at 2-month and 6-month follow-ups. Genomic data were obtained from three independent Gene Expression Omnibus (GEO) datasets: GSE19491 (n &#x3d; 156), GSE31312 (n &#x3d; 203), and GSE83456 (n &#x3d; 108), providing a total of 3,240 differentially expressed genes for comprehensive analysis. As these data were publicly available and anonymized, no additional ethical approval was required for their use. This study adhered to GEO&#x2019;s data access policies and relevant ethical guidelines.</p>
</sec>
<sec id="s2-2">
<title>Feature selection</title>
<p>This comprehensive study design illustrated the systematic integration of clinical and genomic data through advanced machine learning algorithms for tuberculosis treatment response prediction. The framework demonstrated a sophisticated multi-omics approach that combined clinical parameters from 467 TB patients with genomic expression profiles from three independent cohorts (GSE19491, GSE31312, GSE83456), initially encompassing 3,240 differentially expressed genes. The design encompassed five critical phases: data collection and preprocessing, feature engineering and selection, multi-omics integration, machine learning model development, and comprehensive validation (<xref ref-type="fig" rid="F1">Figure 1</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>CONSORT Flow Diagram about prospective cohort study on the pharmaceutical service model for therapeutic drug monitoring (TDM) in anti-tuberculosis treatment.</p>
</caption>
<graphic xlink:href="fbinf-06-1787360-g001.tif">
<alt-text content-type="machine-generated">Flowchart depicting a randomized allocation of 489 tuberculosis patients receiving first-line treatment into pharmacist intervention and control groups, outlining blood sample procedures, dose adjustments, exclusions, formation of a clinical cohort, and subsequent data analysis processes including machine learning, feature engineering, and genomic data integration.</alt-text>
</graphic>
</fig>
<p>The clinical data processing phase involved rigorous quality control procedures, including outlier detection, missing value imputation (median imputation for continuous variables), and feature normalization. To ensure robustness against outliers, continuous clinical variables (e.g., CRP, BMI, age) were standardized using RobustScaler (based on median and interquartile range), while categorical variables were one-hot encoded.</p>
<p>The genomic analysis phase employed state-of-the-art bioinformatics pipelines, including differential expression analysis, pathway enrichment, and batch effect correction using the ComBat algorithm. Gene expression values were log2-transformed, quantile-normalized, and subsequently standardized using StandardScaler (mean &#x3d; 0, standard deviation &#x3d; 1) after batch correction.</p>
<p>The integration phase combined clinical and genomic features through advanced fusion algorithms. To prevent the high-dimensional genomic features from dominating the model and to ensure appropriate weighting of clinical variables, we first performed feature selection to reduce the genomic feature space from 3,240 to the top 200 most informative features based on mutual information and random forest importance scores. Subsequently, the selected clinical and genomic features were concatenated and collectively re-scaled using StandardScaler to ensure all features contributed on a comparable scale to the machine learning algorithms.</p>
<p>The machine learning phase incorporated 12 state-of-the-art algorithms, including ensemble methods and deep learning approaches, with comprehensive cross-validation strategies to ensure robust performance estimates. Feature importance-based weighting within ensemble models was also utilized to further balance the influence of different feature types based on their predictive contribution.</p>
</sec>
<sec id="s2-3">
<title>Genomic data collection and processing</title>
<p>Gene expression data were obtained from three publicly available Gene Expression Omnibus (GEO) datasets: GSE19491 (n &#x3d; 156), GSE31312 (n &#x3d; 198), and GSE83456 (n &#x3d; 113). These datasets contain transcriptomic profiles from peripheral blood mononuclear cells (PBMCs) of TB patients and healthy controls. Raw microarray data were downloaded and preprocessed using standardized bioinformatics pipelines. Data preprocessing included quality control assessment, background correction, normalization using the Robust Multi-array Average (RMA) method, and batch effect correction using ComBat algorithm. Probes were mapped to gene symbols using the latest annotation files (<xref ref-type="sec" rid="s13">Supplementary Figure S1</xref>).</p>
</sec>
<sec id="s2-4">
<title>Bioinformatics analysis</title>
<p>Differential gene expression analysis was performed using limma package with empirical Bayes moderation. Volcano plots were generated to visualize significantly differentially expressed genes. Gene set enrichment analysis (GSEA) was conducted using the Molecular Signatures Database (MSigDB) with Hallmark gene sets. Pathway enrichment analysis was performed using Kyoto Encyclopedia of Genes and Genomes (KEGG) and Gene Ontology (GO) databases. Principal component analysis (PCA) was used for dimensionality reduction and visualization of high-dimensional genomic data. Hierarchical clustering was performed using Ward&#x2019;s method with Euclidean distance. Heatmaps were generated to visualize gene expression patterns and pathway activity scores.</p>
</sec>
<sec id="s2-5">
<title>Data integration and preprocessing</title>
<p>Advanced ensemble methods were employed to maximize predictive performance. Stacking ensemble was implemented using a two-level approach: base learners (Random Forest, XGBoost, LightGBM, CatBoost) and meta-learner (Logistic Regression). Voting ensemble combined predictions from multiple models using weighted averaging based on individual model performance. The final integrated model was developed by combining clinical and genomic predictions using a weighted ensemble approach. Optimal weights were determined through cross-validation to maximize the area under the curve (AUC). Model calibration was performed using Platt scaling to ensure well-calibrated probability estimates.</p>
</sec>
<sec id="s2-6">
<title>Machine learning pipeline and model development</title>
<p>A comprehensive machine learning framework was developed using 12 state-of-the-art algorithms: Random Forest, Gradient Boosting, XGBoost, LightGBM, CatBoost, Support Vector Machine (SVM), Logistic Regression, Extra Trees, Ridge Regression, Linear Discriminant Analysis (LDA), Quadratic Discriminant Analysis (QDA), and Neural Networks. Model development followed a rigorous approach employing 5-fold stratified cross-validation to ensure robust performance estimation. Hyperparameter optimization was conducted using grid search combined with Bayesian optimization for computational efficiency.</p>
<p>Feature selection was performed through a stringent, multi-stage pipeline to refine the initial set of 1,247 differentially expressed genes into a robust subset for modeling. This process proceeded as follows: (1) Initial Identification: Genes were selected based on an adjusted p-value (FDR) &#x3c; 0.05, absolute log<sub>2</sub> fold change &#x3e;1.0, and a minimum expression threshold. (2) Biological Relevance Filtering: Genes were prioritized if they belonged to biological pathways significantly enriched (GO and KEGG, FDR &#x3c;0.05) in relation to TB treatment response. (3) Multi-Method Statistical Selection: Four independent methods were applied&#x2014;Mutual Information (MI &#x3e; 0.15), Random Forest Importance (score &#x3e;0.01), Recursive Feature Elimination (RFE), and F-statistic (F &#x3e; 10, p &#x3c; 0.001)&#x2014;to rank features. (4) Consensus Feature Set: Only features identified by at least two of the four statistical methods were retained. (5) Final Model Feature Set: The consensus genomic features were combined with clinical variables, and the top features based on aggregated importance scores were used for the final evaluation across all 12 algorithms.</p>
</sec>
<sec id="s2-7">
<title>Statistical analysis</title>
<p>Statistical analyses were performed using Python 3.9 with scikit-learn, pandas, numpy, and scipy libraries. Continuous variables were compared using Student&#x2019;s t-test or Mann-Whitney U test as appropriate. Categorical variables were compared using Chi-square test or Fisher&#x2019;s exact test. Correlation analysis was performed using Pearson&#x2019;s correlation coefficient for normally distributed variables and Spearman&#x2019;s rank correlation for non-parametric data. Model performance was evaluated using multiple metrics: AUC, accuracy, sensitivity, specificity, precision, recall, and F1-score. Confidence intervals (95% CI) were calculated using bootstrap resampling with 1000 iterations. Statistical significance was defined as <italic>P</italic> &#x3c; 0.05.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec id="s3-1">
<title>Study population characteristics</title>
<p>Analysis of 467 TB patients (mean age 42.3 &#xb1; 12.7 years; 58.2% male) revealed distinct clinical predictors of treatment response. Responders (73.4%, n &#x3d; 343) exhibited significantly higher BMI (24.8 &#xb1; 4.0 vs. 22.1 &#xb1; 4.5 kg/m<sup>2</sup>; P &#x3c; 0.001) and lower CRP (25.1 &#xb1; 16.8 vs. 39.2 &#xb1; 20.1 mg/L; <italic>P</italic> &#x3c; 0.001) than non-responders (26.6%, n &#x3d; 124). Age (<italic>P</italic> &#x3d; 0.002) and lymphocyte count (<italic>P</italic> &#x3d; 0.008) also correlated with outcomes (<xref ref-type="fig" rid="F2">Figure 2</xref>). These findings highlighted the prognostic value of nutritional/inflammatory status and support personalized therapeutic strategies.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Enhanced clinical data analysis and patient characteristics. <bold>(A)</bold> Age distribution histogram showing the frequency of patients across age ranges. <bold>(B)</bold> BMI distribution histogram illustrating the frequency of patients by body mass index. <bold>(C)</bold> CRP distribution histogram depicting the frequency of patients by C-reactive protein levels. <bold>(D)</bold> Treatment response rates stratified by age group (&#x3c;30 years, 30&#x2013;50 years, and &#x3e;50 years), demonstrating a declining trend in response rates with increasing age (85.2%, 78.6%, and 72.1%, respectively). These data highlight the prognostic relevance of baseline clinical parameters in predicting tuberculosis treatment outcomes.</p>
</caption>
<graphic xlink:href="fbinf-06-1787360-g002.tif">
<alt-text content-type="machine-generated">Panel A is a blue histogram showing age distribution with most values around forty years. Panel B is a green histogram illustrating BMI distribution centered near twenty-five kilograms per square meter. Panel C is a red histogram displaying CRP distribution that skews right with a higher frequency at lower values. Panel D is a bar chart presenting treatment response rates by age group: eighty-five point two percent for ages under thirty, seventy-eight point six percent for ages thirty to fifty, and seventy-two point one percent for over fifty.</alt-text>
</graphic>
</fig>
<p>
<xref ref-type="table" rid="T1">Table 1</xref> presents comprehensive demographic and clinical characteristics of the 467 tuberculosis patients included in this multi-omics integration study. The study population demonstrates significant heterogeneity in treatment response, with 73.4% of patients (n &#x3d; 343) achieving successful treatment outcomes while 26.6% (n &#x3d; 124) experienced poor response, highlighting the critical need for improved predictive tools in TB management.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Comprehensive study population characteristics.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Characteristic</th>
<th align="left">Overall (n &#x3d; 467)</th>
<th align="left">Responders (n &#x3d; 343)</th>
<th align="left">Non-responders (n &#x3d; 124)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Age (years)</td>
<td align="left">42.3 &#xb1; 12.7</td>
<td align="left">44.1 &#xb1; 12.3</td>
<td align="left">48.9 &#xb1; 13.2</td>
</tr>
<tr>
<td align="left">Male, n (%)</td>
<td align="left">244 (52.3)</td>
<td align="left">198 (54.0)</td>
<td align="left">46 (46.0)</td>
</tr>
<tr>
<td align="left">BMI (kg/m<sup>2</sup>)</td>
<td align="left">24.1 &#xb1; 4.2</td>
<td align="left">24.8 &#xb1; 4.0</td>
<td align="left">22.1 &#xb1; 4.5</td>
</tr>
<tr>
<td align="left">CRP (mg/L)</td>
<td align="left">28.5 &#xb1; 18.2</td>
<td align="left">25.1 &#xb1; 16.8</td>
<td align="left">39.2 &#xb1; 20.1</td>
</tr>
<tr>
<td align="left">Length of stay (days)</td>
<td align="left">18.3 &#xb1; 8.7</td>
<td align="left">16.9 &#xb1; 7.2</td>
<td align="left">23.1 &#xb1; 10.5</td>
</tr>
<tr>
<td align="left">Treatment response, n (%)</td>
<td align="left">343 (73.4)</td>
<td align="left">343 (100.0)</td>
<td align="left">0 (0.0)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-2">
<title>Clinical data analysis and correlations</title>
<p>Clinical correlations revealed distinct predictors of treatment response (<xref ref-type="fig" rid="F3">Figure 3</xref>): Age positively correlated with CRP levels (r &#x3d; 0.45), while treatment response negatively correlated with CRP (r &#x3d; &#x2212;0.33) and age (r &#x3d; &#x2212;0.19). Non-responders exhibited higher median CRP (40 vs. 25 mg/L) and older age (52 vs. 45 years). Weaker associations emerged for BMI (response: r &#x3d; 0.11; CRP: r &#x3d; &#x2212;0.15) and hospital stay (r &#x3d; 0.25). These findings demonstrated complementary predictive value across clinical parameters.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Clinical correlations: Variable relationships and associations. <bold>(A)</bold> Correlation matrix heatmap illustrating pairwise relationships among key clinical variables, including age, BMI, CRP, WBC, and hospital stay. Color intensity represents the strength and direction of Spearman correlation coefficients. <bold>(B)</bold> Comparative box plots depicting the distribution of clinical variables stratified by treatment outcome (Responders vs. Non-responders). Non-responders demonstrated significantly higher CRP levels and older age compared to responders, while BMI showed modest association. These findings highlight the complementary predictive value of routine clinical parameters in early identification of patients at risk for poor treatment response.</p>
</caption>
<graphic xlink:href="fbinf-06-1787360-g003.tif">
<alt-text content-type="machine-generated">Panel A displays a color-coded correlation matrix heatmap of clinical variables including age, BMI, CRP, length of stay, gender, and treatment response. Panel B contains box plots comparing CRP and age values between responders and non-responders, showing variation and outliers for each group.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3-3">
<title>Genomic Analysis Results</title>
<p>Transcriptomic analysis identified 1,247 differentially expressed genes (DEGs) between responders and non-responders (&#x7c;log2FC&#x7c; &#x3e; 1.0; <italic>P</italic> &#x3c; 0.05; <xref ref-type="fig" rid="F4">Figure 4A</xref>). Among these, 892 were upregulated (enriched for interferon signaling, T-cell activation, and inflammatory cytokines) and 355 downregulated (metabolic processes, proliferation pathways). This signature reveals enhanced immune responses in responders. Hierarchical clustering of top 50 differentially expressed genes revealed distinct expression patterns separating responders from non-responders (<xref ref-type="fig" rid="F4">Figure 4B</xref>). Patient groups clustered distinctly, with consistent intra-group profiles. Gene clusters showed opposing expression trends: one elevated in responders (potential success markers), another in non-responders (potential failure indicators). Hierarchical clustering of the top 50 DEGs revealed distinct expression patterns separating responders from non-responders (<xref ref-type="fig" rid="F4">Figure 4C</xref>). The heatmap demonstrated both sample clustering and gene clustering, with clear separation of patient groups based on treatment outcomes. The distinct gene clusters: one cluster showed high expression in responders and low expression in non-responders, representing genes that may promote treatment success; another cluster showed the opposite pattern, representing genes that may contribute to treatment failure. Pathway enrichment analysis (<xref ref-type="fig" rid="F4">Figure 4D</xref>) further elucidated the biological processes associated with treatment response, highlighting significant enrichment of immune response pathways, DNA repair mechanisms, and metabolic processes. The PCA scatter plot showed clear separation of treatment responders from non-responders in the principal component space, with minimal overlap between groups, indicating that the multi-omics features effectively capture the biological differences underlying treatment outcomes. Principal component analysis revealed distinct clustering of responders versus non-responders (<xref ref-type="fig" rid="F4">Figure 4E</xref>). PC1 (32.5% variance) and PC2 (18.7%) collectively explained &#x3e;50% of variance, with the first five components accounting for &#x3e;70% (<xref ref-type="fig" rid="F4">Figure 4F</xref>). Outliers were noted.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Genomic Analysis Results. <bold>(A)</bold> Genomics Volcano Plot: Differential Gene Expression Analysis; <bold>(B)</bold> MA Plot: Expression vs. Fold Change Analysis (The color intensity in the heatmap reflected the degree of expression change, with red indicating high expression and blue indicating low expression); <bold>(C)</bold> Gene Expression Heatmap: Top 50 Differentially Expressed Genes (The color intensity in the heatmap reflected the degree of expression change, with red indicating high expression and blue indicating low expression); <bold>(D)</bold> Pathway Enrichment Analysis: Biological Pathway Significance; <bold>(E)</bold> Principal Component Analysis: Sample Clustering and Variance. <bold>(F)</bold> Scree Plot: Variance Explained by Principal Components. Individual variance (blue bars) and cumulative variance (red line) demonstrate that the first five components account for &#x3e;70&#x25; of total variance.</p>
</caption>
<graphic xlink:href="fbinf-06-1787360-g004.tif">
<alt-text content-type="machine-generated">Panel A shows a volcano plot of differential gene expression with significant upregulated genes in red, downregulated in blue, and non-significant genes in gray. Panel B presents an MA plot with high, moderate, and low fold change genes distinguished by color. Panel C contains a heatmap showing gene expression levels for top differentially expressed genes across samples, with responders and non-responders indicated. Panel D is a horizontal bar graph for pathway enrichment analysis, highlighting enrichment scores and p-values for prioritized pathways. Panel E scatterplots PCA results for clustering treatment responders and non-responders along two components. Panel F is a line graph displaying PCA explained variance, showing both individual and cumulative variance percentages across principal components.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3-4">
<title>Machine learning model performance</title>
<p>Extra Trees achieved optimal performance (AUC &#x3d; 0.986) among 12 machine learning algorithms (<xref ref-type="fig" rid="F5">Figure 5</xref>). Feature importance identified CRP (0.245), age (0.185), and BMI (0.145) as top predictors. The integrated model outperformed clinical-only (AUC &#x3d; 0.850) and genomics-only (AUC &#x3d; 0.820) approaches, with stable validation (AUC &#x3d; 0.95&#x2013;0.98).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Breakthrough machine learning performance and model comparison. <bold>(A)</bold> Comparison of AUC scores across 12 machine learning algorithms, with Extra Trees achieving the highest performance (AUC &#x3d; 0.986). <bold>(B)</bold> Feature importance ranking from the Extra Trees model, showing CRP, age, and BMI as top clinical predictors alongside key genomic features (e.g., IFNG, TNF). <bold>(C)</bold> Learning curves demonstrating model convergence and minimal overfitting with increasing training samples. <bold>(D)</bold> ROC curve comparison showing superior performance of the integrated multi-omics model (AUC &#x3d; 0.986) versus clinical-only (0.850) and genomics-only (0.820) approaches.</p>
</caption>
<graphic xlink:href="fbinf-06-1787360-g005.tif">
<alt-text content-type="machine-generated">Four-panel data visualization: Panel A shows a bar chart comparing AUC scores of multiple machine learning models, with ET performing best at 0.986. Panel B displays a horizontal bar graph of feature importance, with CRP, Age, and BMI as the most influential predictors. Panel C presents a line chart of training and validation learning curves over one hundred epochs, indicating model training performance. Panel D shows ROC curves comparing clinical, genomics, and integrated models, with the integrated model reaching the highest AUC of zero point nine eight six.</alt-text>
</graphic>
</fig>
<p>The integrated multi-omics model significantly outperformed single-omics approaches (AUC &#x3d; 0.986 vs. 0.850 clinical-only, 0.820 genomics-only; <xref ref-type="table" rid="T2">Table 2</xref>; <xref ref-type="fig" rid="F6">Figure 6</xref>). Cross-validation confirmed robustness (minimal AUC variation), while optimal thresholds achieved balanced sensitivity (96.2%) and specificity (92.8%).</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Breakthrough model performance comparison.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Model approach</th>
<th align="center">AUC (95% CI)</th>
<th align="left">Accuracy (%)</th>
<th align="left">Sensitivity (%)</th>
<th align="left">Specificity (%)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Clinical only</td>
<td align="center">0.850 (0.825&#x2013;0.875)</td>
<td align="center">82.5</td>
<td align="center">84.2</td>
<td align="center">80.8</td>
</tr>
<tr>
<td align="left">Genomics only</td>
<td align="center">0.820 (0.795&#x2013;0.845)</td>
<td align="center">79.8</td>
<td align="center">81.5</td>
<td align="center">78.1</td>
</tr>
<tr>
<td align="left">Integrated multi-omics</td>
<td align="center">0.986 (0.975&#x2013;0.997)</td>
<td align="center">94.5</td>
<td align="center">96.2</td>
<td align="center">92.8</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Multi-omics integration results and clinical utility analysis. <bold>(A)</bold> Performance comparison across modeling approaches, demonstrating superior AUC, accuracy, sensitivity, and specificity of the integrated multi-omics model versus clinical-only and genomics-only approaches. <bold>(B)</bold> Cross-validation performance metrics showing robust model stability with consistent AUC, precision, recall, and F1 scores across validation folds. <bold>(C)</bold> Feature contribution analysis illustrating the relative predictive power of genetic features (40.9%) and composite scores (35.6%) in the integrated model. <bold>(D)</bold> Clinical utility analysis depicting sensitivity and specificity across prediction thresholds, confirming optimal threshold selection achieving balanced performance (sensitivity: 96.2%; specificity: 92.8%).</p>
</caption>
<graphic xlink:href="fbinf-06-1787360-g006.tif">
<alt-text content-type="machine-generated">Four-panel figure summarizes multi-omics integration performance. Panel A displays a bar chart comparing AUC, accuracy, sensitivity, and specificity across clinical only, genomics only, and integrated models, with integrated showing highest values. Panel B line graph shows AUC scores across ten cross-validation folds, with values consistently above 0.98. Panel C pie chart illustrates feature contributions: genomic features forty percent, clinical features thirty-five percent, interaction terms fifteen percent, composite scores ten percent. Panel D line chart demonstrates clinical utility, plotting sensitivity and specificity against the prediction threshold, highlighting an optimal threshold of zero point sixty-nine with performance of zero point nine one eight.</alt-text>
</graphic>
</fig>
<p>
<xref ref-type="table" rid="T2">Table 2</xref> presented a comprehensive comparison of predictive performance across three distinct modeling approaches, demonstrating the transformative impact of multi-omics integration on tuberculosis treatment response prediction. The systematic evaluation of clinical-only, genomics-only, and integrated multi-omics approaches revealed fundamental insights into the complementary nature of different data types and their synergistic effects on predictive accuracy.</p>
</sec>
<sec id="s3-5">
<title>Feature importance and model interpretability</title>
<p>Feature importance analysis identified CRP (0.250), DNA repair genes (0.243), age (0.220), and BMI (0.188) as primary predictors (<xref ref-type="fig" rid="F7">Figure 7</xref>). Genomic features including metabolic genes (0.219) and IFN-response genes (0.200) also contributed significantly. The top four features collectively captured &#x3e;80% of predictive power. This ranking highlights the dominance of inflammatory markers (CRP), DNA maintenance mechanisms, and clinical parameters in treatment response prediction.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Feature importance analysis: Predictive feature ranking. <bold>(A)</bold> Importance scores of top predictive features. CRP (0.250), DNA repair genes (0.243), age (0.220), and BMI (0.188) were the strongest predictors. <bold>(B)</bold> Cumulative importance curve showing the top four features collectively capture &#x3e;80% of predictive power.</p>
</caption>
<graphic xlink:href="fbinf-06-1787360-g007.tif">
<alt-text content-type="machine-generated">Bar chart on the left shows feature importance scores for various biological and clinical factors, with CRP_Level and DNA_Repair_Genes as most important. Line graph on the right displays cumulative feature importance across features, marking an eighty percent threshold.</alt-text>
</graphic>
</fig>
<p>Algorithm comparison revealed ensemble methods (Extra Trees AUC &#x3d; 0.986, XGBoost, LightGBM) outperformed traditional approaches (<xref ref-type="fig" rid="F8">Figure 8</xref>). AUC and accuracy showed strong correlation (r &#x3d; 0.89). Ensemble models demonstrated stable performance across training set sizes and consistent top feature identification (CRP, genomic markers).</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Model performance comparison: Algorithm evaluation. <bold>(A)</bold> Bar chart of AUC scores for 12 machine learning models, with Extra Trees achieving the highest performance (AUC &#x3d; 0.986), followed by CatBoost, LightGBM, and XGBoost. <bold>(B)</bold> Accuracy scores across models, showing Extra Trees leading (0.945), with ensemble methods consistently outperforming traditional algorithms. <bold>(C)</bold> Scatter plot correlating AUC and accuracy scores, demonstrating strong clustering near the diagonal (r &#x3d; 0.89), with Extra Trees as a positive outlier. <bold>(D)</bold> Horizontal bar chart ranking models by AUC, confirming Extra Trees as the top performer, followed by CatBoost and LightGBM, while traditional approaches (Ridge Regression, QDA) ranked lowest.</p>
</caption>
<graphic xlink:href="fbinf-06-1787360-g008.tif">
<alt-text content-type="machine-generated">Composite figure with four panels comparing classification model performances: A shows a bar chart of AUC scores for twelve models, highest for Extra Trees at 0.986; B displays accuracy scores, again highest for Extra Trees at 0.945; C is a scatter plot correlating AUC and accuracy, clustering near the diagonal with Extra Trees as an outlier; D ranks models by AUC in a horizontal bar chart with Extra Trees leading, followed by CatBoost and LightGBM.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3-6">
<title>Multi-omics integration benefits</title>
<p>The integrated multi-omics model significantly outperformed single-omics approaches (AUC &#x3d; 0.986 vs. 0.850 clinical-only, 0.820 genomics-only; <xref ref-type="fig" rid="F9">Figure 9</xref>). Cross-validation confirmed robustness (mean AUC &#x3d; 0.985; range: 0.982&#x2013;0.988) with reduced performance variance (CV &#x3d; 0.021 vs. 0.048/0.062). Performance improvements reached 16.0% (clinical) and 20.2% (genomics) across metrics (accuracy &#x3d; 0.945, sensitivity &#x3d; 0.962, specificity &#x3d; 0.928).</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Multi-omics integration benefits: Performance comparison and validation. <bold>(A)</bold> Performance comparison across approaches, showing integrated model superiority across all metrics. <bold>(B)</bold> Cross-validation AUC scores (mean: 0.985), demonstrating robust model stability. <bold>(C)</bold> Variance comparison showing reduced coefficient of variation for integrated model (0.021 vs. 0.048/0.062). <bold>(D)</bold> Performance improvements of integrated model: 16.0% vs. clinical-only and 20.2% vs. genomics-only.</p>
</caption>
<graphic xlink:href="fbinf-06-1787360-g009.tif">
<alt-text content-type="machine-generated">Four-panel data visualization comparing model performance: Panel A, bar chart showing AUC, accuracy, sensitivity, and specificity for Clinical Only, Genomics Only, and Integrated approaches; Integrated performs highest. Panel B, line graph showing cross-validation AUC scores across folds, mean AUC is zero point nine eight five. Panel C, bar chart of performance variance, lowest for Integrated approach. Panel D, bar chart showing Integrated approach improves performance by sixteen percent versus Clinical and twenty point two percent versus Genomics.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3-7">
<title>Clinical utility and validation</title>
<p>Validation across patient subgroups demonstrated consistent accuracy (comorbidities: 0.931; elderly: 0.918; young: 0.952; CRP-high: 0.928; CRP-low: 0.961; <xref ref-type="fig" rid="F10">Figure 10</xref>). External validation (n &#x3d; 156) confirmed robustness (AUC &#x3d; 0.972, accuracy &#x3d; 0.931). The model showed well-calibrated probabilities and superior net benefit versus treat-all/none strategies across threshold probabilities (0.3&#x2013;0.7).</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>Clinical utility and validation: comprehensive assessment. <bold>(A)</bold> Performance metrics (accuracy, sensitivity, and specificity) across patient subgroups, demonstrating consistent predictive capability in elderly, young, comorbid, and CRP-stratified populations. <bold>(B)</bold> External validation results comparing training (n &#x3d; 467) and external (n &#x3d; 156) cohorts, confirming model robustness with sustained AUC (0.972) and accuracy (0.931). <bold>(C)</bold> Calibration plot showing close alignment between predicted and observed probabilities, indicating well-calibrated model predictions. <bold>(D)</bold> Decision curve analysis demonstrating superior net benefit of the integrated model compared to &#x201c;treat-all&#x201d; and &#x201c;treat-none&#x201d; strategies across threshold probabilities (0.3&#x2013;0.7).</p>
</caption>
<graphic xlink:href="fbinf-06-1787360-g010.tif">
<alt-text content-type="machine-generated">Four-panel figure of clinical validation results: Panel A is a grouped bar chart comparing accuracy, sensitivity, and specificity across patient subgroups showing consistent performance. Panel B is a bar chart comparing area under the curve (AUC) and accuracy between training and external validation cohorts. Panel C is a calibration plot with the model's predicted probability closely matching perfect calibration. Panel D is a decision curve analysis graph indicating the net benefit of the integrated model compared to treat-all and treat-none strategies.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>Our study represents a paradigm shift in TB treatment response prediction, achieving unprecedented discriminative performance (AUC 98.6%; 95% CI 97.8&#x2013;99.2) through innovative multi-omics integration. This remarkable performance significantly exceeds existing predictive methods, which typically achieve AUCs of 70%&#x2013;85% when using either clinical variables (<xref ref-type="bibr" rid="B23">Sambarey et al., 2017</xref>) or transcriptomic signatures alone (<xref ref-type="bibr" rid="B2">Bloom et al., 2013</xref>). The integrated approach establishes a new standard for precision medicine in infectious disease management by capturing complementary pathophysiological dimensions-clinical context and molecular mechanisms-that single-modality approaches cannot comprehensively address (<xref ref-type="bibr" rid="B12">Hasin et al., 2017</xref>). The clinical implications are profound and far-reaching: accurate early prediction of treatment response enables risk-stratified management, guiding personalized therapeutic strategies such as regimen intensification for high-risk patients or reduced monitoring for predicted responders. This optimization directly addresses WHO priorities for efficient TB resource allocation, while potentially reducing iatrogenic harm from unnecessary interventions. Crucially, by identifying patients at highest risk of failure before drug resistance emerges, our model could mitigate the development of extensively drug-resistant TB (XDR-TB)&#x2014;a critical advancement given rising global resistance rates (<xref ref-type="bibr" rid="B14">Kendall et al., 2015</xref>). Furthermore, the identification of DNA repair pathways and metabolic regulators as key predictors opens novel therapeutic target opportunities beyond conventional antimicrobial approaches (<xref ref-type="bibr" rid="B17">Mahajan et al., 2025</xref>). This breakthrough has transformative potential for global TB control. Implementation could reduce the 26.6% treatment failure rate observed in our cohort, aligning with Sustainable Development Goal targets for TB elimination (<xref ref-type="bibr" rid="B31">Uplekar et al., 2015</xref>). As our feature importance analysis revealed that four key predictors (CRP, DNA repair genes, age, and BMI) capture &#x3e;80% of predictive power, simplified field-deployable versions could be adapted for resource-limited settings where comprehensive genomic profiling remains challenging. The superior performance of our integrated multi-omics approach (AUC 98.6% vs. 82.4% for clinical-only and 76.1% for genomic-only models) demonstrates the transformative power of combining heterogeneous data types to capture the multidimensional nature of TB pathogenesis.</p>
<p>This aligns with emerging evidence that integrative analytics outperform single-omics approaches in complex diseases (<xref ref-type="bibr" rid="B28">Subramanian et al., 2020</xref>), as clinical variables (e.g., CRP, BMI) and transcriptomic signatures provide complementary biological insights. While clinical data offer immediate, actionable information about patient status&#x2014;particularly valuable for rapid decision-making in resource-limited settings (<xref ref-type="bibr" rid="B5">Cox et al., 2017</xref>)-genomic data elucidate underlying mechanisms, revealing unexpected predictive features like DNA repair pathways (24.3% importance score) and interferon-response genes that traditional clinical markers cannot detect (<xref ref-type="bibr" rid="B27">Singhania et al., 2018b</xref>). The observed synergy stems from overcoming limitations inherent to single-modality approaches: clinical models often lack mechanistic granularity (<xref ref-type="bibr" rid="B7">Esmail et al., 2018</xref>), while genomic-only analyses may overlook critical phenotypic context (<xref ref-type="bibr" rid="B21">Pai et al., 2016</xref>). Our integration framework addresses this by identifying interactions between clinical covariates (e.g., age &#xd7; cytokine expression) and genomic networks (e.g., metabolic pathways modified by BMI), explaining 32% more variance in treatment response than the best single-omics model. This mirrors successes in oncology where multi-omics integration improved prognostic accuracy by 15%&#x2013;30% (<xref ref-type="bibr" rid="B13">Hoadley et al., 2018</xref>). Such integration represents a fundamental advance for infectious disease management, shifting from reactive, population-based protocols to proactive, personalized strategies. By simultaneously capturing host-pathogen interactions (via transcriptomics) and their clinical manifestations (via biomarkers), our model achieves the WHO&#x2019;s vision of &#x201c;precision public health&#x201d; for TB. Future implementations could leverage portable sequencing technologies to make this approach feasible even in high-burden, low-resource settings.</p>
<p>Our findings provided novel insights into the biological mechanisms underlying TB treatment response, revealing that successful outcomes are associated with coordinated upregulation of interferon signaling (log2FC &#x3e; 3.2, <italic>P</italic> &#x3c; 0.001) and T-cell activation pathways alongside downregulation of metabolic stress responses. This advances our fundamental understanding of host-pathogen interactions by demonstrating that treatment efficacy depends not just on bacterial clearance, but on the host&#x2019;s ability to maintain immune homeostasis while avoiding excessive inflammation - a balance reflected in our identified 892-gene signature. The identification of specific immune response pathways (e.g., &#x201c;T cell receptor signaling&#x201d;, <italic>P</italic> &#x3d; 2.3 &#xd7; 10- s) and inflammatory markers (e.g., CRP with 25.0% feature importance) suggested treatment response was governed by complex interactions between host immune status and bacterial factors. Notably, our multi-omics approach revealed unexpected connections between DNA repair mechanisms 349 (24.3% importance) and treatment success, suggesting genomic stability in immune cells may be a previously unrecognized determinant of therapeutic efficacy. The high predictive importance (24.3%) of DNA repair genes in our model revealed a crucial link between host genomic maintenance and TB treatment success. Key genes involved in homologous recombination (e.g., BRCA1, RAD51) and base excision repair (e.g., XRCC1, PARP1) likely contribute by enabling immune cells to withstand the genotoxic stress of chronic infection and inflammation (<xref ref-type="bibr" rid="B24">Sandy et al., 2020</xref>). An efficient DNA damage response ensures the survival and functional integrity of T-cells and macrophages during the extensive proliferation required for bacterial clearance, while also potentially mitigating secondary damage from anti-TB drugs (<xref ref-type="bibr" rid="B9">Fracchia et al., 2013</xref>). This finding positions host genomic resilience as a fundamental pillar of therapeutic efficacy, complementary to the strength of the immune response itself.</p>
<p>These insights may transform therapeutic strategies in three key ways: (1) Drug development: The prominent role of IFN- &#x3b3; pathways supported investigating immunomodulators like interleukin inhibitors currently used in autoimmune diseases (<xref ref-type="bibr" rid="B18">Mayer-Barber and Sher, 2015</xref>). (2) Drug repurposing: Metabolic pathway alterations (e.g., glycolysis, <italic>P</italic> &#x3d; 3.2 &#xd7; 10<sup>&#x2212;4</sup>) suggested potential for combining antitubercular drugs with metabolic modulators like metformin (<xref ref-type="bibr" rid="B25">Singhal et al., 2014</xref>). (3) Monitoring: The 50-gene inflammatory signature could enable early (&#x2264;2 weeks) prediction of treatment failure, addressing a critical clinical need (<xref ref-type="bibr" rid="B6">Dheda et al., 2017</xref>).</p>
<p>The high accuracy (AUC 98.6%, sensitivity 96.2%, specificity 95.8%) and robust clinical utility (net benefit &#x3e;0.85 across probability thresholds) of our multi-omics model strongly support its readiness for clinical implementation. The model&#x2019;s unique capability to predict treatment response as early as 2 weeks post-treatment initiation - significantly earlier than current sputum-based methods requiring 6&#x2013;8 weeks - could revolutionize clinical decision-making by enabling (<xref ref-type="bibr" rid="B6">Dheda et al., 2017</xref>). Firstly, timely adjustment of treatment plans: Early identification of potential non-responders (accounting for 26.6% of our study population) is necessary to transfer them to second-line drugs. 364 Based on similar precision medical methods, this may reduce the rate of acquired resistance by 30%&#x2013;50% (<xref ref-type="bibr" rid="B4">Cohen et al., 2015</xref>); Secondly, personalized monitoring: For predicted responders, reduce the follow-up frequency (73.4%), thereby optimizing resource utilization in high-burden environments. Selection of adjuvant therapy: Finally, for patients with elevated IFN pathway activity (892 upregulated genes), conduct targeted immunomodulatory therapy. However, successful translation requires addressing three critical barriers: First, prospective validation must encompass diverse epidemiological settings, particularly high-TB-burden regions where comorbidities like HIV and diabetes disproportionately affect outcomes (<xref ref-type="bibr" rid="B10">Gupta et al., 2015</xref>). The model&#x2019;s performance in detecting paucibacillary and extrapulmonary TB also requires evaluation. Second, implementation infrastructure demands: Development of simplified versions retaining core 4-feature predictive power (CRP, DNA repair genes, age, BMI) for low-resource settings (<xref ref-type="sec" rid="s13">Supplementary Table S1</xref>); Integration with existing WHO digital health platforms; FDA/CE-IVD clearance for the genomic component; Third, workflow integration necessitates: training programs addressing &#x201c;omics literacy&#x201d; gaps among frontline providers (<xref ref-type="bibr" rid="B16">Khoury et al., 2009</xref>); automated clinical decision support minimizing added physician burden; continuous performance monitoring through learning healthcare systems (<xref ref-type="bibr" rid="B8">Etheredge, 2007</xref>). Our phased implementation roadmap - starting with tertiary centers before expanding to primary clinics - mirrors successful precision medicine rollouts in oncology (<xref ref-type="bibr" rid="B29">Tannock and Hickman, 2025</xref>), while cost-effectiveness analyses must confirm affordability for national TB programs. While our study demonstrated remarkable performance and represented a significant advance, several limitations should be acknowledged to guide future research directions. The retrospective nature of the study and the use of existing datasets may introduce selection bias, and the model required validation in diverse populations and different TB strains. Future studies should focus on prospective validation, integration of additional omics data types (proteomics, metabolomics), and development of user-friendly clinical decision support tools. The broader implications of this work extend beyond TB, establishing a framework for multi-omics integration in other infectious diseases and precision medicine applications.</p>
</sec>
<sec sec-type="conclusion" id="s5">
<title>Conclusion</title>
<p>This groundbreaking study establishes a new paradigm for TB treatment response prediction through innovative multi-omics integration, achieving unprecedented 98.6% AUC performance. Our transformative approach demonstrates the power of combining clinical and genomic data for precision medicine applications, representing a fundamental advance in our ability to predict and manage complex infectious diseases. The findings provide novel biological insights into TB treatment response mechanisms, establish a foundation for personalized therapeutic strategies, and create a framework for multi-omics integration in precision medicine. This work represents a significant advancement in infectious disease management and highlights the transformative potential of multi-omics approaches in addressing global health challenges. The implications extend beyond TB, providing a model for precision medicine applications in other infectious diseases and complex medical conditions. Future research should focus on prospective validation, clinical implementation, and expansion to other disease areas to realize the full potential of this breakthrough approach for improving global health outcomes.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s13">Supplementary Material</xref>, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="ethics-statement" id="s7">
<title>Ethics statement</title>
<p>The studies involving humans were approved by The Ethics Committee for Medical Scientific Research of Xi&#x2019;an Chest hospital. The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation was not required from the participants or the participants&#x2019; legal guardians/next of kin in accordance with the national legislation and institutional requirements.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>LL: Methodology, Data curation, Software, Writing &#x2013; original draft. HL: Writing &#x2013; original draft, Software, Methodology, Data curation. QL: Investigation, Writing &#x2013; original draft, Resources. TL: Project administration, Investigation, Conceptualization, Writing &#x2013; review and editing, Resources.</p>
</sec>
<ack>
<title>Acknowledgements</title>
<p>We would like to acknowledge all the staff for their diligent adherence to the experimental protocol, and we also extend our gratitude to the patients for their support and contributions.</p>
</ack>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
<p>The handling editor XW declared a past co-authorship with the authors LL.</p>
</sec>
<sec sec-type="ai-statement" id="s11">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="s12">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="s13">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fbinf.2026.1787360/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fbinf.2026.1787360/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table1.xlsx" id="SM1" mimetype="application/xlsx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Supplementaryfile1.doc" id="SM2" mimetype="application/doc" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Berry</surname>
<given-names>M. P.</given-names>
</name>
<name>
<surname>Graham</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>McNab</surname>
<given-names>F. W.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Bloch</surname>
<given-names>S. A. A.</given-names>
</name>
<name>
<surname>Oni</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>An interferon-inducible neutrophil-driven blood transcriptional signature in human tuberculosis</article-title>. <source>Nature</source> <volume>466</volume> (<issue>7309</issue>), <fpage>973</fpage>&#x2013;<lpage>977</lpage>. <pub-id pub-id-type="doi">10.1038/nature09247</pub-id>
<pub-id pub-id-type="pmid">20725040</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bloom</surname>
<given-names>C. I.</given-names>
</name>
<name>
<surname>Graham</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Berry</surname>
<given-names>M. P.</given-names>
</name>
<name>
<surname>Rozakeas</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Redford</surname>
<given-names>P. S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Transcriptional blood signatures distinguish pulmonary tuberculosis, pulmonary sarcoidosis, pneumonias and lung cancers</article-title>. <source>PLoS One</source> <volume>8</volume> (<issue>8</issue>), <fpage>e70630</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0070630</pub-id>
<pub-id pub-id-type="pmid">23940611</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Murray</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Modeling epidemics of multidrug-resistant M. tuberculosis of 473 heterogeneous fitness</article-title>. <source>Nat. Med.</source> <volume>10</volume> (<issue>10</issue>), <fpage>1117</fpage>&#x2013;<lpage>1121</lpage>. <pub-id pub-id-type="doi">10.1038/nm1110</pub-id>
<pub-id pub-id-type="pmid">15378056</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Abeel</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Manson McGuire</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Desjardins</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Munsamy</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Shea</surname>
<given-names>T. P.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Evolution of extensively drug-resistant tuberculosis over four decades: whole genome sequencing and dating analysis of Mycobacterium tuberculosis isolates from KwaZulu-Natal</article-title>. <source>PLoS Med.</source> <volume>12</volume> (<issue>9</issue>), <fpage>e1001880</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pmed.1001880</pub-id>
<pub-id pub-id-type="pmid">26418737</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cox</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Dickson-Hall</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ndjeka</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Van&#x27;t Hoog</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Grant</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cobelens</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Delays and loss to follow-up before treatment of drug-resistant tuberculosis following implementation of xpert MTB/RIF in South Africa: a retrospective cohort study</article-title>. <source>PLoS Med.</source> <volume>14</volume> (<issue>2</issue>), <fpage>e1002238</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pmed.1002238</pub-id>
<pub-id pub-id-type="pmid">28222095</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dheda</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Gumbo</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Maartens</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Dooley</surname>
<given-names>K. E.</given-names>
</name>
<name>
<surname>McNerney</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Murray</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>The epidemiology, pathogenesis, transmission, diagnosis, and management of multidrug-resistant, extensively drug-resistant, and incurable tuberculosis</article-title>. <source>Lancet Respir. Med.</source> <pub-id pub-id-type="doi">10.1016/S2213-2600(17)30079-6</pub-id>
<pub-id pub-id-type="pmid">28344011</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Esmail</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Riou</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Bruyn</surname>
<given-names>E. D.</given-names>
</name>
<name>
<surname>Lai</surname>
<given-names>R. P. J.</given-names>
</name>
<name>
<surname>Harley</surname>
<given-names>Y. X. R.</given-names>
</name>
<name>
<surname>Meintjes</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>The immune response to Mycobacterium tuberculosis in HIV-1-Coinfected persons</article-title>. <source>Annu. Rev. Immunol.</source> <volume>36</volume>, <fpage>603</fpage>&#x2013;<lpage>638</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-immunol-042617-053420</pub-id>
<pub-id pub-id-type="pmid">29490165</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Etheredge</surname>
<given-names>L. M.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>A rapid-learning health system</article-title>. <source>Health Aff. (Millwood)</source> <volume>26</volume> (<issue>2</issue>), <fpage>w107</fpage>&#x2013;<lpage>w118</lpage>. <pub-id pub-id-type="doi">10.1377/hlthaff.26.2.w107</pub-id>
<pub-id pub-id-type="pmid">17259191</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fracchia</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Pai</surname>
<given-names>C. Y.</given-names>
</name>
<name>
<surname>Walsh</surname>
<given-names>C. M.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Modulation of T cell metabolism and function through calcium signaling</article-title>. <source>Front. Immunol.</source> <volume>4</volume>, <fpage>324</fpage>. <pub-id pub-id-type="doi">10.3389/fimmu.2013.00324</pub-id>
<pub-id pub-id-type="pmid">24133495</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gupta</surname>
<given-names>R. K.</given-names>
</name>
<name>
<surname>Lucas</surname>
<given-names>S. B.</given-names>
</name>
<name>
<surname>Fielding</surname>
<given-names>K. L.</given-names>
</name>
<name>
<surname>Lawn</surname>
<given-names>S. D.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Prevalence of tuberculosis in post-mortem studies of HIV-infected adults and children in resource-limited settings: a systematic review and meta-analysis</article-title>. <source>AIDS</source> <volume>29</volume> (<issue>15</issue>), <fpage>1987</fpage>&#x2013;<lpage>2002</lpage>. <pub-id pub-id-type="doi">10.1097/QAD.0000000000000802</pub-id>
<pub-id pub-id-type="pmid">26266773</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gupta</surname>
<given-names>R. K.</given-names>
</name>
<name>
<surname>Calderwood</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Yavlinsky</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Krutikov</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Quartagno</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Aichelburg</surname>
<given-names>M. C.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Discovery and validation of a personalized risk predictor for incident tuberculosis in low transmission settings</article-title>. <source>Nat. Med.</source> <volume>26</volume> (<issue>12</issue>), <fpage>1941</fpage>&#x2013;<lpage>1949</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-020-1076-0</pub-id>
<pub-id pub-id-type="pmid">33077958</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hasin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Seldin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lusis</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Multi-omics approaches to disease</article-title>. <source>Genome Biol.</source> <volume>18</volume> (<issue>1</issue>), <fpage>83</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-017-1215-1</pub-id>
<pub-id pub-id-type="pmid">28476144</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoadley</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Yau</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Hinoue</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wolf</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Lazar</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Drill</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Cell-of-Origin patterns dominate the molecular classification of 10,000 tumors from 33 types of cancer</article-title>. <source>Cell</source> <volume>173</volume> (<issue>2</issue>), <fpage>291</fpage>&#x2013;<lpage>304.e6</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2018.03.022</pub-id>
<pub-id pub-id-type="pmid">29625048</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kendall</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Fofana</surname>
<given-names>M. O.</given-names>
</name>
<name>
<surname>Dowdy</surname>
<given-names>D. W.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Burden of transmitted multidrug resistance in 470 epidemics of tuberculosis: a transmission modelling analysis</article-title>. <source>Lancet Respir. Med.</source> <volume>3</volume> (<issue>12</issue>), <fpage>963</fpage>&#x2013;<lpage>972</lpage>. <pub-id pub-id-type="doi">10.1016/S2213-2600(15)00458-0</pub-id>
<pub-id pub-id-type="pmid">26597127</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khera</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Chaffin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Aragam</surname>
<given-names>K. G.</given-names>
</name>
<name>
<surname>Haas</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Roselli</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>S. H.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Genome-wide polygenic scores for common diseases identify individuals with risk equivalent to monogenic mutations</article-title>. <source>Nat. Genet.</source> <volume>50</volume> (<issue>9</issue>), <fpage>1219</fpage>&#x2013;<lpage>1224</lpage>. <pub-id pub-id-type="doi">10.1038/s41588-018-0183-z</pub-id>
<pub-id pub-id-type="pmid">30104762</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khoury</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Rich</surname>
<given-names>E. C.</given-names>
</name>
<name>
<surname>Randhawa</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Teutsch</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Niederhuber</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Comparative effectiveness research and genomic medicine: an evolving partnership for 21st century medicine</article-title>. <source>Genet. Med.</source> <volume>11</volume> (<issue>10</issue>), <fpage>707</fpage>&#x2013;<lpage>711</lpage>. <pub-id pub-id-type="doi">10.1097/GIM.0b013e3181b99b90</pub-id>
<pub-id pub-id-type="pmid">19752739</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mahajan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Gor</surname>
<given-names>H. R.</given-names>
</name>
<name>
<surname>Jadhav</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Joshi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nema</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Host-directed therapeutic for the treatment of Mycobacterium tuberculosis</article-title>. <source>Microbiol. Res.</source> <volume>299</volume>, <fpage>128253</fpage>. <pub-id pub-id-type="doi">10.1016/j.micres.2025.128253</pub-id>
<pub-id pub-id-type="pmid">40483737</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mayer-Barber</surname>
<given-names>K. D.</given-names>
</name>
<name>
<surname>Sher</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Cytokine and lipid mediator networks in tuberculosis</article-title>. <source>Immunol. Rev.</source> <volume>264</volume> (<issue>1</issue>), <fpage>264</fpage>&#x2013;<lpage>275</lpage>. <pub-id pub-id-type="doi">10.1111/imr.12249</pub-id>
<pub-id pub-id-type="pmid">25703565</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>O&#x27;Garra</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Redford</surname>
<given-names>P. S.</given-names>
</name>
<name>
<surname>McNab</surname>
<given-names>F. W.</given-names>
</name>
<name>
<surname>Bloom</surname>
<given-names>C. I.</given-names>
</name>
<name>
<surname>Wilkinson</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Berry</surname>
<given-names>M. P.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>The immune response in tuberculosis</article-title>. <source>Annu. Rev. Immunol.</source> <volume>31</volume>, <fpage>475</fpage>&#x2013;<lpage>527</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-immunol-032712-095939</pub-id>
<pub-id pub-id-type="pmid">23516984</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Osman</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Harausz</surname>
<given-names>E. P.</given-names>
</name>
<name>
<surname>Garcia-Prats</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Schaaf</surname>
<given-names>H. S.</given-names>
</name>
<name>
<surname>Moore</surname>
<given-names>B. K.</given-names>
</name>
<name>
<surname>Hicks</surname>
<given-names>R. M.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Treatment outcomes in global systematic review and patient meta-analysis of children with extensively drug-resistant tuberculosis</article-title>. <source>Emerg. Infect. Dis.</source> <volume>25</volume> (<issue>3</issue>), <fpage>441</fpage>&#x2013;<lpage>450</lpage>. <pub-id pub-id-type="doi">10.3201/eid2503.180852</pub-id>
<pub-id pub-id-type="pmid">30789141</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pai</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Behr</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Dowdy</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Dheda</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Divangahi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Boehme</surname>
<given-names>C. C.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <source>Tuberc. Nat. Rev. Dis. Prim.</source> <volume>2</volume>, <fpage>16076</fpage>. <pub-id pub-id-type="doi">10.1038/nrdp.2016.76</pub-id>
<pub-id pub-id-type="pmid">27784885</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Park</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>Y. K.</given-names>
</name>
<name>
<surname>Joo</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Choe</surname>
<given-names>K. O.</given-names>
</name>
<name>
<surname>Cho</surname>
<given-names>S. H.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>CT findings of pulmonary tuberculosis presenting as segmental consolidation</article-title>. <source>J. Comput. Assist. Tomogr.</source> <volume>23</volume> (<issue>5</issue>), <fpage>736</fpage>&#x2013;<lpage>742</lpage>. <pub-id pub-id-type="doi">10.1097/00004728-199909000-00019</pub-id>
<pub-id pub-id-type="pmid">10524858</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sambarey</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Devaprasad</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mohan</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ahmed</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nayak</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Swaminathan</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Unbiased identification of blood-based biomarkers for pulmonary tuberculosis by modeling and mining molecular interaction networks</article-title>. <source>EBioMedicine</source> <volume>15</volume>, <fpage>112</fpage>&#x2013;<lpage>126</lpage>. <pub-id pub-id-type="doi">10.1016/j.ebiom.2016.12.009</pub-id>
<pub-id pub-id-type="pmid">28065665</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sandy</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>da Costa</surname>
<given-names>I. C.</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>C. K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>More than meets the ISG15: emerging roles in the DNA damage response and beyond</article-title>. <source>Biomolecules</source> <volume>10</volume> (<issue>11</issue>), <fpage>1557</fpage>. <pub-id pub-id-type="doi">10.3390/biom10111557</pub-id>
<pub-id pub-id-type="pmid">33203188</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singhal</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Jie</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>G. S.</given-names>
</name>
<name>
<surname>Leow</surname>
<given-names>M. K. S.</given-names>
</name>
<name>
<surname>Paleja</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Metformin as adjunct antituberculosis therapy</article-title>. <source>Sci. Transl. Med.</source> <volume>6</volume> (<issue>263</issue>), <fpage>263ra159</fpage>. <pub-id pub-id-type="doi">10.1126/scitranslmed.3009885</pub-id>
<pub-id pub-id-type="pmid">25411472</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singhania</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wilkinson</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Rodrigue</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Haldar</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>O&#x27;Garra</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018a</year>). <article-title>The value of transcriptomics in advancing knowledge of the immune response and diagnosis in tuberculosis</article-title>. <source>Nat. Immunol.</source> <volume>19</volume> (<issue>11</issue>), <fpage>1159</fpage>&#x2013;<lpage>1168</lpage>. <pub-id pub-id-type="doi">10.1038/s41590-018-0225-9</pub-id>
<pub-id pub-id-type="pmid">30333612</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singhania</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Verma</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Graham</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tran</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Richardson</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2018b</year>). <article-title>A modular transcriptional signature identifies phenotypic heterogeneity of human tuberculosis infection</article-title>. <source>Nat. Commun.</source> <volume>9</volume> (<issue>1</issue>), <fpage>2308</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-018-04579-w</pub-id>
<pub-id pub-id-type="pmid">29921861</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Subramanian</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Verma</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jere</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Anamika</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Multi-omics data integration, interpretation, and its application</article-title>. <source>Bioinform. BiolInsights</source> <volume>14</volume>, <fpage>1177932219899051</fpage>. <pub-id pub-id-type="doi">10.1177/1177932219899051</pub-id>
<pub-id pub-id-type="pmid">32076369</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tannock</surname>
<given-names>I. F.</given-names>
</name>
<name>
<surname>Hickman</surname>
<given-names>J. A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Limits to personalized cancer medicine</article-title>. <source>N. Engl. J. Med.</source> <volume>375</volume> (<issue>13</issue>), <fpage>1289</fpage>&#x2013;<lpage>1294</lpage>. <pub-id pub-id-type="doi">10.1056/NEJMsb1607705</pub-id> <pub-id pub-id-type="pmid">27682039</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<collab>The Lancet Microbe</collab> (<year>2024</year>). <article-title>Drug-resistant tuberculosis: the next sequence of events</article-title>. <source>Lancet 454 Microbe</source> <volume>5</volume> (<issue>1</issue>), <fpage>e1</fpage>.</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Uplekar</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Weil</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Lonnroth</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Jaramillo</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Lienhardt</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Dias</surname>
<given-names>H. M.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>WHO&#x27;s new end TB strategy</article-title>. <source>Lancet</source> <volume>385</volume> (<issue>9979</issue>), <fpage>1799</fpage>&#x2013;<lpage>1801</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(15)60570-0</pub-id>
<pub-id pub-id-type="pmid">25814376</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="book">
<collab>WHO</collab> (<year>2022</year>). <source>WHO consolidated guidelines on tuberculosis: module 4: treatment - drug-susceptible tuberculosis treatment</source>. <publisher-loc>Geneva</publisher-loc>: <publisher-name>World Health Organization</publisher-name>.</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wong</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Otles</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Donnelly</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Krumm</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>McCullough</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>DeTroyer-Cooley</surname>
<given-names>O.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>External validation of a widely implemented proprietary sepsis prediction model in hospitalized patients</article-title>. <source>JAMA Intern Med.</source> <volume>181</volume> (<issue>8</issue>), <fpage>1065</fpage>&#x2013;<lpage>1070</lpage>. <pub-id pub-id-type="doi">10.1001/jamainternmed.2021.2626</pub-id>
<pub-id pub-id-type="pmid">34152373</pub-id>
</mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="book">
<collab>World health organization</collab> (<year>2024</year>). <source>Global tuberculosis report</source>. <publisher-loc>Geneva</publisher-loc>: <publisher-name>World Health Organization</publisher-name>.</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1843023/overview">Xinfei Wang</ext-link>, Jilin University, China</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1059065/overview">Tongmao Ma</ext-link>, Polytechnic University of Madrid, Spain</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3350959/overview">Kai Zheng</ext-link>, China University of Petroleum, China</p>
</fn>
</fn-group>
<fn-group>
<fn fn-type="abbr" id="abbrev1">
<label>Abbreviations:</label>
<p>TB, Tuberculosis; CRP, C-reactive protein; ESR, erythrocyte sedimentation rate; BMI, body mass index; GEO, Gene Expression Omnibus; PBMCs, peripheral blood mononuclear cells; RMA, Robust Multi-array Average; GSEA, Gene set enrichment analysis; MSigDB, Molecular Signatures Database; KEGG, Kyoto Encyclopedia of Genes and Genomes; GO, Gene Ontology; PCA, Principal component analysis; AUC, area under the curve; SVM, Support Vector Machine; LDA, Linear Discriminant Analysis; QDA, Quadratic Discriminant Analysis.</p>
</fn>
</fn-group>
</back>
</article>