<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2025.1635280</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Oncology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Machine learning assisted breathomic approach for early-stage thoracic cancer detection</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes" corresp="yes">
<name>
<surname>Chen</surname>
<given-names>Zhenguang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2918781/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Peng</surname>
<given-names>Minhua</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1747052/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Fan</surname>
<given-names>Pengnan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Sai</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Cheng</surname>
<given-names>Xinxin</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Xu</surname>
<given-names>Bo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Ruiping</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/800725/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hu</surname>
<given-names>Xiao</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wei</surname>
<given-names>Wei</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhao</surname>
<given-names>Tingting</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2890178/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kong</surname>
<given-names>Jun</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liang</surname>
<given-names>Weiliang</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Qiu</surname>
<given-names>Xiangcheng</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Sitong</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wang</surname>
<given-names>Junqi</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Thoracic Surgery, The First Affiliated Hospital, Sun Yat-sen University</institution>, <addr-line>Guangzhou, Guangdong</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>ChromX Health Co., Ltd.</institution>, <addr-line>Guangzhou, Guangdong</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Center for Private Medical Service &amp; Healthcare, The First Affiliated Hospital, Sun Yat-sen University</institution>, <addr-line>Guangzhou, Guangdong</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>State Key Laboratory of Oncology in South China, Sun Yat-sen University Cancer Center</institution>, <addr-line>Guangzhou, Guangdong</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Department of Thoracic Surgery, Guizhou Hospital of the First Affiliated Hospital of Sun Yat-sen University</institution>, <addr-line>Guiyang, Guizhou</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>Jingjinji National Center of Technology Innovation</institution>, <addr-line>Beijing</addr-line>,&#xa0;<country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Michael N. Kammer, Universit&#xe9; Toulouse 1 Capitole, France</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1547733/overview">Yuanpin Zhou</ext-link>, Zhejiang University, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1389243/overview">Qing-Qing Yu</ext-link>, Jining First People&#x2019;s Hospital, China</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Zhenguang Chen, <email xlink:href="mailto:chzheng@mail.sysu.edu.cn">chzheng@mail.sysu.edu.cn</email>; Junqi Wang, <email xlink:href="mailto:junqi.wang@chromxhealth.com">junqi.wang@chromxhealth.com</email>
</p>
</fn>
<fn fn-type="equal" id="fn003">
<p>&#x2020;These authors have contributed equally to this work and share first authorship</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>17</day>
<month>09</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>15</volume>
<elocation-id>1635280</elocation-id>
<history>
<date date-type="received">
<day>26</day>
<month>05</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>25</day>
<month>08</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Chen, Peng, Fan, Chen, Cheng, Xu, Chen, Hu, Wei, Zhao, Kong, Liang, Qiu, Chen and Wang.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Chen, Peng, Fan, Chen, Cheng, Xu, Chen, Hu, Wei, Zhao, Kong, Liang, Qiu, Chen and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Objective</title>
<p>This study explores the feasibility of using breathomic biomarkers analyzed by machine learning as a non-invasive diagnostic tool to differentiate between benign and malignant thoracic lesions, aiming to enhance early detection of thoracic cancers and inform clinical decision-making.</p>
</sec>
<sec>
<title>Methods</title>
<p>This study enrolled 132 participants with confirmed diagnosis of lung cancer, esophageal cancer, thymoma, and benign diseases. Exhaled breath samples were analyzed by thermal desorption-gas chromatography-mass spectrometry. A logistic regression algorithm was employed to construct a classification model for benign and malignant thoracic lesions. This model was trained on a subset of 80 cases and subsequently validated in a separate set comprising 52 samples.</p>
</sec>
<sec>
<title>Results</title>
<p>A logistic regression model based on thirteen exhaled volatile organic compounds (VOCs) was developed to differentiate benign and malignant thoracic lesions. The 13-VOC model achieved an AUC of 0.85 (0.72, 0.96), accuracy of 0.79 (0.66, 0.88), sensitivity of 0.82 (0.67, 0.91), and a specificity of 0.71 (0.45, 0.88). It correctly classified 80% of lung cancer, 80% of thymoma, and 100% of esophageal cancer cases, distinguishing 71.4% of benign lesions. For lung cancer, the model achieved an AUC of 0.79 (0.57, 0.98), sensitivity of 0.80 (0.63, 0.91), and specificity of 0.63 (0.31, 0.86), with 81.8% accuracy in detecting early-stage (Stage 0 + I + II) disease. The model outperformed a 4-serum tumor marker panel in sensitivity (0.90 vs. 0.39, <italic>p</italic> &lt; 0.001). Additionally, in a cohort of 58 cancer patients, model-predicted risk significantly decreased post-surgery (<italic>p</italic> &lt; 0.01), indicating a strong correlation with disease burden reduction.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>This study demonstrates the feasibility of utilizing breathomics biomarkers for developing a non-invasive machine learning model for the early diagnosis of thoracic malignancies. These findings provide a foundation for breath analysis as a promising tool for early cancer detection, potentially facilitating improved clinical decision-making and enhancing patient outcomes.</p>
</sec>
</abstract>
<abstract abstract-type="graphical">
<title>Graphical Abstract</title>
<p>This ML-based breathomics study employs TD-GC-MS to analyze 13 exhaled VOCs, achieving superior sensitivity to 4 serum markers in distinguishing lung/thymoma/esophageal cancers from benign conditions. Post-surgical risk reduction confirmed VOC biomarkers' correlation with disease burden.</p>
<p>
<graphic xlink:href="fonc-15-1635280-g000.tif" position="anchor">
<alt-text content-type="machine-generated">Flowchart detailing a study on clinical cohorts, sample collection, machine learning, and model application. Step 1: Clinical cohorts with training, validation, and follow-up sets. Step 2: Sample and data collection involves breath exhalation, using a breath sampler, storing TD tubes at negative twenty degrees Celsius, followed by thermal desorption, GC-MS analysis, and raw data generation. Step 3: Machine learning process includes feature selection, model selection using various algorithms, and feature finalization. Step 4: Model evaluation involves a thirteen-VOC model, risk stratification, model application, and potential postoperative monitoring.</alt-text>
</graphic>
</p>
</abstract>
<kwd-group>
<kwd>breathomics</kwd>
<kwd>volatile organic compounds</kwd>
<kwd>exhaled breath</kwd>
<kwd>thoracic cancer</kwd>
<kwd>machine learning</kwd>
<kwd>early diagnosis</kwd>
<kwd>thermal desorption-gas chromatography-mass spectrometry</kwd>
<kwd>postoperative monitoring</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="72"/>
<page-count count="17"/>
<word-count count="7217"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Thoracic Oncology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Thoracic malignancies, particularly lung and esophageal cancers, represent a significant global health burden. Lung cancer is the leading cause of cancer-related deaths worldwide, with nearly 2.5 million new cases and over 1.8 million fatalities in 2022 (<xref ref-type="bibr" rid="B1">1</xref>). Despite treatment advancements, the five-year survival rate remains below 20%, primarily due to diagnoses at advanced stages (<xref ref-type="bibr" rid="B2">2</xref>). Similarly, the prognosis for esophageal cancer is also bleak, with a five-year survival rate below 20% (<xref ref-type="bibr" rid="B3">3</xref>), mirroring the situation for lung cancer, as evidenced by 511,000 new cases and 445,000 deaths attributed to the disease worldwide in 2022 (<xref ref-type="bibr" rid="B1">1</xref>). Thymomas, though rare, can lead to serious complications like myasthenia gravis. While their global incidence is between 0.13 and 0.26 per 100,000 individuals (<xref ref-type="bibr" rid="B4">4</xref>), their impact on patients&#x2019; quality of life is significant. These factors underscore the urgent need for improved diagnostic modalities for thoracic malignancies. Current diagnostic approaches, including imaging and invasive procedures like biopsy, the gold standard for thoracic tumor diagnosis, face limitations such as the imprecision to reliably differentiate benign from malignant lesions and the risk of complications associated with invasive procedures (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>). Particularly, the limited sensitivity of conventional blood-based tumor marker assays is underscored by the fact that 60-70% of cases are diagnosed at late stages, primarily due to these methods&#x2019; inability to detect early biological changes&#x200b; and distinguish between overlapping clinical features, thereby delaying timely intervention (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B8">8</xref>). Therefore, there is an urgent need to develop more precise, non-invasive, and highly sensitive tools to improve the early detection and diagnostic accuracy of thoracic tumors.</p>
<p>Exhaled breath volatile organic compounds (VOCs) are carbon-based molecules, primarily derived from endogenous metabolic processes and systemic circulation. Over 3,000 VOCs have been identified, reflecting the complex metabolic activity within the human body (<xref ref-type="bibr" rid="B9">9</xref>&#x2013;<xref ref-type="bibr" rid="B12">12</xref>). Disease processes (e.g., oxidative stress, inflammation) or pathogens (e.g., bacteria and viruses), can perturb normal metabolic pathways, including lipid peroxidation, amino acid metabolism, and carbohydrate metabolism, leading to unique alterations in the VOC profile, creating disease-specific signatures (<xref ref-type="bibr" rid="B13">13</xref>). These VOCs, diffusing from blood into breath, serve as dynamic biomarkers, enabling the detection of subtle changes associated with disease onset and progression. Breath analysis of these VOC profiles thus offers a non-invasive, real-time method for early disease detection (<xref ref-type="bibr" rid="B14">14</xref>). Previous studies have demonstrated the potential of breath VOCs as biomarkers in identification of a variety of cancers, including lung cancer (<xref ref-type="bibr" rid="B15">15</xref>&#x2013;<xref ref-type="bibr" rid="B18">18</xref>), breast cancer (<xref ref-type="bibr" rid="B19">19</xref>), and gastrointestinal malignancies (<xref ref-type="bibr" rid="B20">20</xref>&#x2013;<xref ref-type="bibr" rid="B22">22</xref>). Gordon et&#xa0;al. were pioneers in using gas chromatography-mass spectrometry (GC-MS) to identify alkenes in the breath of lung cancer patients (<xref ref-type="bibr" rid="B23">23</xref>). Kumar et&#xa0;al. reported that a panel of 12 VOCs detected using a profile-3 selected ion flow tube mass spectrometry instrument could distinguish esophageal cancer from normal controls, achieving an AUC of 0.97 in the initial analysis and 0.92 &#xb1; 0.01 in the validation set (<xref ref-type="bibr" rid="B24">24</xref>). However, research efforts have predominantly focused on distinguishing cancer patients from healthy controls, with limited emphasis on differentiating between benign diseases and cancer patients. Furthermore, to the best of our knowledge, no studies have investigated the use of VOCs as biomarkers for identifying thymomas so far. This distinction is particularly important in thoracic tumors, where benign diseases such as granulomas or hamartomas may mimic malignancies on medical imaging, leading to diagnostic uncertainty and potentially unnecessary invasive procedures.</p>
<p>This study introduces a novel machine learning model that employs a comprehensive panel of breath-derived VOC biomarkers analyzed using GC-MS to achieve simultaneous early detection of lung cancer, esophageal cancer, and thymoma&#x2014;the first breathomics-based strategy for multi-thoracic cancer diagnosis. By evaluating pre/postoperative predictions, we will assess its potential for real-time postoperative monitoring. Notably, we will also compare the sensitivity of this breath-based approach with conventional blood-based tumor markers, with the goal of providing a non-invasive solution for early detection and postoperative monitoring of thoracic cancers.</p>
</sec>
<sec id="s2">
<title>Methods</title>
<sec id="s2_1">
<title>Study design and participants</title>
<p>This cross-sectional study, conducted from November 2021 to January 2022 at the East Division of the First Affiliated Hospital of Sun Yat-sen University in Guangzhou, China, received approval from the Ethics Committee of the First Affiliated Hospital of Sun Yat-sen University (No. 2022-016). All subjects provided signed informed consent. Inclusion criteria were adult participants aged 18&#x2013;80 years with clinical suspicion of malignant thoracic tumors, supported by imaging evidence (CT/PET-CT) and a multidisciplinary team (MDT) assessment prior to histological confirmation. Eligible participants encompassed treatment-na&#xef;ve, newly diagnosed thoracic cancer patients scheduled for surgical resection for diagnostic evaluation, and patients with a history of treated or recurrent thoracic malignancy, provided comprehensive treatment records were available. Exclusion criteria encompassed individuals who were unwilling or unable to provide in-person informed consent, those with unqualified breath samples, patients with relapsed diseases and incomplete treatment histories, individuals suffering from other malignant tumors, those with severe bronchial asthma or confirmed tuberculosis, and those with severe liver damage or kidney diseases. Each participant had undergone resection surgery and was pathologically confirmed to be categorized into one of the following groups: lung cancer, thymoma, esophageal cancer, and benign disease controls. Demographic and clinical information were meticulously recorded and collected. This study was registered in the Chinese Clinical Trial Registry (Registration No.: ChiCTR2200061264).</p>
</sec>
<sec id="s2_2">
<title>Exhale breath collection</title>
<p>All samples were collected following the same standardized procedure. Prior to collection, subjects were asked to rinse their mouths with purified water and rest for 15 minutes to stabilize their respiratory patterns. All subjects were required to abstain from food and beverages except water and smoking for at least 12 hours before the collection. To minimize the influence of diurnal metabolic variations, all collections were scheduled between 7:00 AM and 9:00 AM.</p>
<p>Subjects were instructed to remain seated and breathe normally through a mask for 3 minutes. During exhalation, breath samples were concurrently drawn through a breath sampler (CXBC-Alpha, ChromX Health Co., Ltd) containing an internal sampling pump and a flow control module (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). 900 mL of breath samples were collected at a rate of 300 mL/min and directed into thermal desorption tubes. These tubes, pre-conditioned with 99.9% nitrogen gas to ensure a clean and inert environment, contained Carbopack X and Carbopack B for sample enrichment, concentrating the target compounds for later analysis. All collected samples were sealed with inert end caps immediately and stored at -20&#xb0;C to maintain their integrity and analyzed by thermal desorption-gas chromatography-mass spectrometry (TD-GC-MS) within 7 days to ensure timely and accurate results.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Exhaled breath collection device. The images depicted the schematic diagram <bold>(A)</bold> and sectional view <bold>(B)</bold> of the exhaled breath collection device.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-15-1635280-g001.tif">
<alt-text content-type="machine-generated">Medical device illustration. Panel A shows the exterior with a touch screen and handle. Panel B displays the interior, labeled with a start button, TD tube, main control board, and Luer taper along with a disposable face mask connected by a tube.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s2_3">
<title>TD-GC-MS analysis</title>
<p>Breath samples were analyzed by TD-GC-MS using a system incorporating a high-throughput autosampler, a thermal desorber (TD100-xr, MARKES), and an 7890B-5977A GC/MSD (Agilent Technologies). Separation was performed on an HP-5MS capillary column with nitrogen carrier gas. The mass spectrometer operated in electron ionization (EI) mode at 70 eV, acquiring data in full scan mode (m/z 33-450). Detailed instrument parameters are provided in Supplementary Materials.</p>
</sec>
<sec id="s2_4">
<title>GC-MS quantification and pre-analysis quality control</title>
<p>Raw GC-MS data were processed using MSDial v5.4 for peak detection, quantification, and alignment. The software generated matrices of peak area (VOC area matrix) and signal-to-noise ratio (SNR matrix). Prior to statistical analysis, a data preprocessing and filtering protocol was implemented in Python 3.9.18 to ensure data robustness. Firstly, the signal-to-noise ratio (SNR) matrix was used to assess response reliability. A VOC measurement was classified as valid if its SNR value exceeded 10; measurements below this threshold were excluded due to significant noise interference. For individual samples, the response rate was calculated as the percentage of valid VOC measurements relative to the total measurements in the sample. Samples with a response rate &#x2265;80% were retained for further analysis. Similarly, compound-specific response rates were determined for each VOC by calculating the proportion of valid measurements across all samples. To ensure analytical robustness, only VOCs with a response rate &#x2265;50% were included in the validated dataset, which was designated as the &#x201c;valid VOC area matrix&#x201d;. Secondly, the valid VOC area matrix was then log10-transformed to address heteroscedasticity, followed by normalization to account for variations in instrument response and sample loading. These steps enabled meaningful comparison of VOC abundances across samples.</p>
</sec>
<sec id="s2_5">
<title>Dataset partition</title>
<p>A dataset of 132 participants with malignant or benign thoracic lesions was used in this study, comprising 97 malignant and 35 benign samples. For biomarker discovery and model development, the dataset was randomly split into a discovery set (60%, <italic>n</italic> = 79; 59 malignant, 20 benign) and a testing set (40%, <italic>n</italic> = 53; 38 malignant, 15 benign). The discovery set (training set) was used for feature selection and model training, while the testing set served for independent model evaluation.</p>
</sec>
<sec id="s2_6">
<title>Biomarker screening</title>
<p>To identify VOCs differentially expressed between malignant and benign thoracic lesions, two complementary approaches were employed. First, the Wilcoxon rank-sum test was used to assess the distribution of individual VOCs across the two groups, generating corresponding <italic>p</italic>-values. Second, orthogonal partial least squares-discriminant analysis (OPLS-DA) was performed to evaluate the collective contribution of VOCs to group classification and to calculate variable importance in projection (VIP) scores (<xref ref-type="bibr" rid="B25">25</xref>). VOCs meeting both criteria of a <italic>p</italic> - value &lt; 0.05 and a VIP score &gt; 1 were selected as candidate biomarkers.</p>
<p>Putative biomarker identification was subsequently conducted using Agilent MassHunter Qualitative Analysis 10.0 software and the NIST 17 mass spectral library. Finally, metabolic pathway-associated VOCs reported in the literature were selected as candidate biomarkers for inclusion in diagnostic model development.</p>
</sec>
<sec id="s2_7">
<title>Machine learning algorithms selection and evaluation</title>
<p>Given the complexity inherent in omics data, it is essential to identify the most suitable model for the dataset at hand. To this end, five commonly used machine learning algorithms were systematically evaluated: logistic regression (LR) (<xref ref-type="bibr" rid="B26">26</xref>), random forest (RF) (<xref ref-type="bibr" rid="B27">27</xref>), <italic>k</italic>-nearest neighbors (KNN) (<xref ref-type="bibr" rid="B28">28</xref>), eXtreme Gradient Boosting (XGBoost) (<xref ref-type="bibr" rid="B29">29</xref>), and support vector machine (SVM) (<xref ref-type="bibr" rid="B30">30</xref>). Among these, logistic regression algorithm demonstrated the highest robustness and effectiveness, based on its superior performance across both the discovery and testing datasets. Consequently, logistic regression model was deployed for diagnostic prediction.</p>
</sec>
<sec id="s2_8">
<title>Feature selection</title>
<p>To minimize overfitting, a progressive feature selection approach was employed. Biomarkers were ranked by their area under the receiver operating characteristic curve (ROC-AUC) scores. A logistic regression model was trained using 5-fold cross-validation with stratified sampling, iteratively adding one feature at a time, starting with the highest-ranked biomarker. This process continued until no further significant improvement in model performance was observed.</p>
</sec>
<sec id="s2_9">
<title>Hyperparameter optimization</title>
<p>With the optimal feature subset identified, logistic regression hyperparameters were tuned using grid search with stratified sampling. The following hyperparameters were considered: regularization method, regularization strength, early stopping criteria, and class weights. The parameter combination that yielded the highest AUC score was selected for final model training.</p>
</sec>
<sec id="s2_10">
<title>Final model evaluation</title>
<p>The final logistic regression model, incorporating the optimized feature subset and hyperparameters, was trained on the training dataset. The model was then finalized, and a classification threshold was determined using the Youden index. Subsequently, the model&#x2019;s performance was evaluated independently on the validation dataset. Performance was assessed using five metrics: F1-score, accuracy, sensitivity, specificity, and AUC, along with their respective confidence intervals. Further analyses were performed using this finalized model.</p>
</sec>
<sec id="s2_11">
<title>Statistical analysis</title>
<p>Statistical analyses were performed using Python (version 3.9.18). Continuous variables are presented as mean &#xb1; standard deviation or median [min, max], as appropriate. Categorical variables are presented as counts and percentages. The Wilcoxon rank-sum test was used to compare continuous variables between independent groups (e.g., malignant <italic>vs</italic>. benign). The Chi-square test was used to compare categorical variables. ROC analysis was performed using scikit-learn python (v1.5.1). 95% confidence intervals (95% CI) for AUC, F1-score, sensitivity, specificity, and accuracy were calculated using a binomial distribution. All statistical tests were two-sided, with a significant level of <italic>&#x3b1;</italic> = 0.05, unless otherwise stated.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Study population</title>
<p>145 participants were enrolled in this study. Exclusion criteria were applied to exclude individuals outside the age range of 18 to 80 years, those who declined participation, and those who provided invalid breath samples, resulting in a final cohort of 132 eligible participants for analysis. Among these, 77 were diagnosed with lung cancer, 13 with thymoma, 7 with esophageal cancer, and 35 had benign diseases, as confirmed by pathological results (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). The demographic and clinical data of these participants are presented in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. Statistical comparisons between the case and control groups were conducted on basic demographic characteristics, including age, gender, body mass index (BMI), smoking and alcohol consumption status, and family cancer history. As detailed in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>, no significant difference was observed in these factors.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Schematic representations of the research framework.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-15-1635280-g002.tif">
<alt-text content-type="machine-generated">Flowchart showing a study process. Participants from the East Division of the First Affiliated Hospital of Sun Yat-sen University (n=145) provided breath samples. GCMS data was collected from 138 participants. After surgery, six were excluded due to GC-MS quality control failure. Final participants were 132, divided into a model training set (LC=47, Thy=8, EC=4, Benign=21) and a model validation set (LC=30, Thy=5, EC=3, Benign=14).</alt-text>
</graphic>
</fig>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Patient demographic and clinical characteristics.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" colspan="2" align="left">Characteristics</th>
<th valign="middle" align="center">Training set (<italic>n</italic> = 80)</th>
<th valign="middle" align="center">Validation set (<italic>n</italic> = 52)</th>
<th valign="middle" align="center">Total (<italic>n</italic> = 132)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="2" align="left">Gender</td>
<td valign="middle" align="left">Male</td>
<td valign="middle" align="center">34 (42.50%)</td>
<td valign="middle" align="center">18 (34.62%)</td>
<td valign="middle" align="center">52 (39.39%)</td>
</tr>
<tr>
<td valign="middle" align="left">Female</td>
<td valign="middle" align="center">46 (57.50%)</td>
<td valign="middle" align="center">34 (65.38%)</td>
<td valign="middle" align="center">80 (60.61%)</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="left">Age, year</td>
<td valign="middle" align="left">Median [Min, Max]</td>
<td valign="middle" align="center">58 [24, 81]</td>
<td valign="middle" align="center">53 [13, 76]</td>
<td valign="middle" align="center">57 [13, 81]</td>
</tr>
<tr>
<td valign="middle" align="left">Mean (SD)</td>
<td valign="middle" align="center">56.58 (12.22)</td>
<td valign="middle" align="center">52.48 (14.67)</td>
<td valign="middle" align="center">54.92 (13.36)</td>
</tr>
<tr>
<td valign="middle" align="left">BMI</td>
<td valign="middle" align="left">Mean (SD)</td>
<td valign="middle" align="center">23.9 (2.74)</td>
<td valign="middle" align="center">22.49 (3.62)</td>
<td valign="middle" align="center">23.28 (3.22)</td>
</tr>
<tr>
<td valign="middle" rowspan="4" align="left">Smoking</td>
<td valign="middle" align="left">Never</td>
<td valign="middle" align="center">40 (50.00%)</td>
<td valign="middle" align="center">35 (67.31%)</td>
<td valign="middle" align="center">75 (56.82%)</td>
</tr>
<tr>
<td valign="middle" align="left">Ever</td>
<td valign="middle" align="center">4 (5.00%)</td>
<td valign="middle" align="center">1 (1.92%)</td>
<td valign="middle" align="center">5 (3.79%)</td>
</tr>
<tr>
<td valign="middle" align="left">Current</td>
<td valign="middle" align="center">4 (5.00%)</td>
<td valign="middle" align="center">2 (3.85%)</td>
<td valign="middle" align="center">6 (4.55%)</td>
</tr>
<tr>
<td valign="middle" align="left">Unknown</td>
<td valign="middle" align="center">32 (40.00%)</td>
<td valign="middle" align="center">14 (26.92%)</td>
<td valign="middle" align="center">46 (34.85%)</td>
</tr>
<tr>
<td valign="middle" rowspan="4" align="left">Drinking</td>
<td valign="middle" align="left">Never</td>
<td valign="middle" align="center">44 (55.00%)</td>
<td valign="middle" align="center">38 (73.08%)</td>
<td valign="middle" align="center">82 (62.12%)</td>
</tr>
<tr>
<td valign="middle" align="left">Ever</td>
<td valign="middle" align="center">2 (2.50%)</td>
<td valign="middle" align="center">0 (0.00%)</td>
<td valign="middle" align="center">2 (1.52%)</td>
</tr>
<tr>
<td valign="middle" align="left">Current</td>
<td valign="middle" align="center">2 (2.50%)</td>
<td valign="middle" align="center">0 (0.00%)</td>
<td valign="middle" align="center">2 (1.52%)</td>
</tr>
<tr>
<td valign="middle" align="left">Unknown</td>
<td valign="middle" align="center">32 (40.00%)</td>
<td valign="middle" align="center">14 (26.92%)</td>
<td valign="middle" align="center">46 (34.85%)</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="left">Family cancer</td>
<td valign="middle" align="left">Yes</td>
<td valign="middle" align="center">2 (2.50%)</td>
<td valign="middle" align="center">6 (11.54%)</td>
<td valign="middle" align="center">8 (6.06%)</td>
</tr>
<tr>
<td valign="middle" align="left">No</td>
<td valign="middle" align="center">45 (56.25%)</td>
<td valign="middle" align="center">32 (61.54%)</td>
<td valign="middle" align="center">77 (58.33%)</td>
</tr>
<tr>
<td valign="middle" align="left">Unknown</td>
<td valign="middle" align="center">33 (41.25%)</td>
<td valign="middle" align="center">14 (26.92%)</td>
<td valign="middle" align="center">47 (35.61%)</td>
</tr>
<tr>
<td valign="middle" rowspan="5" align="left">Lesion size</td>
<td valign="middle" align="left">&lt; 10 mm</td>
<td valign="middle" align="center">16 (20.00%)</td>
<td valign="middle" align="center">9 (17.31%)</td>
<td valign="middle" align="center">25 (18.94%)</td>
</tr>
<tr>
<td valign="middle" align="left">10&#x2013;20 mm</td>
<td valign="middle" align="center">25 (31.25%)</td>
<td valign="middle" align="center">22 (42.31%)</td>
<td valign="middle" align="center">47 (35.61%)</td>
</tr>
<tr>
<td valign="middle" align="left">20&#x2013;30 mm</td>
<td valign="middle" align="center">19 (23.75%)</td>
<td valign="middle" align="center">7 (13.46%)</td>
<td valign="middle" align="center">26 (19.70%)</td>
</tr>
<tr>
<td valign="middle" align="left">&gt; 30 mm</td>
<td valign="middle" align="center">17 (21.25%)</td>
<td valign="middle" align="center">11 (21.15%)</td>
<td valign="middle" align="center">28 (21.21%)</td>
</tr>
<tr>
<td valign="middle" align="left">Unknown</td>
<td valign="middle" align="center">3 (3.75%)</td>
<td valign="middle" align="center">3 (5.77%)</td>
<td valign="middle" align="center">6 (4.55%)</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="left">Histopathology</td>
<td valign="middle" align="left">Malignant</td>
<td valign="middle" align="center">59 (73.75%)</td>
<td valign="middle" align="center">38 (73.08%)</td>
<td valign="middle" align="center">97 (73.48%)</td>
</tr>
<tr>
<td valign="middle" align="left">Benign</td>
<td valign="middle" align="center">21 (26.25%)</td>
<td valign="middle" align="center">14 (26.92%)</td>
<td valign="middle" align="center">35 (26.51%)</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="left">Malignant subgroup</td>
<td valign="middle" align="left">LC</td>
<td valign="middle" align="center">47 (58.75%)</td>
<td valign="middle" align="center">30 (57.69%)</td>
<td valign="middle" align="center">77 (79.38%)</td>
</tr>
<tr>
<td valign="middle" align="left">Thymoma</td>
<td valign="middle" align="center">8 (10.00%)</td>
<td valign="middle" align="center">5 (9.62%)</td>
<td valign="middle" align="center">13 (13.40%)</td>
</tr>
<tr>
<td valign="middle" align="left">EC</td>
<td valign="middle" align="center">4 (5.00%)</td>
<td valign="middle" align="center">3 (5.77%)</td>
<td valign="middle" align="center">7 (7.22%)</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="left">Benign subgroup</td>
<td valign="middle" align="left">Benign nodules</td>
<td valign="middle" align="center">12 (15.00%)</td>
<td valign="middle" align="center">8 (15.38%)</td>
<td valign="middle" align="center">20 (57.14%)</td>
</tr>
<tr>
<td valign="middle" align="left">Benign others</td>
<td valign="middle" align="center">9 (11.25%)</td>
<td valign="middle" align="center">6 (11.54%)</td>
<td valign="middle" align="center">15 (42.86%)</td>
</tr>
<tr>
<td valign="middle" rowspan="9" align="left">Benign histopathology</td>
<td valign="middle" align="left">Hamartoma</td>
<td valign="middle" align="center">2 (16.67%)</td>
<td valign="middle" align="center">0 (0.00%)</td>
<td valign="middle" align="center">2 (10.00%)</td>
</tr>
<tr>
<td valign="middle" align="left">Inflammation</td>
<td valign="middle" align="center">5 (41.67%)</td>
<td valign="middle" align="center">5 (62.50%)</td>
<td valign="middle" align="center">10 (50.00%)</td>
</tr>
<tr>
<td valign="middle" align="left">Tuberculosis</td>
<td valign="middle" align="center">1 (8.33%)</td>
<td valign="middle" align="center">0 (0.00%)</td>
<td valign="middle" align="center">1 (5.00%)</td>
</tr>
<tr>
<td valign="middle" align="left">Other nodule</td>
<td valign="middle" align="center">4 (33.33%)</td>
<td valign="middle" align="center">3 (37.50%)</td>
<td valign="middle" align="center">7 (35.00%)</td>
</tr>
<tr>
<td valign="middle" align="left">Mediastinal cyst</td>
<td valign="middle" align="center">2 (22.22%)</td>
<td valign="middle" align="center">3 (60.00%)</td>
<td valign="middle" align="center">5 (35.71%)</td>
</tr>
<tr>
<td valign="middle" align="left">Thymic hyperplasia</td>
<td valign="middle" align="center">1 (11.11%)</td>
<td valign="middle" align="center">0 (0.00%)</td>
<td valign="middle" align="center">1 (7.15%)</td>
</tr>
<tr>
<td valign="middle" align="left">Thymolipoma</td>
<td valign="middle" align="center">1 (11.11%)</td>
<td valign="middle" align="center">0 (0.00%)</td>
<td valign="middle" align="center">1 (7.15%)</td>
</tr>
<tr>
<td valign="middle" align="left">Esophageal hiatal hernia</td>
<td valign="middle" align="center">0 (0.00%)</td>
<td valign="middle" align="center">1 (20.00%)</td>
<td valign="middle" align="center">1 (7.14%)</td>
</tr>
<tr>
<td valign="middle" align="left">Others</td>
<td valign="middle" align="center">5 (55.56%)</td>
<td valign="middle" align="center">1 (20.00%)</td>
<td valign="middle" align="center">6 (42.86%)</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="left">LC histopathology</td>
<td valign="middle" align="left">Adenocarcinoma</td>
<td valign="middle" align="center">39 (82.98%)</td>
<td valign="middle" align="center">27 (90.00%)</td>
<td valign="middle" align="center">66 (85.71%)</td>
</tr>
<tr>
<td valign="middle" align="left">Squamous carcinoma</td>
<td valign="middle" align="center">4 (8.51%)</td>
<td valign="middle" align="center">2 (6.67%)</td>
<td valign="middle" align="center">6 (7.79%)</td>
</tr>
<tr>
<td valign="middle" align="left">Others</td>
<td valign="middle" align="center">4 (8.51%)</td>
<td valign="middle" align="center">1 (3.33%)</td>
<td valign="middle" align="center">5 (5.19%)</td>
</tr>
<tr>
<td valign="middle" align="left">EC histopathology</td>
<td valign="middle" align="left">Squamous carcinoma</td>
<td valign="middle" align="center">4 (100%)</td>
<td valign="middle" align="center">3 (100%)</td>
<td valign="middle" align="center">7 (100%)</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="left">Thymoma histopathology</td>
<td valign="middle" align="left">Type B2</td>
<td valign="middle" align="center">6 (75.00%)</td>
<td valign="middle" align="center">4 (80.00%)</td>
<td valign="middle" align="center">10 (76.92%)</td>
</tr>
<tr>
<td valign="middle" align="left">Type B3</td>
<td valign="middle" align="center">1 (12.5%)</td>
<td valign="middle" align="center">1 (20.00%)</td>
<td valign="middle" align="center">2 (15.38%)</td>
</tr>
<tr>
<td valign="middle" align="left">Type AB</td>
<td valign="middle" align="center">1 (12.5%)</td>
<td valign="middle" align="center">0 (0%)</td>
<td valign="middle" align="center">1 (7.69%)</td>
</tr>
<tr>
<td valign="middle" rowspan="6" align="left">AJCC stages</td>
<td valign="middle" align="left">Stage 0</td>
<td valign="middle" align="center">2 (2.50%)</td>
<td valign="middle" align="center">2 (3.85%)</td>
<td valign="middle" align="center">4 (3.03%)</td>
</tr>
<tr>
<td valign="middle" align="left">Stage I</td>
<td valign="middle" align="center">34 (42.5%)</td>
<td valign="middle" align="center">23 (44.23%)</td>
<td valign="middle" align="center">57 (43.18%)</td>
</tr>
<tr>
<td valign="middle" align="left">Stage II</td>
<td valign="middle" align="center">10 (12.5%)</td>
<td valign="middle" align="center">3 (5.77%)</td>
<td valign="middle" align="center">13 (9.85%)</td>
</tr>
<tr>
<td valign="middle" align="left">Stage III</td>
<td valign="middle" align="center">2 (2.50%)</td>
<td valign="middle" align="center">5 (9.62%)</td>
<td valign="middle" align="center">7 (5.30%)</td>
</tr>
<tr>
<td valign="middle" align="left">Stage IV</td>
<td valign="middle" align="center">8 (10.00%)</td>
<td valign="middle" align="center">5 (9.62%)</td>
<td valign="middle" align="center">13 (9.85%)</td>
</tr>
<tr>
<td valign="middle" align="left">Unknown</td>
<td valign="middle" align="center">24 (30.00%)</td>
<td valign="middle" align="center">14 (26.92%)</td>
<td valign="middle" align="center">38 (28.79%)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>BMI, body mass index; EC, esophageal cancer; LC, lung cancer.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_2">
<title>VOC identification and feature selection</title>
<p>Initial statistical screening using the Wilcoxon rank-sum test and OPLS-DA revealed twenty-seven VOCs that exhibited differential abundance (<italic>p</italic> &lt; 0.05) and high VIP scores (VIP &gt; 1) when comparing exhaled breath samples from malignant and benign groups. These candidate VOCs then underwent compound identification and further refinement to exclude those associated with drug metabolism, environmental contaminants, or unrelated to the disease pathology. This rigorous filtering process ultimately yielded a final set of 18 potentially disease-relevant VOCs (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>).</p>
</sec>
<sec id="s3_3">
<title>Diagnostic model selection and feature optimization</title>
<p>To identify the optimal diagnostic model for differentiating benign from malignant thoracic lesions, five machine learning algorithms including logistic regression, SVM, random forest, KNN, and XGBoost were trained using the pre-selected panel of 18 VOCs. Comparison of the models revealed that logistic regression demonstrated robust performance in both the training and validation sets, achieving AUCs of 0.85 (95% CI: 0.82, 0.89) and 0.83 (0.80, 0.89), respectively (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>). The DeLong test indicated that logistic regression significantly outperformed the KNN, XGBoost, and SVM models in both datasets (p &lt; 0.05). Furthermore, when compared to the random forest model, logistic regression demonstrated superior performance in the validation set (p &lt; 0.01). Consequently, the logistic regression model was selected for further analysis and performance evaluation.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>VOC identification and feature selection. <bold>(A)</bold> ROC curves display the classification performance of the VOC-models using five machine learning algorithms including LR, RF, KNN, XGBoost, and SVM. <bold>(B)</bold> the graph shows AUC values (y-axis) against the number of features (x-axis) in the VOC-model training set. <bold>(C)</bold> box plots comparing the scaled peak area of 13 VOCs in benign and malignant patients. y-axis: scaled VOC peak area by log-transformation and z-score normalization. Significance levels are denoted as follows: * p &lt; 0.05, ** p &lt; 0.01 (Rank-sum test). <bold>(D)</bold> representative chromatograph of 13 selected VOCs in malignant vs. benign patients. Scaled Total Ion Chromatogram TIC (Real TIC/1M).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-15-1635280-g003.tif">
<alt-text content-type="machine-generated">Panel A shows a ROC curve for different machine learning models, including LR, RF, KNN, XGBoost, and SVM, with varying AUC values. Panel B depicts a line graph of ROC-AUC versus the number of top VOCs, showing an upward trend. Panel C presents a series of box plots comparing log-transformed and Z-score peak area for benign and malignant cases across various VOCs. Panel D displays a chromatogram of scaled TIC over retention time for benign and malignant samples, highlighting specific chemical peaks.</alt-text>
</graphic>
</fig>
<p>Final feature selection was conducted using the logistic regression algorithm to optimize model performance. Analysis of the AUC as a function of the number of top features revealed diminishing returns beyond 13 features. As incorporating additional features did not substantially improve the AUC, the top 13 features were selected for model development (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>). These identified compounds represent a diverse range of hydrocarbons, including methyl-cyclohexane, camphene, and d-limonene, as well as oxygenated species such as butanal, 1-butanol, propanoic acid, and <italic>p</italic>-cresol. <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref> provides a comprehensive list of these compounds and their corresponding discriminant values. Analysis of the scaled VOC peak area (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3C</bold>
</xref>) demonstrated that all 13 VOCs were present at elevated levels in the malignant group (<italic>p</italic> &lt; 0.05). A representative chromatogram of the 13 VOCs in malignant and benign samples was shown in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3D</bold>
</xref>.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>13 VOCs identified for model development.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">VOC ID</th>
<th valign="middle" align="left">Average retention time (min)</th>
<th valign="middle" align="left">VOC name</th>
<th valign="middle" align="left">
<italic>P</italic> value</th>
<th valign="middle" align="left">VIP</th>
<th valign="middle" align="left">AUC</th>
<th valign="middle" align="left">Literature reported associated with cancers</th>
<th valign="middle" align="left">Possible biological origin(s)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">70</td>
<td valign="middle" align="left">2.738</td>
<td valign="middle" align="left">Butanal</td>
<td valign="middle" align="left">0.039</td>
<td valign="middle" align="left">2.132</td>
<td valign="middle" align="left">0.634</td>
<td valign="middle" align="left">EC (<xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B47">47</xref>, <xref ref-type="bibr" rid="B49">49</xref>)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">114</td>
<td valign="middle" align="left">3.498</td>
<td valign="middle" align="left">1-Butanol</td>
<td valign="middle" align="left">0.033</td>
<td valign="middle" align="left">2.153</td>
<td valign="middle" align="left">0.632</td>
<td valign="middle" align="left">LC (<xref ref-type="bibr" rid="B31">31</xref>)</td>
<td valign="middle" align="left">Alcohol metabolism, microbial fermentation</td>
</tr>
<tr>
<td valign="middle" align="left">157</td>
<td valign="middle" align="left">4.115</td>
<td valign="middle" align="left">Propanoic acid</td>
<td valign="middle" align="left">0.007</td>
<td valign="middle" align="left">2.792</td>
<td valign="middle" align="left">0.651</td>
<td valign="middle" align="left">LC (<xref ref-type="bibr" rid="B32">32</xref>)</td>
<td valign="middle" align="left">Lipid peroxidation, aldehyde metabolism</td>
</tr>
<tr>
<td valign="middle" align="left">182</td>
<td valign="middle" align="left">4.551</td>
<td valign="middle" align="left">Methyl-cyclohexane</td>
<td valign="middle" align="left">0.043</td>
<td valign="middle" align="left">1.962</td>
<td valign="middle" align="left">0.614</td>
<td valign="middle" align="left">LC (<xref ref-type="bibr" rid="B33">33</xref>, <xref ref-type="bibr" rid="B34">34</xref>), CRC (<xref ref-type="bibr" rid="B41">41</xref>)</td>
<td valign="middle" align="left">Hydrocarbon metabolism, environmental exposure</td>
</tr>
<tr>
<td valign="middle" align="left">206</td>
<td valign="middle" align="left">5.115</td>
<td valign="middle" align="left">Sec-Butyl acetate</td>
<td valign="middle" align="left">0.036</td>
<td valign="middle" align="left">1.774</td>
<td valign="middle" align="left">0.602</td>
<td valign="middle" align="left">LC (<xref ref-type="bibr" rid="B33">33</xref>)</td>
<td valign="middle" align="left">Esterification of alcohol and acetic acid</td>
</tr>
<tr>
<td valign="middle" align="left">226</td>
<td valign="middle" align="left">5.57</td>
<td valign="middle" align="left">Isobutyl acetate</td>
<td valign="middle" align="left">0.018</td>
<td valign="middle" align="left">2.804</td>
<td valign="middle" align="left">0.622</td>
<td valign="middle" align="left">Unknown</td>
<td valign="middle" align="left">potential lipid peroxidation or microbial origin</td>
</tr>
<tr>
<td valign="middle" align="left">242</td>
<td valign="middle" align="left">5.779</td>
<td valign="middle" align="left">Trans-1,2-Cyclopentanediol</td>
<td valign="middle" align="left">0.034</td>
<td valign="middle" align="left">2.04</td>
<td valign="middle" align="left">0.612</td>
<td valign="middle" align="left">Unknown</td>
<td valign="middle" align="left">possibly microbial or environmental</td>
</tr>
<tr>
<td valign="middle" align="left">309</td>
<td valign="middle" align="left">6.626</td>
<td valign="middle" align="left">Trans-2-Decenal</td>
<td valign="middle" align="left">0.036</td>
<td valign="middle" align="left">2.162</td>
<td valign="middle" align="left">0.611</td>
<td valign="middle" align="left">LC (<xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B40">40</xref>)</td>
<td valign="middle" align="left">Lipid peroxidation, oxidative stress</td>
</tr>
<tr>
<td valign="middle" align="left">355</td>
<td valign="middle" align="left">7.585</td>
<td valign="middle" align="left">Cis-2-Hexen-1-ol, (Z)-</td>
<td valign="middle" align="left">0.049</td>
<td valign="middle" align="left">2.925</td>
<td valign="middle" align="left">0.61</td>
<td valign="middle" align="left">Unknown</td>
<td valign="middle" align="left">Lipid peroxidation, plant-derived compounds</td>
</tr>
<tr>
<td valign="middle" align="left">467</td>
<td valign="middle" align="left">9</td>
<td valign="middle" align="left">Camphene</td>
<td valign="middle" align="left">0.025</td>
<td valign="middle" align="left">2.259</td>
<td valign="middle" align="left">0.611</td>
<td valign="middle" align="left">LC (<xref ref-type="bibr" rid="B35">35</xref>)</td>
<td valign="middle" align="left">Terpenoid metabolism</td>
</tr>
<tr>
<td valign="middle" align="left">525</td>
<td valign="middle" align="left">9.882</td>
<td valign="middle" align="left">6-methyl-5-Hepten-2-one</td>
<td valign="middle" align="left">0.049</td>
<td valign="middle" align="left">1.9</td>
<td valign="middle" align="left">0.584</td>
<td valign="middle" align="left">GC (<xref ref-type="bibr" rid="B43">43</xref>&#x2013;<xref ref-type="bibr" rid="B45">45</xref>), CRC (<xref ref-type="bibr" rid="B42">42</xref>), LC (<xref ref-type="bibr" rid="B37">37</xref>)</td>
<td valign="middle" align="left">Fatty acid oxidation, isoprenoid metabolism</td>
</tr>
<tr>
<td valign="middle" align="left">581</td>
<td valign="middle" align="left">10.581</td>
<td valign="middle" align="left">D-Limonene</td>
<td valign="middle" align="left">0.039</td>
<td valign="middle" align="left">1.473</td>
<td valign="middle" align="left">0.612</td>
<td valign="middle" align="left">LC (<xref ref-type="bibr" rid="B35">35</xref>, <xref ref-type="bibr" rid="B36">36</xref>)</td>
<td valign="middle" align="left">Terpene metabolism, dietary intake</td>
</tr>
<tr>
<td valign="middle" align="left">663</td>
<td valign="middle" align="left">11.661</td>
<td valign="middle" align="left">p-Cresol</td>
<td valign="middle" align="left">0.029</td>
<td valign="middle" align="left">1.658</td>
<td valign="middle" align="left">0.642</td>
<td valign="middle" align="left">LC (<xref ref-type="bibr" rid="B38">38</xref>), EC/GC (<xref ref-type="bibr" rid="B50">50</xref>, <xref ref-type="bibr" rid="B69">69</xref>&#x2013;<xref ref-type="bibr" rid="B72">72</xref>)</td>
<td valign="middle" align="left">Microbial metabolism (gut/oral), hepatic metabolism</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>AUC, area under curve; CRC, colorectal cancer; EC, esophageal cancer; GC, gastric cancer; LC, lung cancer; VOCs, volatile organic compounds; VIP, variable importance in the projection.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_4">
<title>Model performance in distinguishing benign from malignant thoracic lesions</title>
<p>In the training set (<italic>n</italic> = 80), the 13-VOC model demonstrated excellent performance with an AUC of 0.86 (0.83, 0.90), an accuracy of 0.83 (0.73, 0.89), a sensitivity of 0.86 (0.76, 0.93), and a specificity of 0.71 (0.50, 0.86). In the validation set (<italic>n</italic> = 52), the 13-VOC model achieved an AUC of 0.85 (0.81, 0.90), an accuracy of 0.79 (0.66, 0.88), a sensitivity of 0.82 (0.67, 0.91), and a specificity of 0.71 (0.45, 0.88), confirming its generalizability and clinical applicability (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>).</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Model performance in distinguishing benign from malignant thoracic lesions. <bold>(A&#x2013;D, G)</bold>, ROC curves for the 13-VOCs model in distinguishing malignant <bold>(A)</bold> <italic>vs</italic>. benign, lung cancer <bold>(B)</bold> <italic>vs</italic>. benign all, thymoma <bold>(C)</bold> <italic>vs</italic>. benign all, esophageal cancer <bold>(D)</bold> <italic>vs</italic>. benign all, and lung cancer <bold>(G)</bold> <italic>vs</italic>. benign nodules. <bold>(E, F)</bold>, Scatter plot depicting the relationship between VOC model prediction scores and the first principal component (PC1) in the training <bold>(E)</bold> and validation <bold>(F)</bold> sets, respectively. Each point represents an individual sample. The vertical red dashed line indicates the VOC model cutoff score of 0.64 used to discriminate between malignant and benign groups. <bold>(H, I)</bold>, VOC model prediction scores for individual samples (SampleID) across lung cancer and benign nodule groups in the training <bold>(H)</bold> and validation <bold>(I)</bold> sets, respectively. Samples are color-coded by category. The red dashed horizontal line represents the VOC model cutoff score of 0.64 used to distinguish between groups. Thymoma (n=13) and esophageal cancer (n=7) analyses are exploratory (limited sample size) and serve as hypothesis-generating observations.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-15-1635280-g004.tif">
<alt-text content-type="machine-generated">Graphs A, B, C, D, and G show receiver operating characteristic (ROC) curves with sensitivity versus 1-specificity for different cancer comparisons. Graphs E and F are scatter plots of volatile organic compound (VOC) model prediction scores versus principal component scores, highlighting cancer stages. Graphs H and I depict VOC model prediction scores against sample ID, with cancer stages indicated. Each graph includes additional details on areas under the curve and confidence intervals.</alt-text>
</graphic>
</fig>
<p>To further evaluate the performance of the detection model for individual cancer types, a subgroup analysis was conducted across various malignant thoracic lesions. Thymoma (n=13) and esophageal cancer (n=7) analyses are exploratory due to limited sample size and serve as hypothesis-generating observations. In the training set, the AUCs for lung cancer, thymoma, and esophageal cancer were 0.88 (0.85, 0.90), 0.81 (0.75, 0.88), and 0.80 (0.70, 0.96), respectively. In the validation set, corresponding AUCs were 0.84 (0.80, 0.90) for lung cancer, 0.86 (0.79, 1.00) for thymoma, and 0.91 (0.83, 0.95) for esophageal cancer (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4B&#x2013;D</bold>
</xref>). To further visualize the model&#x2019;s performance, prediction values for each participant were plotted against their actual disease status (lung cancer/thymoma/esophageal cancer <italic>vs</italic>. benign). Using a classification threshold of 0.64, the model achieved a high accuracy in the training set, correctly identifying 87.2% (75-94%) of lung cancer, 87.5% (53-98%) of thymoma, and 75% (30-95%) of esophageal cancer cases (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4E</bold>
</xref>). In the validation set, the model maintained high accuracy, correctly classifying 80% (63-91%) of lung cancer, 80% (38-96%) of thymoma, and 100% (44-100%) of esophageal cancer cases (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4F</bold>
</xref>). Additionally, the model demonstrated good specificity for benign lesions, correctly identifying 71.4% (50-86%, 45-88%) of such cases in both the training and validation sets (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4E&#x2013;F</bold>
</xref>). These findings emphasize the model&#x2019;s robust performance and generalized applicability in detecting various malignant thoracic lesions. Importantly, its ability to differentiate benign lesions underscores its potential to minimize unnecessary interventions and overtreatment, supporting its use in clinical practice.</p>
</sec>
<sec id="s3_5">
<title>Model performance in differentiating pulmonary lesions and across different lung cancer AJCC stages</title>
<p>Building upon previous findings, we further investigated the model&#x2019;s ability to differentiate malignant and benign pulmonary lesions. In the training set (<italic>n</italic> = 59), the 13-VOC model achieved an AUC of 0.82 (0.68, 0.95), sensitivity of 0.89 (0.77, 0.95), and specificity of 0.58 (0.32, 0.81). In the validation set (<italic>n</italic> = 38), the model exhibited an AUC of 0.79 (0.57, 0.98), sensitivity of 0.80 (0.63, 0.91), and specificity of 0.63 (0.31, 0.86) (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4G</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>).</p>
<p>Early detection of lung cancer is critical in clinical practice, allowing for timely interventions and curative resections that substantially increase patient survival rates. To assess our model&#x2019;s efficacy in diagnosing early lung cancer, we used the model to differentiate between various lung cancer stages and benign nodules. The predictive performance of the model was graphically demonstrated by plotting individual participant predictions against their corresponding ground truth classifications (lung cancer stages or benign nodule). With a predetermined classification cut-off at 0.64, the 13-VOC model demonstrated strong performance in identifying early-stage lung cancer, achieving high accuracy for stage 0 + I + II lung cancer (85.7% [70.6-93.7%]) and stage III + IV lung cancer (88.9% [56.5-98%]) in the training set, though the accuracy for benign nodules was comparatively lower at 58.3% (32-80.7%) (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4H</bold>
</xref>). In the validation set, the model maintained robust performance for stage 0 + I + II lung cancer (81.8% [61.5-92.7%]) and improved accuracy for benign nodules (66.7% [35.4-87.9%]), though there was a slight decrease in accuracy for stage III+IV lung cancer (71.4% [35.9-91.8%]) (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4I</bold>
</xref>). These findings highlight the model&#x2019;s potential for early detection and timely treatment of lung cancer, as well as its capacity to reduce unnecessary interventions and overtreatment&#x2014;an essential consideration in clinical decision-making. However, further optimization is necessary to enhance its ability to accurately differentiate benign nodules and address variability in diagnosing advanced-stage lung cancer.</p>
</sec>
<sec id="s3_6">
<title>Comparison of the diagnostic performance of the VOC model with traditional methods using serum tumor biomarkers</title>
<p>To determine whether the model represents an advancement in tumor diagnosis, we compared its predictive accuracy against that of four established clinical tumor biomarkers: CA125, ProGRP, CEA, and CFRA21-1. Among the 36 lung cancers patients, the discriminative sensitivities of CA125, ProGRP, CEA, and CFRA21&#x2013;1 were 0.061, 0.121, 0.152 and 0.242 respectively, while the 13-VOCs model showed a paired discriminative sensitivity of 0.895 (<italic>p</italic> &lt; 0.001) (<xref ref-type="fig" rid="f5">
<bold>Figures&#xa0;5A&#x2013;D, F</bold>
</xref>). Given the common clinical practice of combining these four biomarkers to enhance specificity, we hypothesized that classifying individuals as positive for lung cancer if any of the serum tumor biomarkers fell outside the normal range (i.e., CA125: 0&#x2013;35 KU/L, ProGRP: 0&#x2013;46 ng/L, CEA: 0-5&#x3bc;g/L, CFRA21-1: 0&#x2013;3 ng/L) could yield improved sensitivity. Of particular note, our 13-VOCs model significantly outperformed the 4-serum tumor marker panel, achieving a sensitivity of 0.895 compared to 0.394 (<italic>p</italic> &lt; 0.001) (<xref ref-type="fig" rid="f5">
<bold>Figures&#xa0;5E, F</bold>
</xref>). Importantly, this superior performance was not attributable to an elevated false positive rate (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>). These findings suggested that the 13-VOCs model represents a more robust diagnostic tool, potentially offering particular advantages for early detection, an area where traditional serum biomarkers have limited utility.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Comparison of the diagnostic performance of the 13-VOCs model with clinical serum tumor biomarkers among lung cancer patients. <bold>(A&#x2013;E)</bold>, diagnostic prediction of the lung cancer patients using the 13-VOCs model and clinical markers CA125, ProGRP, CEA, CFRA21-1, and the 4-serum tumor marker panel respectively. The blue vertical dashed line represents the clinical serum tumor biomarkers at various cutoffs, while the red horizontal dashed line indicates the VOC model cutoff score at 0.64. Each point corresponds to an individual lung cancer sample (n=36). <bold>(F)</bold>, comparison of the four individual serum tumor marker, 4-serum tumor marker panel and 13-VOCs models&#x2019; detection sensitivity in predicting lung cancer patients. Sensitivity differences between the 13-VOC model, each individual serum tumor marker, and the 4-serum tumor marker panel were evaluated using McNemar&#x2019;s test. Significance is denoted as follows: ***, p &lt; 0.001.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-15-1635280-g005.tif">
<alt-text content-type="machine-generated">Graphs A to E compare VOC model prediction scores against clinical cutoffs for CA125, ProGRP, CEA, CFRA21-1, and a 4-serum tumor marker panel. Dashed lines represent cutoffs. Graph F displays sensitivity comparisons for CA125, ProGRP, CEA, CFRA21-1, the 4-serum marker panel, and the VOC model, showing the highest sensitivity for the VOC model at 0.895.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3_7">
<title>Model performance for postoperative monitoring and follow-up</title>
<p>To assess whether the model accurately reflects dynamic changes in disease status and further validate that the features it captures are closely associated with disease activity or burden, we analyzed and compared the model&#x2019;s score changes between preoperative assessments and postoperative timepoints, 7 days to 1 month after surgery. Among the cancer patients (<italic>n</italic> = 54), postoperative predicted probabilities were significantly lower than preoperative probabilities (<italic>p</italic> &lt; 0.01), indicating a measurable decrease in predicted disease burden following surgical intervention (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6A</bold>
</xref>). Subgroup analysis confirmed this trend in both lung cancer (<italic>p</italic> &lt; 0.05) (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6C</bold>
</xref>) and thymoma (<italic>p</italic> &lt; 0.05) (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6D</bold>
</xref>), with postoperative scores remaining consistently lower across these malignancies. The postoperative reduction in esophageal cancer was not statistically significant (<italic>p</italic> &gt; 0.05) (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6E</bold>
</xref>), possibly due to the limited sample size. Notably, there was no significant difference in predicted probabilities between the postoperative and preoperative groups in cases of benign disease (<italic>p</italic> &gt; 0.05) (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6B</bold>
</xref>). Collectively, these findings demonstrate that the model effectively reflects the reduction in disease burden following lung cancer surgery, highlighting its potential utility for assessing the completeness of resection and detecting early signs of postoperative recurrence.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Model performance for postoperative monitoring and follow-up. <bold>(A&#x2013;E)</bold>, Comparison of VOC model prediction scores before (PreOp) and after (PostOp) surgery in the overall malignant group <bold>(A)</bold>, benign group <bold>(B)</bold>, lung cancer group <bold>(C)</bold>, thymoma group <bold>(D)</bold>, and esophageal cancer group <bold>(E)</bold>, respectively. Each line represents an individual patient&#x2019;s change in score, color-coded by the magnitude of change. Boxplots show the median and interquartile range. Comparisons in VOC prediction by scores postoperatively were performed using a paired t-test. Significance is denoted as follows: *p &lt; 0.05, **p &lt; 0.01, ns = not significant (p &#x2265; 0.05).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-15-1635280-g006.tif">
<alt-text content-type="machine-generated">Box plots labeled A to E show VOC model prediction scores for different conditions, comparing preoperative and postoperative scores.   A: &#x201c;All malignant&#x201d; shows a significant decrease (p&lt;0.01).   B: &#x201c;All benign&#x201d; shows no significant change.   C: &#x201c;Lung cancer&#x201d; shows significant decrease (p&lt;0.05).   D: &#x201c;Thymoma&#x201d; shows significant decrease (p&lt;0.05).   E: &#x201c;Esophageal cancer&#x201d; shows no significant change.   Lines indicate individual changes, color-coded for magnitude of change.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>This study aimed to develop and validate a novel machine learning model for the early diagnosis of thoracic malignancies using exhaled VOCs as biomarkers. To our knowledge, our findings demonstrate for the first time the feasibility of employing a single panel of VOC profiles to differentiate between benign and malignant thoracic lesions, particularly lung, esophageal, and thymic tumors.</p>
<p>To determine the optimal classifier for metabolomics data analysis, we evaluated five machine learning algorithms: logistic regression, random forest, k-nearest neighbor, XGBoost, and support vector machine, on training and validation datasets. Logistic regression demonstrated robust performance on both sets, making it the ideal choice for the baseline model. While algorithms like Random Forest and XGBoost showed some promise, they were not pursued due to their increased complexity and computational demands, without significant improvement in testing set performance. Given its simplicity, interpretability, efficiency, and strong generalization, logistic regression emerged as the optimal model for metabolomics data analysis. The 13-VOC model constructed by logistic regression algorithm achieved high accuracy in classifying thoracic tumors, with an AUC of 0.85, sensitivity of 82%, and specificity of 71%, representing a clinically significant advancement over existing clinical markers, which only achieved a sensitivity of 39.4%. Notably, the model exhibited robust performance in distinguishing early-stage lung cancer, suggesting its potential as a non-invasive screening tool.</p>
<p>Thirteen VOCs were identified as potential biomarkers for distinguishing malignant from benign thoracic lesions, many of which have established or emerging links to various cancer metabolism and pathogenesis. Several VOCs, including 1-butanol (<xref ref-type="bibr" rid="B31">31</xref>), propanoic acid (<xref ref-type="bibr" rid="B32">32</xref>), methyl-Cyclohexane (<xref ref-type="bibr" rid="B33">33</xref>, <xref ref-type="bibr" rid="B34">34</xref>), sec-Butyl acetate (<xref ref-type="bibr" rid="B33">33</xref>), camphene (<xref ref-type="bibr" rid="B35">35</xref>), D-Limonene (<xref ref-type="bibr" rid="B35">35</xref>, <xref ref-type="bibr" rid="B36">36</xref>), 6-methyl-5-Hepten-2-one (<xref ref-type="bibr" rid="B37">37</xref>), and <italic>p</italic>-cresol (<xref ref-type="bibr" rid="B38">38</xref>), have been previously reported as elevated in lung cancer and other malignancies.</p>
<p>Emerging evidence suggests that these VOCs may reflect key metabolic alterations characteristic of cancer pathogenesis. Trans-2-Decenal (<xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B40">40</xref>), an alkenal mutagen found in cooking oil fumes, has been shown to promote oxidative DNA damage through reactive oxygen species formation, a well-established mechanism implicated in lung carcinogenesis, suggesting increased risk for individuals with frequent exposure (<xref ref-type="bibr" rid="B39">39</xref>). Methyl-cyclohexane, which has also been implicated in distinguishing colorectal cancer from healthy controls, may indicate broader metabolic reprogramming in malignancy (<xref ref-type="bibr" rid="B41">41</xref>). 6-methyl-5-Hepten-2-one, potentially linked to increased fatty acid oxidation (<xref ref-type="bibr" rid="B42">42</xref>), a hallmark of cancer cell metabolism, was reported to be elevated in various gastrointestinal cancers, including colorectal (<xref ref-type="bibr" rid="B42">42</xref>) and gastric cancer (<xref ref-type="bibr" rid="B43">43</xref>&#x2013;<xref ref-type="bibr" rid="B45">45</xref>).</p>
<p>Butanal, elevated in esophagogastric cancer (<xref ref-type="bibr" rid="B46">46</xref>), may accumulate due to genetic dysregulation of its metabolic pathways or as a byproduct of lipid peroxidation&#x2014;a process often amplified by chronic inflammation in the tumor microenvironment. This aligns with the recognized role of oxidative stress in cancer progression (<xref ref-type="bibr" rid="B47">47</xref>, <xref ref-type="bibr" rid="B48">48</xref>). Furthermore, alterations in the gut microbiome, frequently observed in esophageal cancer, can modulate butanal production and metabolism (<xref ref-type="bibr" rid="B49">49</xref>), highlighting the interplay between host metabolism and microbial communities in cancer.</p>
<p>
<italic>p</italic>-Cresol, with its complex metabolism influenced by gut and oral microbiota, hepatic processes, and disease state, has been identified as a potential breath biomarker in various cancers, including esophageal, gastric, thyroid, breast, oral, and lung cancers, and even in some non-malignant conditions (<xref ref-type="bibr" rid="B50">50</xref>, <xref ref-type="bibr" rid="B51">51</xref>). This broad association suggests <italic>p</italic>-cresol and other VOCs may serve as general indicators of metabolic dysregulation or malignancy.</p>
<p>In contrast, isobutyl acetate, trans-1,2-Cyclopentanediol, and cis-2-Hexen-1-ol currently lack well-established links to cancer pathogenesis. Isobutyl acetate has been primarily reported as a marker for microbial (specifically Candida albicans) activity, particularly in respiratory infections (<xref ref-type="bibr" rid="B52">52</xref>). It may also indirectly contribute to metabolic disorders like obesity and diabetes through oxidative stress and neuroinflammation (<xref ref-type="bibr" rid="B53">53</xref>), and potentially to cardiovascular disease via ROS-mediated metabolic dysregulation (<xref ref-type="bibr" rid="B54">54</xref>). Further studies should include metabolomic and pathway enrichment analyses, such as KEGG, to elucidate their metabolic origins and explore potential sources like lipid peroxidation or microbial dysbiosis.</p>
<p>The observation that several VOCs are associated with multiple cancer types suggests they may serve as general indicators of malignancy or reflect shared metabolic pathways. Combining these VOCs into a diagnostic model is justified by their diverse origins and links to various cancer-related pathways, including genetic dysregulation, oxidative stress, lipid peroxidation, and microbiome alterations, enabling the capture of a more comprehensive metabolic fingerprint of thoracic malignancies, potentially improving diagnostic accuracy. Nevertheless, further mechanistic studies are needed to elucidate how these VOCs specifically relate to cancer pathogenesis and to validate their clinical utility as biomarkers.</p>
<p>Furthermore, the model&#x2019;s ability to track changes in VOC profiles over time, as demonstrated by the significant decrease in predicted risk following surgery, highlights its potential for monitoring disease progression and treatment response. Wang et&#xa0;al. demonstrated the feasibility of using perioperative dynamic breathomics to identify a panel of VOCs as potential biomarkers for lung cancer (<xref ref-type="bibr" rid="B55">55</xref>). By comparing VOC profiles before and after surgery, they identified 16 VOCs that were significantly altered in lung cancer patients, and a machine learning model based on these VOCs achieved high accuracy of 86.9% in differentiating between lung cancer patients and healthy controls. Nardi-Agmon et&#xa0;al. explored the potential of breath analysis for monitoring the response to anticancer treatment in patients with advanced lung cancer (<xref ref-type="bibr" rid="B56">56</xref>). By utilizing a panel of three VOCs identified as significant indicators of treatment outcomes, this approach may provide a rapid and non-invasive method for assessing treatment response, potentially enabling earlier detection of treatment failure compared to conventional imaging techniques. These findings highlight the growing evidences supporting breath analysis as a valuable tool for lung cancer management, with the ability to detect dynamic changes in VOC profiles pre- and post-treatment suggesting its potential as a complementary approach to existing diagnostic and monitoring strategies.</p>
<p>However, several limitations of this study should be acknowledged. Firstly, although our cohort was prospectively enrolled, the sample size (n=132) and subtype distribution (lung cancer 79.4%, thymoma 13.4%, esophageal cancer 7.2%) reflect the underlying epidemiology of thoracic malignancies (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B3">3</xref>, <xref ref-type="bibr" rid="B4">4</xref>). This distribution enabled robust differentiation between malignant and benign lesions, but the small numbers for rarer subtypes limit the strength of conclusions for thymoma and esophageal cancer. These analyses are exploratory and serve as preliminary, hypothesis-generating observations. External validation in larger, multi-center cohorts, particularly through collaboration with international consortia for rare thoracic tumors, is essential to confirm these findings and support broader clinical application. Secondly, the reliance on GC-MS for VOC analysis presents challenges for clinical implementation. GC-MS is a complex, time-consuming, and expensive technique that requires specialized equipment and expertise, making it less feasible for routine clinical use (<xref ref-type="bibr" rid="B57">57</xref>). To address this, future research should focus on validating these findings using point-of-care testing (POCT) devices, such as micro-GC systems (<xref ref-type="bibr" rid="B58">58</xref>&#x2013;<xref ref-type="bibr" rid="B65">65</xref>), electronic noses (<xref ref-type="bibr" rid="B66">66</xref>), or wearable VOC sensors (<xref ref-type="bibr" rid="B67">67</xref>), which offer real-time, bedside breath analysis for rapid clinical decision-making. However, challenges remain, including achieving sufficient sensor sensitivity and selectivity, minimizing sensor drift and environmental interference, and standardizing protocols. Progress in materials science and AI-driven data analysis, along with interdisciplinary collaboration, will be crucial to address these issues. Pilot studies in clinical settings are also needed to assess practicality, cost-effectiveness, and user acceptance, ultimately supporting the adoption of breath analysis in routine healthcare. Large-scale validation studies using such technologies could pave the way for the widespread adoption of breath analysis in clinical practice (<xref ref-type="bibr" rid="B58">58</xref>&#x2013;<xref ref-type="bibr" rid="B63">63</xref>). Thirdly, this study focused only on lung cancer, thymoma, and esophageal cancer, limiting its applicability to other thoracic malignancies. Future research should include mesothelioma, mediastinal tumors, and other rare thoracic cancers to develop a more comprehensive model, which could improve breath analysis for diagnosis and monitoring across the entire spectrum of thoracic oncology. Fourthly, while the study demonstrates the potential of VOC analysis, further research is needed to elucidate the underlying biological mechanisms and to address the technical challenges associated with breath sample collection and analysis. Finally, although LDCT is widely used for lung cancer screening, it carries high costs and a notable false-positive rate, which can lead to unnecessary follow-up tests and increased patient anxiety (<xref ref-type="bibr" rid="B68">68</xref>). In contrast, breath-based VOC analysis offers a non-invasive, radiation-free, and potentially more cost-effective screening approach. However, our current methodology relies on GC-MS, which is not yet feasible for large-scale screening due to its expense and complexity. The development of portable, point-of-care VOC detection platforms may help overcome these limitations, enabling broader clinical implementation and possibly reducing the economic and logistical burden associated with current screening methods. Future studies should directly compare the clinical and economic outcomes of VOC-based POCT and existing modalities such as LDCT to determine the most effective and sustainable strategies for early cancer detection. Despite these limitations, this study provides a strong foundation for the development of breath analysis as a valuable tool for the early detection, diagnosis, and monitoring of thoracic cancers.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<title>Conclusion</title>
<p>This study establishes the effectiveness of a breath-derived VOC model in distinguishing malignant and benign thoracic lesions, demonstrating its capability for multi-cancer detection and early-stage diagnosis. By pioneering breathomics for simultaneous identification of multiple thoracic malignancies and exploring its potential for postoperative monitoring, this work introduces a novel integration of non-invasive diagnostics with therapeutic surveillance. Compared to traditional serum biomarkers, the approach demonstrates superior sensitivity while eliminating invasive sampling, offering a patient-friendly alternative with clinical scalability. The methodology holds promise for improving early cancer detection and real-time postoperative evaluation, potentially enhancing clinical decision-making and personalized patient management. Future efforts should prioritize validation in broader populations, refinement of the predictive model, and development of point-of-care devices to facilitate clinical translation and improve patient outcomes.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s9" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Ethics Committee of the First Affiliated Hospital of Sun Yat-sen University. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s10" sec-type="author-contributions">
<title>Author contributions</title>
<p>ZC: Writing &#x2013; review &amp; editing, Conceptualization, Supervision. MP: Writing &#x2013; original draft, Writing &#x2013; review &amp; editing, Conceptualization. PF: Writing &#x2013; review &amp; editing, Formal Analysis, Data curation, Methodology. SC: Investigation, Writing &#x2013; review &amp; editing, Methodology. XC: Methodology, Formal Analysis, Writing &#x2013; review &amp; editing, Data curation. BX: Writing &#x2013; review &amp; editing, Formal Analysis, Validation. RC: Formal Analysis, Data curation, Resources, Writing &#x2013; review &amp; editing. XH: Methodology, Writing &#x2013; review &amp; editing, Visualization. WW: Validation, Writing &#x2013; review &amp; editing, Data curation, Investigation. TZ: Methodology, Data curation, Investigation, Writing &#x2013; review &amp; editing. JK: Writing &#x2013; review &amp; editing, Methodology, Data curation. WL: Software, Methodology, Writing &#x2013; review &amp; editing, Investigation. XQ: Writing &#x2013; review &amp; editing, Data curation, Project administration. STC: Methodology, Data curation, Supervision, Writing &#x2013; review &amp; editing. JW: Writing&#xa0;&#x2013; review &amp; editing, Project administration, Funding acquisition.</p>
</sec>
<sec id="s11" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research and/or publication of this article. This study was supported by the Disruptive Technology Innovation Project of the National Key Research and Development Program of China (2024YFF1501500).</p>
</sec>
<sec id="s12" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>Authors MP, PF, JK, WL, XQ, STC, JW were employed by the company ChromX Health Co., Ltd.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s13" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec id="s14" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s15" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fonc.2025.1635280/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fonc.2025.1635280/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bray</surname> <given-names>F</given-names>
</name>
<name>
<surname>Laversanne</surname> <given-names>M</given-names>
</name>
<name>
<surname>Sung</surname> <given-names>H</given-names>
</name>
<name>
<surname>Ferlay</surname> <given-names>J</given-names>
</name>
<name>
<surname>Siegel</surname> <given-names>RL</given-names>
</name>
<name>
<surname>Soerjomataram</surname> <given-names>I</given-names>
</name>
<etal/>
</person-group>. <article-title>Global cancer statistics 2022: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>. <source>CA Cancer J Clin</source>. (<year>2024</year>) <volume>74</volume>:<page-range>229&#x2013;63</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21834</pub-id>, PMID: <pub-id pub-id-type="pmid">38572751</pub-id></citation></ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Allemani</surname> <given-names>C</given-names>
</name>
<name>
<surname>Matsuda</surname> <given-names>T</given-names>
</name>
<name>
<surname>Di Carlo</surname> <given-names>V</given-names>
</name>
<name>
<surname>Harewood</surname> <given-names>R</given-names>
</name>
<name>
<surname>Matz</surname> <given-names>M</given-names>
</name>
<name>
<surname>Niksic</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Global surveillance of trends in cancer survival 2000-14 (CONCORD-3): analysis of individual records for 37 513&#x2013;025 patients diagnosed with one of 18 cancers from 322 population-based registries in 71 countries</article-title>. <source>Lancet</source>. (<year>2018</year>) <volume>391</volume>:<page-range>1023&#x2013;75</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0140-6736(17)33326-3</pub-id>, PMID: <pub-id pub-id-type="pmid">29395269</pub-id></citation></ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sheikh</surname> <given-names>M</given-names>
</name>
<name>
<surname>Roshandel</surname> <given-names>G</given-names>
</name>
<name>
<surname>McCormack</surname> <given-names>V</given-names>
</name>
<name>
<surname>Malekzadeh</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>Current status and future prospects for esophageal cancer</article-title>. <source>Cancers (Basel)</source>. (<year>2023</year>) <volume>15</volume>:<elocation-id>765</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/cancers15030765</pub-id>, PMID: <pub-id pub-id-type="pmid">36765722</pub-id></citation></ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alqaidy</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>Thymoma: an overview</article-title>. <source>Diagnostics (Basel)</source>. (<year>2023</year>) <volume>13</volume>:<elocation-id>2982</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/diagnostics13182982</pub-id>, PMID: <pub-id pub-id-type="pmid">37761349</pub-id></citation></ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lopes</surname> <given-names>R</given-names>
</name>
<name>
<surname>Betrouni</surname> <given-names>N</given-names>
</name>
</person-group>. <article-title>Fractal and multifractal analysis: a review</article-title>. <source>Med Image Anal</source>. (<year>2009</year>) <volume>13</volume>:<page-range>634&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.media.2009.05.003</pub-id>, PMID: <pub-id pub-id-type="pmid">19535282</pub-id></citation></ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Ge</surname> <given-names>X</given-names>
</name>
<name>
<surname>Niu</surname> <given-names>R</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>J</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Shao</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>PET/CT radiomics and deep learning in the diagnosis of benign and Malignant pulmonary nodules: progress and challenges</article-title>. <source>Front Oncol</source>. (<year>2024</year>) <volume>14</volume>:<elocation-id>1491762</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2024.1491762</pub-id>, PMID: <pub-id pub-id-type="pmid">39582533</pub-id></citation></ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nasim</surname> <given-names>F</given-names>
</name>
<name>
<surname>Sabath</surname> <given-names>BF</given-names>
</name>
<name>
<surname>Eapen</surname> <given-names>GA</given-names>
</name>
</person-group>. <article-title>Lung cancer</article-title>. <source>Med Clin North Am</source>. (<year>2019</year>) <volume>103</volume>:<page-range>463&#x2013;73</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.mcna.2018.12.006</pub-id>, PMID: <pub-id pub-id-type="pmid">30955514</pub-id></citation></ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>FL</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>SJ</given-names>
</name>
</person-group>. <article-title>Esophageal cancer: Risk factors, genetic association, and treatment</article-title>. <source>Asian J Surg</source>. (<year>2018</year>) <volume>41</volume>:<page-range>210&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.asjsur.2016.10.005</pub-id>, PMID: <pub-id pub-id-type="pmid">27986415</pub-id></citation></ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Phillips</surname> <given-names>M</given-names>
</name>
<name>
<surname>Herrera</surname> <given-names>J</given-names>
</name>
<name>
<surname>Krishnan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Zain</surname> <given-names>M</given-names>
</name>
<name>
<surname>Greenberg</surname> <given-names>J</given-names>
</name>
<name>
<surname>Cataneo</surname> <given-names>RN</given-names>
</name>
</person-group>. <article-title>Variation in volatile organic compounds in the breath of normal humans</article-title>. <source>J Chromatogr B BioMed Sci Appl</source>. (<year>1999</year>) <volume>729</volume>:<fpage>75</fpage>&#x2013;<lpage>88</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/s0378-4347(99)00127-9</pub-id>, PMID: <pub-id pub-id-type="pmid">10410929</pub-id></citation></ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Minh Tdo</surname> <given-names>C</given-names>
</name>
<name>
<surname>Blake DR and Galassetti</surname> <given-names>PR</given-names>
</name>
</person-group>. <article-title>The clinical potential of exhaled breath analysis for diabetes mellitus</article-title>. <source>Diabetes Res Clin Pract</source>. (<year>2012</year>) <volume>97</volume>:<fpage>195</fpage>&#x2013;<lpage>205</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.diabres.2012.02.006</pub-id>, PMID: <pub-id pub-id-type="pmid">22410396</pub-id></citation></ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bake</surname> <given-names>B</given-names>
</name>
<name>
<surname>Larsson</surname> <given-names>P</given-names>
</name>
<name>
<surname>Ljungkvist</surname> <given-names>G</given-names>
</name>
<name>
<surname>Ljungstrom</surname> <given-names>E</given-names>
</name>
<name>
<surname>Olin</surname> <given-names>AC</given-names>
</name>
</person-group>. <article-title>Exhaled particles and small airways</article-title>. <source>Respir Res</source>. (<year>2019</year>) <volume>20</volume>:<elocation-id>8</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12931-019-0970-9</pub-id>, PMID: <pub-id pub-id-type="pmid">30634967</pub-id></citation></ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brusselmans</surname> <given-names>L</given-names>
</name>
<name>
<surname>Arnouts</surname> <given-names>L</given-names>
</name>
<name>
<surname>Millevert</surname> <given-names>C</given-names>
</name>
<name>
<surname>Vandersnickt</surname> <given-names>J</given-names>
</name>
<name>
<surname>van Meerbeeck</surname> <given-names>JP</given-names>
</name>
<name>
<surname>Lamote</surname> <given-names>K</given-names>
</name>
</person-group>. <article-title>Breath analysis as a diagnostic and screening tool for Malignant pleural mesothelioma: a systematic review</article-title>. <source>Transl Lung Cancer Res</source>. (<year>2018</year>) <volume>7</volume>:<page-range>520&#x2013;36</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.21037/tlcr.2018.04.09</pub-id>, PMID: <pub-id pub-id-type="pmid">30450290</pub-id></citation></ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Phillips</surname> <given-names>M</given-names>
</name>
<name>
<surname>Greenberg</surname> <given-names>J</given-names>
</name>
<name>
<surname>Awad</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Metabolic and environmental origins of volatile organic compounds in breath</article-title>. <source>J Clin Pathol</source>. (<year>1994</year>) <volume>47</volume>:<page-range>1052&#x2013;3</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/jcp.47.11.1052</pub-id>, PMID: <pub-id pub-id-type="pmid">7829686</pub-id></citation></ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Haworth</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Pitcher</surname> <given-names>CK</given-names>
</name>
<name>
<surname>Ferrandino</surname> <given-names>G</given-names>
</name>
<name>
<surname>Hobson</surname> <given-names>AR</given-names>
</name>
<name>
<surname>Pappan</surname> <given-names>KL</given-names>
</name>
<name>
<surname>Lawson</surname> <given-names>JLD</given-names>
</name>
</person-group>. <article-title>Breathing new life into clinical testing and diagnostics: perspectives on volatile biomarkers from breath</article-title>. <source>Crit Rev Clin Lab Sci</source>. (<year>2022</year>) <volume>59</volume>:<page-range>353&#x2013;72</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10408363.2022.2038075</pub-id>, PMID: <pub-id pub-id-type="pmid">35188863</pub-id></citation></ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fan</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhong</surname> <given-names>R</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Zhong</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>H</given-names>
</name>
<name>
<surname>He</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Exhaled VOC detection in lung cancer screening: a comprehensive meta-analysis</article-title>. <source>BMC Cancer</source>. (<year>2024</year>) <volume>24</volume>:<fpage>775</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12885-024-12537-7</pub-id>, PMID: <pub-id pub-id-type="pmid">38937687</pub-id></citation></ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saalberg</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wolff</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>VOC breath biomarkers in lung cancer</article-title>. <source>Clin Chim Acta</source>. (<year>2016</year>) <volume>459</volume>:<fpage>5</fpage>&#x2013;<lpage>9</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cca.2016.05.013</pub-id>, PMID: <pub-id pub-id-type="pmid">27221203</pub-id></citation></ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peled</surname> <given-names>N</given-names>
</name>
<name>
<surname>Fuchs</surname> <given-names>V</given-names>
</name>
<name>
<surname>Kestenbaum</surname> <given-names>EH</given-names>
</name>
<name>
<surname>Oscar</surname> <given-names>E</given-names>
</name>
<name>
<surname>Bitran</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>An update on the use of exhaled breath analysis for the early detection of lung cancer</article-title>. <source>Lung Cancer (Auckl)</source>. (<year>2021</year>) <volume>12</volume>:<fpage>81</fpage>&#x2013;<lpage>92</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2147/LCTT.S320493</pub-id>, PMID: <pub-id pub-id-type="pmid">34429674</pub-id></citation></ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Su</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>X</given-names>
</name>
<name>
<surname>He</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Sha</surname> <given-names>T</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>H</given-names>
</name>
<name>
<surname>Tao</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Inconsistencies in predictive models based on exhaled volatile organic compounds for distinguishing between benign pulmonary nodules and lung cancer: a systematic review</article-title>. <source>BMC Pulm Med</source>. (<year>2024</year>) <volume>24</volume>:<fpage>551</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12890-024-03374-2</pub-id>, PMID: <pub-id pub-id-type="pmid">39488679</pub-id></citation></ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leemans</surname> <given-names>M</given-names>
</name>
<name>
<surname>Bauer</surname> <given-names>P</given-names>
</name>
<name>
<surname>Cuzuel</surname> <given-names>V</given-names>
</name>
<name>
<surname>Audureau</surname> <given-names>E</given-names>
</name>
<name>
<surname>Fromantin</surname> <given-names>I</given-names>
</name>
</person-group>. <article-title>Volatile organic compounds analysis as a potential novel screening tool for breast cancer: A systematic review</article-title>. <source>biomark Insights</source>. (<year>2022</year>) <volume>17</volume>:<elocation-id>11772719221100709</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/11772719221100709</pub-id>, PMID: <pub-id pub-id-type="pmid">35645556</pub-id></citation></ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chung</surname> <given-names>J</given-names>
</name>
<name>
<surname>Akter</surname> <given-names>S</given-names>
</name>
<name>
<surname>Han</surname> <given-names>S</given-names>
</name>
<name>
<surname>Shin</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Choi</surname> <given-names>TG</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>I</given-names>
</name>
<etal/>
</person-group>. <article-title>Diagnosis by volatile organic compounds in exhaled breath in exhaled breath from patients with gastric and colorectal cancers</article-title>. <source>Int J Mol Sci</source>. (<year>2022</year>) <volume>24</volume>:<elocation-id>129</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms24010129</pub-id>, PMID: <pub-id pub-id-type="pmid">36613569</pub-id></citation></ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van Liere</surname> <given-names>E</given-names>
</name>
<name>
<surname>van Dijk</surname> <given-names>LJ</given-names>
</name>
<name>
<surname>Bosch</surname> <given-names>S</given-names>
</name>
<name>
<surname>Vermeulen</surname> <given-names>L</given-names>
</name>
<name>
<surname>Heymans</surname> <given-names>MW</given-names>
</name>
<name>
<surname>Burchell</surname> <given-names>GL</given-names>
</name>
<etal/>
</person-group>. <article-title>Urinary volatile organic compounds for colorectal cancer screening: A systematic review and meta-analysis</article-title>. <source>Eur J Cancer</source>. (<year>2023</year>) <volume>186</volume>:<fpage>69</fpage>&#x2013;<lpage>82</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ejca.2023.03.002</pub-id>, PMID: <pub-id pub-id-type="pmid">37030079</pub-id></citation></ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hintzen</surname> <given-names>KFH</given-names>
</name>
<name>
<surname>Grote</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wintjens</surname> <given-names>A</given-names>
</name>
<name>
<surname>Lubbers</surname> <given-names>T</given-names>
</name>
<name>
<surname>Eussen</surname> <given-names>MMM</given-names>
</name>
<name>
<surname>van Schooten</surname> <given-names>FJ</given-names>
</name>
<etal/>
</person-group>. <article-title>Breath analysis for the detection of digestive tract Malignancies: systematic review</article-title>. <source>BJS Open</source>. (<year>2021</year>) <volume>5</volume>:<elocation-id>zrab013</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bjsopen/zrab013</pub-id>, PMID: <pub-id pub-id-type="pmid">33855362</pub-id></citation></ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gordon</surname> <given-names>SM</given-names>
</name>
<name>
<surname>Szidon</surname> <given-names>JP</given-names>
</name>
<name>
<surname>Krotoszynski</surname> <given-names>BK</given-names>
</name>
<name>
<surname>Gibbons</surname> <given-names>RD</given-names>
</name>
<name>
<surname>O'Neill</surname> <given-names>HJ</given-names>
</name>
</person-group>. <article-title>Volatile organic compounds in exhaled air from patients with lung cancer</article-title>. <source>Clin Chem</source>. (<year>1985</year>) <volume>31</volume>:<page-range>1278&#x2013;82</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/clinchem/31.8.1278</pub-id>, PMID: <pub-id pub-id-type="pmid">4017231</pub-id></citation></ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kumar</surname> <given-names>S</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Abbassi-Ghadi</surname> <given-names>N</given-names>
</name>
<name>
<surname>Mackenzie</surname> <given-names>HA</given-names>
</name>
<name>
<surname>Veselkov</surname> <given-names>KA</given-names>
</name>
<name>
<surname>Hoare</surname> <given-names>JM</given-names>
</name>
<etal/>
</person-group>. <article-title>Mass spectrometric analysis of exhaled breath for the identification of volatile organic compound biomarkers in esophageal and gastric adenocarcinoma</article-title>. <source>Ann Surg</source>. (<year>2015</year>) <volume>262</volume>:<page-range>981&#x2013;90</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/SLA.0000000000001101</pub-id>, PMID: <pub-id pub-id-type="pmid">25575255</pub-id></citation></ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boccard</surname> <given-names>J</given-names>
</name>
<name>
<surname>Rutledge</surname> <given-names>DN</given-names>
</name>
</person-group>. <article-title>A consensus orthogonal partial least squares discriminant analysis (OPLS-DA) strategy for multiblock Omics data fusion</article-title>. <source>Anal Chim Acta</source>. (<year>2013</year>) <volume>769</volume>:<page-range>30&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.aca.2013.01.022</pub-id>, PMID: <pub-id pub-id-type="pmid">23498118</pub-id></citation></ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname> <given-names>H</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>X</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>W</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>H</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Logistic regression analysis of risk factors for Respiratory Distress Syndrome in Late Preterm Infants</article-title>. <source>Pak J Med Sci</source>. (<year>2025</year>) <volume>41</volume>:<page-range>461&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.12669/pjms.41.2.9796</pub-id>, PMID: <pub-id pub-id-type="pmid">39926690</pub-id></citation></ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jin</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Lan</surname> <given-names>A</given-names>
</name>
<name>
<surname>Dai</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Development and testing of a random forest-based machine learning model for predicting events among breast cancer patients with a poor response to neoadjuvant chemotherapy</article-title>. <source>Eur J Med Res</source>. (<year>2023</year>) <volume>28</volume>:<fpage>394</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s40001-023-01361-7</pub-id>, PMID: <pub-id pub-id-type="pmid">37777809</pub-id></citation></ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Florimbi</surname> <given-names>G</given-names>
</name>
<name>
<surname>Fabelo</surname> <given-names>H</given-names>
</name>
<name>
<surname>Torti</surname> <given-names>E</given-names>
</name>
<name>
<surname>Lazcano</surname> <given-names>R</given-names>
</name>
<name>
<surname>Madronal</surname> <given-names>D</given-names>
</name>
<name>
<surname>Ortega</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Accelerating the K-Nearest Neighbors Filtering Algorithm to Optimize the Real-Time Classification of Human Brain Tumor in Hyperspectral Images</article-title>. <source>Sensors (Basel)</source>. (<year>2018</year>) <volume>18</volume>:<elocation-id>2314</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/s18072314</pub-id>, PMID: <pub-id pub-id-type="pmid">30018216</pub-id></citation></ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ogunleye</surname> <given-names>A</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>QG</given-names>
</name>
</person-group>. <article-title>XGBoost model for chronic kidney disease diagnosis</article-title>. <source>IEEE/ACM Trans Comput Biol Bioinform</source>. (<year>2020</year>) <volume>17</volume>:<page-range>2131&#x2013;40</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TCBB.2019.2911071</pub-id>, PMID: <pub-id pub-id-type="pmid">30998478</pub-id></citation></ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Polat</surname> <given-names>H</given-names>
</name>
<name>
<surname>Danaei Mehr</surname> <given-names>H</given-names>
</name>
<name>
<surname>Cetin</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Diagnosis of chronic kidney disease based on support vector machine by feature selection methods</article-title>. <source>J Med Syst</source>. (<year>2017</year>) <volume>41</volume>:<fpage>55</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10916-017-0703-x</pub-id>, PMID: <pub-id pub-id-type="pmid">28243816</pub-id></citation></ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Koureas</surname> <given-names>M</given-names>
</name>
<name>
<surname>Kirgou</surname> <given-names>P</given-names>
</name>
<name>
<surname>Amoutzias</surname> <given-names>G</given-names>
</name>
<name>
<surname>Hadjichristodoulou</surname> <given-names>C</given-names>
</name>
<name>
<surname>Gourgoulianis</surname> <given-names>K</given-names>
</name>
<name>
<surname>Tsakalof</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Target analysis of volatile organic compounds in exhaled breath for lung cancer discrimination from other pulmonary diseases and healthy persons</article-title>. <source>Metabolites</source>. (<year>2020</year>) <volume>10</volume>:<elocation-id>317</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/metabo10080317</pub-id>, PMID: <pub-id pub-id-type="pmid">32756521</pub-id></citation></ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Callol-Sanchez</surname> <given-names>L</given-names>
</name>
<name>
<surname>Munoz-Lucas</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Gomez-Martin</surname> <given-names>O</given-names>
</name>
<name>
<surname>Maldonado-Sanz</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Civera-Tejuca</surname> <given-names>C</given-names>
</name>
<name>
<surname>Gutierrez-Ortega</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>Observation of nonanoic acid and aldehydes in exhaled breath of patients with lung cancer</article-title>. <source>J Breath Res</source>. (<year>2017</year>) <volume>11</volume>:<fpage>026004</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1088/1752-7163/aa6485</pub-id>, PMID: <pub-id pub-id-type="pmid">28440225</pub-id></citation></ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>X</given-names>
</name>
<name>
<surname>Muhammad</surname> <given-names>KG</given-names>
</name>
<name>
<surname>Madeeha</surname> <given-names>C</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>W</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>L</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Calculated indices of volatile organic compounds (VOCs) in exhalation for lung cancer screening and early detection</article-title>. <source>Lung Cancer</source>. (<year>2021</year>) <volume>154</volume>:<fpage>197</fpage>&#x2013;<lpage>205</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.lungcan.2021.02.006</pub-id>, PMID: <pub-id pub-id-type="pmid">33653598</pub-id></citation></ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>M</given-names>
</name>
<name>
<surname>Sheng</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Ying</surname> <given-names>K</given-names>
</name>
<etal/>
</person-group>. <article-title>Confounding effect of benign pulmonary diseases in selecting volatile organic compounds as markers of lung cancer</article-title>. <source>J Breath Res</source>. (<year>2018</year>) <volume>12</volume>:<fpage>046013</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1088/1752-7163/aad9cc</pub-id>, PMID: <pub-id pub-id-type="pmid">30102249</pub-id></citation></ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zou</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>Exhaled metabolic markers and relevant dysregulated pathways of lung cancer: a pilot study</article-title>. <source>Ann Med</source>. (<year>2022</year>) <volume>54</volume>:<fpage>790</fpage>&#x2013;<lpage>802</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/07853890.2022.2048064</pub-id>, PMID: <pub-id pub-id-type="pmid">35261323</pub-id></citation></ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fernandez Del Rio</surname> <given-names>R</given-names>
</name>
<name>
<surname>O'Hara</surname> <given-names>ME</given-names>
</name>
<name>
<surname>Holt</surname> <given-names>A</given-names>
</name>
<name>
<surname>Pemberton</surname> <given-names>P</given-names>
</name>
<name>
<surname>Shah</surname> <given-names>T</given-names>
</name>
<name>
<surname>Whitehouse</surname> <given-names>T</given-names>
</name>
<etal/>
</person-group>. <article-title>Volatile biomarkers in breath associated with liver cirrhosis - comparisons of pre- and post-liver transplant breath samples</article-title>. <source>EBioMedicine</source>. (<year>2015</year>) <volume>2</volume>:<page-range>1243&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ebiom.2015.07.027</pub-id>, PMID: <pub-id pub-id-type="pmid">26501124</pub-id></citation></ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>O'Neill</surname> <given-names>HJ</given-names>
</name>
<name>
<surname>Gordon</surname> <given-names>SM</given-names>
</name>
<name>
<surname>Krotoszynski</surname> <given-names>B</given-names>
</name>
<name>
<surname>Kavin</surname> <given-names>H</given-names>
</name>
<name>
<surname>Szidon</surname> <given-names>JP</given-names>
</name>
</person-group>. <article-title>Identification of isoprenoid-type components in human expired air: a possible shunt pathway in sterol metabolism</article-title>. <source>BioMed Chromatogr</source>. (<year>1987</year>) <volume>2</volume>:<fpage>66</fpage>&#x2013;<lpage>70</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/bmc.1130020206</pub-id>, PMID: <pub-id pub-id-type="pmid">3147729</pub-id></citation></ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peralbo-Molina</surname> <given-names>A</given-names>
</name>
<name>
<surname>Calderon-Santiago</surname> <given-names>M</given-names>
</name>
<name>
<surname>Priego-Capote</surname> <given-names>F</given-names>
</name>
<name>
<surname>Jurado-Gamez</surname> <given-names>B</given-names>
</name>
<name>
<surname>Luque de Castro</surname> <given-names>MD</given-names>
</name>
</person-group>. <article-title>Identification of metabolomics panels for potential lung cancer screening by analysis of exhaled breath condensate</article-title>. <source>J Breath Res</source>. (<year>2016</year>) <volume>10</volume>:<elocation-id>26002</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1088/1752-7155/10/2/026002</pub-id>, PMID: <pub-id pub-id-type="pmid">27007686</pub-id></citation></ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dung</surname> <given-names>CH</given-names>
</name>
<name>
<surname>Wu SC and Yen</surname> <given-names>GC</given-names>
</name>
</person-group>. <article-title>Genotoxicity and oxidative stress of the mutagenic compounds formed in fumes of heated soybean oil, sunflower oil and lard</article-title>. <source>Toxicol In Vitro</source>. (<year>2006</year>) <volume>20</volume>:<page-range>439&#x2013;47</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tiv.2005.08.019</pub-id>, PMID: <pub-id pub-id-type="pmid">16216463</pub-id></citation></ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>SC</given-names>
</name>
<name>
<surname>Yen GC and Sheu</surname> <given-names>F</given-names>
</name>
</person-group>. <article-title>Mutagenicity and identification of mutagenic compounds of fumes obtained from heating peanut oil</article-title>. <source>J Food Prot</source>. (<year>2001</year>) <volume>64</volume>:<page-range>240&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.4315/0362-028x-64.2.240</pub-id>, PMID: <pub-id pub-id-type="pmid">11271774</pub-id></citation></ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zbar</surname> <given-names>AP</given-names>
</name>
</person-group>. <article-title>Exhaled volatile organic compounds identify patients with colorectal cancer (Br J Surg 2013; 100: 144-150)</article-title>. <source>Br J Surg</source>. (<year>2013</year>) <volume>100</volume>:<fpage>151</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/bjs.8970</pub-id>, PMID: <pub-id pub-id-type="pmid">23212622</pub-id></citation></ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kononova</surname> <given-names>E</given-names>
</name>
<name>
<surname>Mezmale</surname> <given-names>L</given-names>
</name>
<name>
<surname>Polaka</surname> <given-names>I</given-names>
</name>
<name>
<surname>Veliks</surname> <given-names>V</given-names>
</name>
<name>
<surname>Anarkulova</surname> <given-names>L</given-names>
</name>
<name>
<surname>Vilkoite</surname> <given-names>I</given-names>
</name>
<etal/>
</person-group>. <article-title>Breath fingerprint of colorectal cancer patients based on the gas chromatography-mass spectrometry analysis</article-title>. <source>Int J Mol Sci</source>. (<year>2024</year>) <volume>25</volume>:<fpage>1632</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms25031632</pub-id>, PMID: <pub-id pub-id-type="pmid">38338911</pub-id></citation></ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Amal</surname> <given-names>H</given-names>
</name>
<name>
<surname>Leja</surname> <given-names>M</given-names>
</name>
<name>
<surname>Broza</surname> <given-names>YY</given-names>
</name>
<name>
<surname>Tisch</surname> <given-names>U</given-names>
</name>
<name>
<surname>Funka</surname> <given-names>K</given-names>
</name>
<name>
<surname>Liepniece-Karele</surname> <given-names>I</given-names>
</name>
<etal/>
</person-group>. <article-title>Geographical variation in the exhaled volatile organic compounds</article-title>. <source>J Breath Res</source>. (<year>2013</year>) <volume>7</volume>:<elocation-id>47102</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1088/1752-7155/7/4/047102</pub-id>, PMID: <pub-id pub-id-type="pmid">24184568</pub-id></citation></ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>ZQ</given-names>
</name>
<name>
<surname>Broza</surname> <given-names>YY</given-names>
</name>
<name>
<surname>Ionsecu</surname> <given-names>R</given-names>
</name>
<name>
<surname>Tisch</surname> <given-names>U</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>L</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>A nanomaterial-based breath test for distinguishing gastric cancer from benign gastric conditions</article-title>. <source>Br J Cancer</source>. (<year>2013</year>) <volume>108</volume>:<page-range>941&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/bjc.2013.44</pub-id>, PMID: <pub-id pub-id-type="pmid">23462808</pub-id></citation></ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shehada</surname> <given-names>N</given-names>
</name>
<name>
<surname>Bronstrup</surname> <given-names>G</given-names>
</name>
<name>
<surname>Funka</surname> <given-names>K</given-names>
</name>
<name>
<surname>Christiansen</surname> <given-names>S</given-names>
</name>
<name>
<surname>Leja</surname> <given-names>M</given-names>
</name>
<name>
<surname>Haick</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Ultrasensitive silicon nanowire for real-world gas sensing: noninvasive diagnosis of cancer from breath volatolome</article-title>. <source>Nano Lett</source>. (<year>2015</year>) <volume>15</volume>:<page-range>1288&#x2013;95</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/nl504482t</pub-id>, PMID: <pub-id pub-id-type="pmid">25494909</pub-id></citation></ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Markar</surname> <given-names>SR</given-names>
</name>
<name>
<surname>Wiggins</surname> <given-names>T</given-names>
</name>
<name>
<surname>Antonowicz</surname> <given-names>S</given-names>
</name>
<name>
<surname>Chin</surname> <given-names>ST</given-names>
</name>
<name>
<surname>Romano</surname> <given-names>A</given-names>
</name>
<name>
<surname>Nikolic</surname> <given-names>K</given-names>
</name>
<etal/>
</person-group>. <article-title>Assessment of a noninvasive exhaled breath test for the diagnosis of oesophagogastric cancer</article-title>. <source>JAMA Oncol</source>. (<year>2018</year>) <volume>4</volume>:<page-range>970&#x2013;6</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/jamaoncol.2018.0991</pub-id>, PMID: <pub-id pub-id-type="pmid">29799976</pub-id></citation></ref>
<ref id="B47">
<label>47</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abbassi-Ghadi</surname> <given-names>N</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>S</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Goldin</surname> <given-names>R</given-names>
</name>
<name>
<surname>Takats</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Hanna</surname> <given-names>GB</given-names>
</name>
</person-group>. <article-title>Metabolomic profiling of oesophago-gastric cancer: a systematic review</article-title>. <source>Eur J Cancer</source>. (<year>2013</year>) <volume>49</volume>:<page-range>3625&#x2013;37</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ejca.2013.07.004</pub-id>, PMID: <pub-id pub-id-type="pmid">23896378</pub-id></citation></ref>
<ref id="B48">
<label>48</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Altomare</surname> <given-names>DF</given-names>
</name>
<name>
<surname>Di Lena</surname> <given-names>M</given-names>
</name>
<name>
<surname>Porcelli</surname> <given-names>F</given-names>
</name>
<name>
<surname>Trizio</surname> <given-names>L</given-names>
</name>
<name>
<surname>Travaglio</surname> <given-names>E</given-names>
</name>
<name>
<surname>Tutino</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Exhaled volatile organic compounds identify patients with colorectal cancer</article-title>. <source>Br J Surg</source>. (<year>2013</year>) <volume>100</volume>:<page-range>144&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/bjs.8942</pub-id>, PMID: <pub-id pub-id-type="pmid">23212621</pub-id></citation></ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wroblewski</surname> <given-names>LE</given-names>
</name>
<name>
<surname>Peek</surname> <given-names>RM</given-names>
<suffix>Jr.</suffix>
</name>
<name>
<surname>Coburn</surname> <given-names>LA</given-names>
</name>
</person-group>. <article-title>The role of the microbiome in gastrointestinal cancer</article-title>. <source>Gastroenterol Clin North Am</source>. (<year>2016</year>) <volume>45</volume>:<page-range>543&#x2013;56</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.gtc.2016.04.010</pub-id>, PMID: <pub-id pub-id-type="pmid">27546848</pub-id></citation></ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ge</surname> <given-names>D</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>J</given-names>
</name>
<name>
<surname>Chu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X</given-names>
</name>
<name>
<surname>Xia</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>Distinguish oral-source VOCs and control their potential impact on breath biomarkers</article-title>. <source>Anal Bioanal Chem</source>. (<year>2022</year>) <volume>414</volume>:<page-range>2275&#x2013;84</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00216-021-03866-8</pub-id>, PMID: <pub-id pub-id-type="pmid">34982180</pub-id></citation></ref>
<ref id="B51">
<label>51</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J</given-names>
</name>
<name>
<surname>He</surname> <given-names>J</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>D</given-names>
</name>
<name>
<surname>Meng</surname> <given-names>X</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>T</given-names>
</name>
<etal/>
</person-group>. <article-title>A method of detecting two tumor markers (p-hydroxybenzoic acid and p-cresol) in human urine using a porous magnetic -cyclodextrine polymer as solid phase extractant, an alternative for early gastric cancer diagnosis</article-title>. <source>Talanta</source>. (<year>2019</year>) <volume>191</volume>:<page-range>133&#x2013;40</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.talanta.2018.08.036</pub-id>, PMID: <pub-id pub-id-type="pmid">30262042</pub-id></citation></ref>
<ref id="B52">
<label>52</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Filipiak</surname> <given-names>W</given-names>
</name>
<name>
<surname>Wenzel</surname> <given-names>M</given-names>
</name>
<name>
<surname>Ager</surname> <given-names>C</given-names>
</name>
<name>
<surname>Mayhew</surname> <given-names>CA</given-names>
</name>
<name>
<surname>Bogiel</surname> <given-names>T</given-names>
</name>
<name>
<surname>Wlodarski</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Molecular Analysis of Volatile Metabolites Synthesized by Candida albicans and Staphylococcus aureus in <italic>In Vitro</italic> Cultures and Bronchoalveolar Lavage Specimens Reflecting Single- or Duo-Factor Pneumonia</article-title>. <source>Biomolecules</source>. (<year>2024</year>) <volume>14</volume>:<elocation-id>788</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/biom14070788</pub-id>, PMID: <pub-id pub-id-type="pmid">39062502</pub-id></citation></ref>
<ref id="B53">
<label>53</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Debarba</surname> <given-names>LK</given-names>
</name>
<name>
<surname>Jayarathne</surname> <given-names>HSM</given-names>
</name>
<name>
<surname>Stilgenbauer</surname> <given-names>L</given-names>
</name>
<name>
<surname>Terra Dos Santos</surname> <given-names>AL</given-names>
</name>
<name>
<surname>Koshko</surname> <given-names>L</given-names>
</name>
<name>
<surname>Scofield</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Microglial NF-kappaB signaling deficiency protects against metabolic disruptions caused by volatile organic compound via modulating the hypothalamic transcriptome</article-title>. <source>bioRxiv</source>. (<year>2023</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2023.11.08.566279</pub-id>, PMID: <pub-id pub-id-type="pmid">38014216</pub-id></citation></ref>
<ref id="B54">
<label>54</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Snieckute</surname> <given-names>G</given-names>
</name>
<name>
<surname>Ryder</surname> <given-names>L</given-names>
</name>
<name>
<surname>Vind</surname> <given-names>AC</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Arendrup</surname> <given-names>FS</given-names>
</name>
<name>
<surname>Stoneley</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>ROS-induced ribosome impairment underlies ZAKalpha-mediated metabolic decline in obesity and aging</article-title>. <source>Science</source>. (<year>2023</year>) <volume>382</volume>:<elocation-id>eadf3208</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.adf3208</pub-id>, PMID: <pub-id pub-id-type="pmid">38060659</pub-id></citation></ref>
<ref id="B55">
<label>55</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>P</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Meng</surname> <given-names>S</given-names>
</name>
<name>
<surname>Mu</surname> <given-names>T</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>He</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Identification of lung cancer breath biomarkers based on perioperative breathomics testing: A prospective observational study</article-title>. <source>EClinicalMedicine</source>. (<year>2022</year>) <volume>47</volume>:<elocation-id>101384</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eclinm.2022.101384</pub-id>, PMID: <pub-id pub-id-type="pmid">35480076</pub-id></citation></ref>
<ref id="B56">
<label>56</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nardi-Agmon</surname> <given-names>I</given-names>
</name>
<name>
<surname>Abud-Hawa</surname> <given-names>M</given-names>
</name>
<name>
<surname>Liran</surname> <given-names>O</given-names>
</name>
<name>
<surname>Gai-Mor</surname> <given-names>N</given-names>
</name>
<name>
<surname>Ilouze</surname> <given-names>M</given-names>
</name>
<name>
<surname>Onn</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Exhaled breath analysis for monitoring response to treatment in advanced lung cancer</article-title>. <source>J Thorac Oncol</source>. (<year>2016</year>) <volume>11</volume>:<page-range>827&#x2013;37</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jtho.2016.02.017</pub-id>, PMID: <pub-id pub-id-type="pmid">26968885</pub-id></citation></ref>
<ref id="B57">
<label>57</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hanna</surname> <given-names>GB</given-names>
</name>
<name>
<surname>Boshier</surname> <given-names>PR</given-names>
</name>
<name>
<surname>Markar</surname> <given-names>SR</given-names>
</name>
<name>
<surname>Romano</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Accuracy and methodologic challenges of volatile organic compound-based exhaled breath tests for cancer diagnosis: A systematic review and meta-analysis</article-title>. <source>JAMA Oncol</source>. (<year>2019</year>) <volume>5</volume>:<fpage>e182815</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/jamaoncol.2018.2815</pub-id>, PMID: <pub-id pub-id-type="pmid">30128487</pub-id></citation></ref>
<ref id="B58">
<label>58</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Nunovero</surname> <given-names>N</given-names>
</name>
<name>
<surname>Nidetz</surname> <given-names>R</given-names>
</name>
<name>
<surname>Peterson</surname> <given-names>SJ</given-names>
</name>
<name>
<surname>Brookover</surname> <given-names>BM</given-names>
</name>
<name>
<surname>Steinecker</surname> <given-names>WH</given-names>
</name>
<etal/>
</person-group>. <article-title>Belt-mounted micro-gas-chromatograph prototype for determining personal exposures to volatile-organic-compound mixture components</article-title>. <source>Anal Chem</source>. (<year>2019</year>) <volume>91</volume>:<page-range>4747&#x2013;54</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/acs.analchem.9b00263</pub-id>, PMID: <pub-id pub-id-type="pmid">30836745</pub-id></citation></ref>
<ref id="B59">
<label>59</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Kulkarni</surname> <given-names>GS</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>H</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>K</given-names>
</name>
<etal/>
</person-group>. <article-title>A microcolumn DC graphene sensor for rapid, sensitive, and universal chemical vapor detection</article-title>. <source>Nano Lett</source>. (<year>2021</year>) <volume>21</volume>:<page-range>10301&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/acs.nanolett.1c03416</pub-id>, PMID: <pub-id pub-id-type="pmid">34878794</pub-id></citation></ref>
<ref id="B60">
<label>60</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Sharma</surname> <given-names>R</given-names>
</name>
<name>
<surname>Sivakumar</surname> <given-names>AD</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Fan</surname> <given-names>X</given-names>
</name>
</person-group>. <article-title>Ultrathin silica integration for enhancing reliability of microfluidic photoionization detectors</article-title>. <source>Anal Chem</source>. (<year>2023</year>) <volume>95</volume>:<page-range>8496&#x2013;504</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/acs.analchem.3c00354</pub-id>, PMID: <pub-id pub-id-type="pmid">37278057</pub-id></citation></ref>
<ref id="B61">
<label>61</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei-Hao Li</surname> <given-names>M</given-names>
</name>
<name>
<surname>Ghosh</surname> <given-names>A</given-names>
</name>
<name>
<surname>Venkatasubramanian</surname> <given-names>A</given-names>
</name>
<name>
<surname>Sharma</surname> <given-names>R</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Fan</surname> <given-names>X</given-names>
</name>
</person-group>. <article-title>High-sensitivity micro-gas chromatograph-photoionization detector for trace vapor detection</article-title>. <source>ACS Sens</source>. (<year>2021</year>) <volume>6</volume>:<page-range>2348&#x2013;55</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/acssensors.1c00482</pub-id>, PMID: <pub-id pub-id-type="pmid">34028248</pub-id></citation></ref>
<ref id="B62">
<label>62</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sharma</surname> <given-names>R</given-names>
</name>
<name>
<surname>Zang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>M</given-names>
</name>
<name>
<surname>Schafer</surname> <given-names>N</given-names>
</name>
<name>
<surname>Begley</surname> <given-names>LA</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>YJ</given-names>
</name>
<etal/>
</person-group>. <article-title>Real time breath analysis using portable gas chromatography for adult asthma phenotypes</article-title>. <source>Metabolites</source>. (<year>2021</year>) <volume>11</volume>:<elocation-id>265</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/metabo11050265</pub-id>, PMID: <pub-id pub-id-type="pmid">33922762</pub-id></citation></ref>
<ref id="B63">
<label>63</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sharma</surname> <given-names>R</given-names>
</name>
<name>
<surname>Zang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Tabartehfarahani</surname> <given-names>A</given-names>
</name>
<name>
<surname>Lam</surname> <given-names>A</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Sivakumar</surname> <given-names>AD</given-names>
</name>
<etal/>
</person-group>. <article-title>Portable breath-based volatile organic compound monitoring for the detection of COVID-19 during the circulation of the SARS-coV-2 delta variant and the transition to the SARS-coV-2 omicron variant</article-title>. <source>JAMA Netw Open</source>. (<year>2023</year>) <volume>6</volume>:<fpage>e230982</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.0982</pub-id>, PMID: <pub-id pub-id-type="pmid">36853606</pub-id></citation></ref>
<ref id="B64">
<label>64</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tian</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>M</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>W</given-names>
</name>
<etal/>
</person-group>. <article-title>Exhaled volatile organic compounds as novel biomarkers for early detection of COPD, asthma, and PRISm: a cross-sectional study</article-title>. <source>Respir Res</source>. (<year>2025</year>) <volume>26</volume>:<fpage>173</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12931-025-03242-5</pub-id>, PMID: <pub-id pub-id-type="pmid">40325477</pub-id></citation></ref>
<ref id="B65">
<label>65</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lai</surname> <given-names>W</given-names>
</name>
<name>
<surname>Li</surname> <given-names>D</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Geng</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Xia</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Exhaled breath is feasible for mild cognitive impairment detection: A diagnostic study with portable micro-gas chromatography</article-title>. <source>J Alzheimers Dis</source>. (<year>2025</year>) <volume>104</volume>:<page-range>751&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/13872877251319553</pub-id>, PMID: <pub-id pub-id-type="pmid">39956982</pub-id></citation></ref>
<ref id="B66">
<label>66</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buma</surname> <given-names>AIG</given-names>
</name>
<name>
<surname>Muntinghe-Wagenaar</surname> <given-names>MB</given-names>
</name>
<name>
<surname>van der Noort</surname> <given-names>V</given-names>
</name>
<name>
<surname>de Vries</surname> <given-names>R</given-names>
</name>
<name>
<surname>Schuurbiers</surname> <given-names>MMF</given-names>
</name>
<name>
<surname>Sterk</surname> <given-names>PJ</given-names>
</name>
<etal/>
</person-group>. <article-title>Lung cancer detection by electronic nose analysis of exhaled breath: a multicentre prospective external validation study</article-title>. <source>Ann Oncol</source>. (<year>2025</year>) <volume>36</volume>:<page-range>786&#x2013;95</page-range>.  doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.annonc.2025.03.013</pub-id>, PMID: <pub-id pub-id-type="pmid">40174676</pub-id></citation></ref>
<ref id="B67">
<label>67</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vishinkin</surname> <given-names>R</given-names>
</name>
<name>
<surname>Busool</surname> <given-names>R</given-names>
</name>
<name>
<surname>Mansour</surname> <given-names>E</given-names>
</name>
<name>
<surname>Fish</surname> <given-names>F</given-names>
</name>
<name>
<surname>Esmail</surname> <given-names>A</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>P</given-names>
</name>
<etal/>
</person-group>. <article-title>Profiles of volatile biomarkers detect tuberculosis from skin</article-title>. <source>Adv Sci (Weinh)</source>. (<year>2021</year>) <volume>8</volume>:<fpage>e2100235</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/advs.202100235</pub-id>, PMID: <pub-id pub-id-type="pmid">34075714</pub-id></citation></ref>
<ref id="B68">
<label>68</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<collab>National Lung Screening Trial Research T</collab>
<name>
<surname>Aberle</surname> <given-names>DR</given-names>
</name>
<name>
<surname>Adams</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Berg</surname> <given-names>CD</given-names>
</name>
<name>
<surname>Black</surname> <given-names>WC</given-names>
</name>
<name>
<surname>Clapp</surname> <given-names>JD</given-names>
</name>
<etal/>
</person-group>. <article-title>Reduced lung-cancer mortality with low-dose computed tomographic screening</article-title>. <source>N Engl J Med</source>. (<year>2011</year>) <volume>365</volume>:<fpage>395</fpage>&#x2013;<lpage>409</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1056/NEJMoa1102873</pub-id>, PMID: <pub-id pub-id-type="pmid">21714641</pub-id></citation></ref>
<ref id="B69">
<label>69</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tan</surname> <given-names>J</given-names>
</name>
<name>
<surname>Taitz</surname> <given-names>J</given-names>
</name>
<name>
<surname>Nanan</surname> <given-names>R</given-names>
</name>
<name>
<surname>Grau</surname> <given-names>G</given-names>
</name>
<name>
<surname>Macia</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Dysbiotic Gut Microbiota-Derived Metabolites and Their Role in Non-Communicable Diseases</article-title>. <source>Int J Mol Sci</source>. (<year>2023</year>) <volume>24</volume>:<elocation-id>15256</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms242015256</pub-id>, PMID: <pub-id pub-id-type="pmid">37894934</pub-id></citation></ref>
<ref id="B70">
<label>70</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fryc</surname> <given-names>J</given-names>
</name>
<name>
<surname>Naumnik</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>Thrombolome and its emerging role in chronic kidney diseases</article-title>. <source>Toxins (Basel)</source>. (<year>2021</year>) <volume>13</volume>:<elocation-id>223</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/toxins13030223</pub-id>, PMID: <pub-id pub-id-type="pmid">33803899</pub-id></citation></ref>
<ref id="B71">
<label>71</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gryp</surname> <given-names>T</given-names>
</name>
<name>
<surname>Vanholder</surname> <given-names>R</given-names>
</name>
<name>
<surname>Vaneechoutte</surname> <given-names>M</given-names>
</name>
<name>
<surname>Glorieux</surname> <given-names>G</given-names>
</name>
</person-group>. <article-title>p-cresyl sulfate</article-title>. <source>Toxins (Basel)</source>. (<year>2017</year>) <volume>9</volume>:<elocation-id>52</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/toxins9020052</pub-id>, PMID: <pub-id pub-id-type="pmid">28146081</pub-id></citation></ref>
<ref id="B72">
<label>72</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Toft</surname> <given-names>PB</given-names>
</name>
<name>
<surname>Vanslette</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Trost</surname> <given-names>K</given-names>
</name>
<name>
<surname>Moritz</surname> <given-names>T</given-names>
</name>
<name>
<surname>Gillum</surname> <given-names>MP</given-names>
</name>
<name>
<surname>Backhed</surname> <given-names>F</given-names>
</name>
<etal/>
</person-group>. <article-title>Microbial metabolite p-cresol inhibits gut hormone expression and regulates small intestinal transit in mice</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2023</year>) <volume>14</volume>:<elocation-id>1200391</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2023.1200391</pub-id>, PMID: <pub-id pub-id-type="pmid">37534214</pub-id></citation></ref>
</ref-list>
</back>
</article>