<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1631265</article-id>
<article-id pub-id-type="doi">10.3389/fmolb.2025.1631265</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Molecular Biosciences</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Using machine learning methods to investigate the role of volatile organic compounds in non-alcoholic fatty liver disease</article-title>
<alt-title alt-title-type="left-running-head">Shen et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fmolb.2025.1631265">10.3389/fmolb.2025.1631265</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Shen</surname>
<given-names>Chih-Hao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/561775/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Huang</surname>
<given-names>Ruei-Hao</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3088171/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Yaw-Kuen</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Chu</surname>
<given-names>Ta-Wei</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1667971/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Pei</surname>
<given-names>Dee</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Division of Pulmonary and Critical Care Medicine</institution>, <institution>Department of Medicine</institution>, <institution>Tri-Service General Hospital</institution>, <institution>National Defense Medical Center</institution>, <addr-line>Taipei</addr-line>, <country>Taiwan</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Center for Emergent Functional Matter Science</institution>, <institution>National Yang Ming Chiao Tung University</institution>, <addr-line>Hsinchu</addr-line>, <country>Taiwan</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Obstetrics and Gynecology</institution>, <institution>Tri-Service General Hospital</institution>, <institution>National Defense Medical Center</institution>, <addr-line>Taipei</addr-line>, <country>Taiwan</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department CEO</institution>, <institution>MJ Health Research Foundation</institution>, <addr-line>Taipei</addr-line>, <country>Taiwan</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Department of Medicine</institution>, <institution>Medical School</institution>, <institution>Fu Jen Catholic University</institution>, <addr-line>New Taipei City</addr-line>, <country>Taiwan</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>Division of Endocrinology and Metabolism</institution>, <institution>Department of Internal Medicine</institution>, <institution>School of Medicine</institution>, <institution>College of Medicine</institution>, <institution>Fu Jen Catholic University Hospital</institution>, <addr-line>New Taipei City</addr-line>, <country>Taiwan</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/987464/overview">Xiaoyan Xing</ext-link>, Chinese Academy of Medical Sciences and Peking Union Medical College, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3081809/overview">Ashwin Dhakal</ext-link>, The University of Missouri, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1876591/overview">Youfu He</ext-link>, Guizhou Provincial People&#x2019;s Hospital, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Yaw-Kuen Li, <email>ykl@nycu.edu.tw</email>; Ta-Wei Chu, <email>taweichu@gmail.com</email>; Dee Pei, <email>peidee@gmail.com</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>06</day>
<month>08</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>12</volume>
<elocation-id>1631265</elocation-id>
<history>
<date date-type="received">
<day>19</day>
<month>05</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>18</day>
<month>06</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Shen, Huang, Li, Chu and Pei.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Shen, Huang, Li, Chu and Pei</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Aims</title>
<p>Approximately 25%&#x2013;30% of the global population is affected by non-alcoholic fatty liver disease (NAFLD). This study aimed to explore whether NAFLD could be effectively detected using 341 volatile organic compounds (VOCs) via 10 machine learning (Mach-L) algorithms in a cohort of 1,501 individuals.</p>
</sec>
<sec>
<title>Methods</title>
<p>Participants were selected from the Taiwan MJ cohort, which includes comprehensive demographic, biochemical, lifestyle, and VOCs data. NAFLD was diagnosed by experienced gastroenterologists. Exhaled breath samples were collected using a 1.0-L aluminum bag (late expiratory fraction) and analyzed with selected-ion flow-tube mass spectrometry. Ten Mach-L techniques were employed to evaluate two predictive models: Model 1 (demographic, lifestyle, and biochemical data), and Model 2 (Model 1 &#x2b; VOCs), assessed using area under the receiver operating characteristic curve (AUC).</p>
</sec>
<sec>
<title>Results</title>
<p>Subjects with NAFLD had significantly higher values for age, BMI, blood pressure, and other biomedical markers, except for eGFR and HDL-C. Key predictors of NAFLD included BMI, triglycerides (TG), uric acid (UA), fasting plasma glucose (FPG), &#x3b3;-GT, gender, LDL-C, and sleep duration. The addition of VOCs to Model 1 improved the AUC from 0.722 &#xb1; 0.149 to 0.770 &#xb1; 0.264 (p &#x3c; 0.001). Ten VOCs were identified as the most influential, in order of importance: 2-propanol, acetone, butyl 2-methylbutanoate, diethylethanolamine, urethane, &#x3b2;-caryophyllene, furfural, tridecane, 4-methyloctanoic acid, and (S)-2-methyl-1-butanol.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>Incorporating VOCs into traditional demographic, biochemical, and lifestyle data significantly enhanced the model&#x2019;s predictive performance. This suggests that VOCs may be associated with the underlying pathophysiology of NAFLD.</p>
</sec>
</abstract>
<kwd-group>
<kwd>Volatile Organic Compounds</kwd>
<kwd>non-alcoholic fatty liver</kwd>
<kwd>machine learning</kwd>
<kwd>AI</kwd>
<kwd>cohort</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Molecular Diagnostics and Therapeutics</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Non-alcoholic fatty liver disease (NAFLD) is defined as the presence of macrovesicular steatosis in more than 5% of hepatocytes without other identifiable causes, such as alcohol consumption or medication use. NAFLD progresses from simple steatosis to non-alcoholic steatohepatitis, fibrosis, and eventually cirrhosis, making it one of the leading causes of chronic liver disease worldwide (<xref ref-type="bibr" rid="B95">Younossi et al., 2016</xref>; <xref ref-type="bibr" rid="B30">Ghevariya et al., 2014</xref>). The global prevalence of NAFLD has increased from 15% in 2005 to 25%&#x2013;30% in 2023, reflecting the global rise in obesity rates (<xref ref-type="bibr" rid="B66">Quek et al., 2023</xref>). In Taiwan, a similar trend has been observed, with two studies estimating that 11.4%&#x2013;41% of the general population may be affected by NAFLD (<xref ref-type="bibr" rid="B12">Chen et al., 2006</xref>; <xref ref-type="bibr" rid="B45">Lin et al., 2005</xref>). Consequently, early detection and prevention of NAFLD have become key priorities for healthcare providers and policymakers.</p>
<p>Traditionally, multiple logistic regression (MLR) has been used to analyze the relationship between risk factors and disease outcomes in medical research. The performance of MLR models is commonly evaluated using the area under the receiver operating characteristic curve (AUC). Recently, machine learning (Mach-L)&#x2014;a branch of artificial intelligence that allows algorithms to learn from past data without explicit programming&#x2014;has emerged as a competitive and often superior approach to MLR (<xref ref-type="bibr" rid="B52">Marateb et al., 2014</xref>; <xref ref-type="bibr" rid="B94">Ye et al., 2020</xref>; <xref ref-type="bibr" rid="B60">Nusinovici et al., 2020</xref>). Unlike MLR, Mach-L can model complex, nonlinear interactions among multiple variables, making it more suitable for disease prediction tasks (<xref ref-type="bibr" rid="B56">Miller and Brown, 2018</xref>). Mach-L in the medical field involves using computer algorithms to analyze large amounts of healthcare data, helping with tasks. These tools can detect patterns in medical images, electronic health records, and other data faster and often more accurately than humans, leading to earlier diagnoses, better patient care, and more efficient healthcare delivery (<xref ref-type="bibr" rid="B4">Arkoudis and Papadakos, 2025</xref>).</p>
<p>For over five decades, researchers have shown increasing interest in volatile organic compounds (VOCs) emitted from the human body. In 1971, Nobel laureate Linus Pauling reported that human breath contains approximately 250 VOCs (<xref ref-type="bibr" rid="B50">Machado and Cortez-Pinto, 2014</xref>). Later, in 1999, <xref ref-type="bibr" rid="B54">Maurice and Manousou (2018)</xref> identified more than 3,400 VOCs in exhaled breath. Alterations in VOC concentrations can reflect disease states, such as cancer (<xref ref-type="bibr" rid="B89">Wei et al., 2020</xref>). As a result, breath-derived VOCs have been proposed as biomarkers for detecting metabolic changes associated with various diseases. There have been studies investigated the relationships between VOCs and NAFLD in the past. However, most of these studies focused on how VOCs affect or damage liver. The proposed mechanisms included metabolic dysregulation, oxidative stress, and cell death (<xref ref-type="bibr" rid="B44">Lang and Beier, 2018</xref>; <xref ref-type="bibr" rid="B47">Liu et al., 2023</xref>; <xref ref-type="bibr" rid="B24">Duan et al., 2025</xref>). Their goals were different from the present study. Analytical techniques like gas chromatography-mass spectrometry (GC-MS) have confirmed these associations in numerous studies (<xref ref-type="bibr" rid="B74">Samudrala et al., 2014</xref>; <xref ref-type="bibr" rid="B53">Markar et al., 2019</xref>; <xref ref-type="bibr" rid="B69">Ratiu et al., 2020</xref>; <xref ref-type="bibr" rid="B39">Keogh and Riches, 2022</xref>; <xref ref-type="bibr" rid="B15">Chung et al., 2022</xref>). However, while many studies have explored VOC-based disease identification, few have utilized Mach-L techniques for VOC profiling (<xref ref-type="bibr" rid="B85">Tsou et al., 2021</xref>; <xref ref-type="bibr" rid="B77">Shaffie et al., 2022</xref>; <xref ref-type="bibr" rid="B80">Sukaram et al., 2023</xref>).</p>
<p>In this study, we employed 10 different Mach-L algorithms to develop predictive models for NAFLD using health examination data combined with exhaled VOC profiles. The performance of these models was compared to evaluate their potential utility in clinical screening for NAFLD. Finally, by applying Shapley addictive explanation to examine the directions and strengths of impacts.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and methods</title>
<p>This study utilized data from the ongoing Taiwan MJ cohort, a prospective cohort collected through health examinations conducted by the MJ Health Screening Centers in Taiwan (<xref ref-type="bibr" rid="B92">Wu et al., 2017</xref>). The dataset includes over 100 essential biological indicators such as anthropometric measurements, blood tests, and imaging tests, among others.</p>
<p>The data were obtained from MJ clinic. At the time of their health checkups, participants provided general consent forms for future anonymous research. This database was maintained by the Interpretation Foundation of MJ Health Research Foundation. All or part of the data used in this study were authorized and provided by the foundation (Authorization Code: MJHRF2022009A). However, it is important to note that all interpretations and conclusions in this study are those of the authors and do not necessarily represent the views of the MJ Health Research Foundation.</p>
<p>The study protocol was reviewed and approved by the Institutional Review Board of National Yang Ming Chiao Tung University, Taiwan (IRB No. NCTU-REC-109-074E). All participants signed a written informed consent form after receiving a thorough explanation of the study&#x2019;s purpose, procedures, and potential risks by trained research assistants. These assistants ensured that all explanations were delivered using clear and understandable language, allowing participants to fully comprehend the study. After ample time for questions and deliberation, participants who provided informed and voluntary consent signed the consent form.</p>
<p>A total of 2,152 participants who underwent both medical ultrasound diagnosis for NAFLD and three sessions of exhaled breath volatile organic compounds (VOCs) collection (a total of 6,363 records) were included initially.</p>
<p>The inclusion criteria are:<list list-type="simple">
<list-item>
<p>1. Subjects between 30-70</p>
</list-item>
<list-item>
<p>2. With data of VOCs</p>
</list-item>
</list>
</p>
<p>Our exclusion criteria are:<list list-type="simple">
<list-item>
<p>1. Having significant medical diseases such as myocardial infarction, stroke, or cancers</p>
</list-item>
<list-item>
<p>2. Having drinking alcohol habit</p>
</list-item>
<list-item>
<p>3. Miss important data such as age, body mass index (BMI) or blood pressure</p>
</list-item>
</list>
</p>
<p>After excluding 651 records due to data loss or specific conditions, the final analysis included 1,501 individuals, as shown in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>The participants selection scheme.</p>
</caption>
<graphic xlink:href="fmolb-12-1631265-g001.tif">
<alt-text content-type="machine-generated">Flowchart depicting data processing of subjects undergoing medical ultrasound for non-alcoholic fatty liver diagnosis. It starts with 2,152 subjects with three breath VOCs measurements averaged. Then, exclusion of 651 incomplete records results in 1,501 subjects with complete information for modeling.</alt-text>
</graphic>
</fig>
<sec id="s2-1">
<title>Clinical assessments and biochemical analyses</title>
<p>Details of obtaining basic parameters such as BMI, blood pressure, collecting blood samples, and questionnaires could be referred to our previous publication.</p>
<sec id="s2-1-1">
<title>Fatty liver diagnosis</title>
<p>The diagnosis of fatty liver was based on ultrasound features, including increased hepatic parenchymal brightness, liver-to-kidney contrast, deep beam attenuation, visible intrahepatic vessels, and gallbladder wall definition. Qualitative grading classified fatty liver into mild, moderate, or severe, corresponding to grades 1 to 3, respectively, with grade 0 representing a normal liver (<xref ref-type="bibr" rid="B51">Mahale et al., 2018</xref>; <xref ref-type="bibr" rid="B18">Dasarathy et al., 2009</xref>). For the purpose of this study, grades 1&#x2013;3 were collectively defined as having fatty liver (NAFLD).</p>
</sec>
<sec id="s2-1-2">
<title>Variable selection</title>
<p>Seventeen clinical variables potentially associated with NAFLD were selected (listed in <xref ref-type="table" rid="T1">Table 1</xref>) as independent variables. NAFLD status (yes/no) was used as the dependent categorical variable.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>The demographic, biochemistry, and volatile organic compounds data of the study cohort.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left"/>
<th align="center">Men</th>
<th align="center">Women</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">N</td>
<td align="center">653</td>
<td align="center">848</td>
</tr>
<tr>
<td align="left">Age (year)</td>
<td align="center">42 &#xb1; 12</td>
<td align="center">46 &#xb1; 12</td>
</tr>
<tr>
<td align="left">Body mass index (kg/m<sup>2</sup>)</td>
<td align="center">21.3 &#xb1; 2.52</td>
<td align="center">24.9 &#xb1; 3.84&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Systolic blood pressure (mmHg)</td>
<td align="center">111.2 &#xb1; 15.9</td>
<td align="center">119.8 &#xb1; 16.9&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Diastolic blood pressure (mmHg)</td>
<td align="center">72.1 &#xb1; 10.3</td>
<td align="center">77.4 &#xb1; 11.1&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Fasting plasma glucose (mg/dL)</td>
<td align="center">96.5 &#xb1; 9.36</td>
<td align="center">104.0 &#xb1; 17.0&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Total bilirubin (mg/dL)</td>
<td align="center">1.09 &#xb1; 0.388</td>
<td align="center">1.04 &#xb1; 0.401&#x2a;</td>
</tr>
<tr>
<td align="left">Albumin (g/dL)</td>
<td align="center">4.40 &#xb1; 0.222</td>
<td align="center">4.43 &#xb1; 0.229&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Alkaline phosphatase (U/L)</td>
<td align="center">56.7 &#xb1; 16.3</td>
<td align="center">64.3 &#xb1; 18.9&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Serum glutamic oxaloacetic transaminase (U/L)</td>
<td align="center">21.4 &#xb1; 6.97</td>
<td align="center">24.7 &#xb1; 14.6&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Serum glutamic pyruvic transaminase (U/L)</td>
<td align="center">20.8 &#xb1; 13.2</td>
<td align="center">32.1 &#xb1; 29.4&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">&#x3b3;-Glutamyl transferase (U/L)</td>
<td align="center">19.5 &#xb1; 14.9</td>
<td align="center">31.6 &#xb1; 33.6&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Estimated glomerular filtration rate (ml/min/1.73 m2)</td>
<td align="center">86.1 &#xb1; 13.2</td>
<td align="center">83.3 &#xb1; 13.7&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Uric acid (mg/dL)</td>
<td align="center">5.17 &#xb1; 1.17</td>
<td align="center">6.02 &#xb1; 1.43&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Triglyceride (mg/dL)</td>
<td align="center">69.1 &#xb1; 33.8</td>
<td align="center">115.6 &#xb1; 74.2&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">High density lipoprotein cholesterol (mg/dL)</td>
<td align="center">58.2 &#xb1; 16.4</td>
<td align="center">57.6 &#xb1; 15.0</td>
</tr>
<tr>
<td align="left">Low density lipoprotein cholesterol (mg/dL)</td>
<td align="center">110.9 &#xb1; 28.7</td>
<td align="center">126.9 &#xb1; 35.3&#x2a;&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Alpha-fetoprotein (ng/mL)</td>
<td align="center">2.78 &#xb1; 1.91</td>
<td align="center">3.05 &#xb1; 1.86&#x2a;&#x2a;</td>
</tr>
<tr>
<td align="left">Beta-caryophyllene (87-44-5)</td>
<td align="center">0.020 &#xb1; 0.148</td>
<td align="center">0.010 &#xb1; 0.102</td>
</tr>
<tr>
<td align="left">Furfural (98-01-1)</td>
<td align="center">5.05 &#xb1; 15.4</td>
<td align="center">4.69 &#xb1; 9.11</td>
</tr>
<tr>
<td align="left">Tridecane (629-50-5)</td>
<td align="center">1.08 &#xb1; 3.62</td>
<td align="center">1.89 &#xb1; 7.48&#x2a;</td>
</tr>
<tr>
<td align="left">Butyl 2-methylbutanoate (15706-73-7)</td>
<td align="center">0.134 &#xb1; 0.521</td>
<td align="center">0.133 &#xb1; 0.683</td>
</tr>
<tr>
<td align="left">Diethylethanolamine (100-37-8)</td>
<td align="center">3.03 &#xb1; 9.19</td>
<td align="center">2.44 &#xb1; 5.72</td>
</tr>
<tr>
<td align="left">4-methyloctanoic acid (54947-74-9)</td>
<td align="center">0.170 &#xb1; 0.743</td>
<td align="center">0.119 &#xb1; 0.735</td>
</tr>
<tr>
<td align="left">(S)-2-methyl-1-butanol (1565-80-6)</td>
<td align="center">4.89 &#xb1; 37.5</td>
<td align="center">3.85 &#xb1; 8.74</td>
</tr>
<tr>
<td align="left">Urethane (51-79-6)</td>
<td align="center">20.7 &#xb1; 64.1</td>
<td align="center">18.2 &#xb1; 29.3</td>
</tr>
<tr>
<td align="left">2-propanol (67-63-0)</td>
<td align="center">71.4 &#xb1; 161.1</td>
<td align="center">61.2 &#xb1; 205.4</td>
</tr>
<tr>
<td align="left">Acetone (67-64-1)</td>
<td align="center">1,221.1 &#xb1; 3,008.5</td>
<td align="center">1,053.7 &#xb1; 4,885.6</td>
</tr>
</tbody>
</table>
<table>
<thead valign="top">
<tr>
<th align="center">Smoking</th>
<th colspan="2" align="center">n (%)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Non-smoker</td>
<td colspan="2" align="center">1140 (75)</td>
</tr>
<tr>
<td align="left">Less than 10 cigarettes/week</td>
<td colspan="2" align="center">59 (3.9)</td>
</tr>
<tr>
<td align="left">10&#x2013;20 cigarettes/week</td>
<td colspan="2" align="center">129 (8.6)</td>
</tr>
<tr>
<td align="left">20 cigarettes/week</td>
<td colspan="2" align="center">54 (3.4)</td>
</tr>
<tr>
<td align="left">More than 20 cigarettes/week</td>
<td colspan="2" align="center">119 (7.6)</td>
</tr>
</tbody>
</table>
<table>
<thead valign="top">
<tr>
<th align="center">Sleeping</th>
<th colspan="2" align="center">n (%)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Less than 6 h/day</td>
<td colspan="2" align="center">17 (4.7)</td>
</tr>
<tr>
<td align="left">6 h/day</td>
<td colspan="2" align="center">375 (25)</td>
</tr>
<tr>
<td align="left">7 h/day</td>
<td colspan="2" align="center">713 (47.5)</td>
</tr>
<tr>
<td align="left">8 h/day</td>
<td colspan="2" align="center">347 (24.9)</td>
</tr>
<tr>
<td align="left">9 h/day</td>
<td colspan="2" align="center">39 (2.6)</td>
</tr>
<tr>
<td align="left">More than 9 h/day</td>
<td colspan="2" align="center">10 (7)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s2-2">
<title>Protocol for breath sample collection</title>
<p>All volunteer participants remained in a designated room under resting conditions for at least 10 min prior to sample collection. To minimize contamination, each participant was asked to rinse their mouth with unchlorinated water before exhaling through a mouthpiece connected to a three-way direct-connect valve.</p>
<p>Initially, exhaled breath passed through the first outlet, which was connected to a gas bag (SKC Inc., Eighty-Four, PA, United States) to estimate the volume of exhaled air. Once the volume of the initial exhalation reached approximately 0.3 L, the valve was switched to the second outlet, which was attached to a 1.0-L aluminum bag. This second bag was used to collect the late expiratory fraction, which is more representative of alveolar air and thus suitable for volatile organic compound (VOC) analysis.</p>
<p>To ensure adequate sample volume for analysis, the collection procedure was repeated two to three times as necessary. All collected breath samples were sealed, stored at room temperature (25&#xb0;C), and analyzed within 48 h.</p>
<p>To validate the stability of VOCs under these storage conditions, a time-dependent analysis was conducted on ten breath samples. Samples were analyzed twice daily over three consecutive days. Comparison of the quantitative VOC data indicated that the majority of compounds remained stable during the storage period.</p>
<sec id="s2-2-1">
<title>VOCs analysis using SIFT-MS</title>
<p>A selected-ion flow-tube mass spectrometry system (SIFT-MS; VOICE200 Ultra, Syft Technologies, Christchurch, New Zealand) was employed to analyze volatile organic compounds (VOCs) in the collected late expiratory breath fraction. It is a quantitative mass spectrometry technique used for real-time analysis of trace volatile compounds, especially volatile organic compounds (VOCs), in air, breath, or headspace above liquids without the need for sample preparation or chromatographic separation (<xref ref-type="bibr" rid="B79">&#x160;pan&#x11b;l and Smith, 2020</xref>).</p>
<p>In this method, selected precursor ions (H<sub>3</sub>O<sup>&#x2b;</sup>, NO<sup>&#x2b;</sup>, and O<sub>2</sub>
<sup>&#x2b;</sup>) are injected into a nitrogen carrier gas within the flow tube. When breath samples are introduced, VOCs present in the sample undergo ionization, resulting in the formation of characteristic product ions. These product ions are detected by a quadrupole mass spectrometer, which measures the count rates of both precursor and product ions in real time.</p>
<p>For VOCs with significant product ion overlap that could not be resolved using the tolerance setting, concentrations were reported on a relative scale. Statistical models were constructed based on both absolute concentrations and these relative measures to ensure robustness in VOC profiling and interpretation.</p>
<p>To assure the reproducibility and data reliability we standardized and calibrated with the following methods:<list list-type="simple">
<list-item>
<p>1. Traceable reference materials: Use primary standards (e.g., NIST-traceable mixtures) for instrument calibration and secondary/working standards for routine checks (<xref ref-type="bibr" rid="B72">RI-URBANS, 2024</xref>; <xref ref-type="bibr" rid="B25">Dusanter et al., 2025</xref>).</p>
</list-item>
<list-item>
<p>2. Matrix modifiers: Add salt solutions (e.g., NaCl) to normalize partitioning behavior of VOCs in complex samples, reducing bias from dissolved solutes or organic components (<xref ref-type="bibr" rid="B87">U.S. Environmental Protection Agency, 2014</xref>; <xref ref-type="bibr" rid="B27">Final Report, 2012</xref>).</p>
</list-item>
<list-item>
<p>3. Dynamic calibration: For instruments like PTR-MS, use gas standards with known VOC concentrations and proton transfer rate constants to calculate normalized sensitivities (<xref ref-type="bibr" rid="B25">Dusanter et al., 2025</xref>).</p>
</list-item>
</list>
</p>
</sec>
</sec>
<sec id="s2-3">
<title>Machine learning-based analysis technology</title>
<p>While numerous studies have explored the application of VOC measurements for disease identification (<xref ref-type="bibr" rid="B69">Ratiu et al., 2020</xref>; <xref ref-type="bibr" rid="B39">Keogh and Riches, 2022</xref>; <xref ref-type="bibr" rid="B15">Chung et al., 2022</xref>), relatively few have focused on utilizing Mach-L techniques specifically for VOC profiling (<xref ref-type="bibr" rid="B85">Tsou et al., 2021</xref>; <xref ref-type="bibr" rid="B77">Shaffie et al., 2022</xref>; <xref ref-type="bibr" rid="B80">Sukaram et al., 2023</xref>). In this study, we employed ten distinct Mach-L algorithms to construct predictive models for diagnosing non-alcoholic fatty liver disease (NAFLD) based on VOCs collected from exhaled breath. To assess the impact of VOCs, models were developed both with and without VOC data, and their predictive performances were compared.</p>
<p>The ten machine learning techniques applied are as follows:<list list-type="simple">
<list-item>
<p>&#x2022;Random Forest (RF): An ensemble learning method utilizing multiple unpruned decision trees for classification (<xref ref-type="bibr" rid="B7">Breiman, 2001</xref>).</p>
</list-item>
<list-item>
<p>&#x2022; C5.0 Decision Trees (C5.0): A rule-based model using entropy, information gain, and gain ratio for decision tree construction (<xref ref-type="bibr" rid="B67">Quinlan, 2004</xref>).</p>
</list-item>
<list-item>
<p>&#x2022;Stochastic Gradient Boosting (SGB): Combines bagging and boosting to construct additive regression tree models (<xref ref-type="bibr" rid="B29">Friedman, 2001</xref>).</p>
</list-item>
<list-item>
<p>&#x2022;Multivariate Adaptive Regression Splines (MARS): A non-parametric regression technique using piecewise polynomial functions (<xref ref-type="bibr" rid="B28">Friedman, 1991</xref>).</p>
</list-item>
<list-item>
<p>&#x2022;Classification and Regression Tree (CART): A decision tree model built using Gini impurity for splitting nodes (<xref ref-type="bibr" rid="B8">Breiman et al., 1984</xref>).</p>
</list-item>
<list-item>
<p>&#x2022;Least Absolute Shrinkage and Selection Operator (Lasso): A linear model applying L1 regularization to perform feature selection (<xref ref-type="bibr" rid="B34">Hastie et al., 2015</xref>).</p>
</list-item>
<list-item>
<p>&#x2022;Ridge Regression (Ridge): Similar to Lasso but uses L2 regularization for coefficient shrinkage (<xref ref-type="bibr" rid="B35">Hoerl and Kennard, 2000</xref>).</p>
</list-item>
<list-item>
<p>&#x2022;Extreme Gradient Boosting (XGBoost): An optimized gradient boosting algorithm designed for speed and performance (<xref ref-type="bibr" rid="B55">Meng et al., 2016</xref>).</p>
</list-item>
<list-item>
<p>&#x2022;Gradient Boosting with Categorical Features (CatBoost): A boosting technique optimized for categorical features using an ordered boosting method (<xref ref-type="bibr" rid="B23">Dorogush et al., 2018</xref>).</p>
</list-item>
<list-item>
<p>&#x2022;Light Gradient Boosting Machine (LightGBM): A fast, histogram-based gradient boosting algorithm designed for efficiency and scalability (<xref ref-type="bibr" rid="B38">Ke et al., 2017</xref>).</p>
</list-item>
</list>
</p>
<p>Although Mach-L algorithms are capable of identifying key predictor variables, relying on a single method may lead to suboptimal and biased feature selection. To overcome this limitation, variable ensemble strategies are often employed, which integrate the outputs from multiple algorithms. Prior research indicates that such ensemble approaches enhance variable selection robustness, reducing both bias and variance (<xref ref-type="bibr" rid="B61">Pes, 2020</xref>; <xref ref-type="bibr" rid="B57">Moghimi et al., 2018</xref>; <xref ref-type="bibr" rid="B86">Tuli et al., 2019</xref>).</p>
<p>In this study, the variable importance values generated by each Mach-L model were averaged. The top 10 VOCs, ranked by average importance across all models, were selected for further discussion.</p>
<p>All analyses were conducted using the R programming language (version 4.1.2, R Core Team, Vienna, Austria) and RStudio (version 1.1.453) (<xref ref-type="bibr" rid="B70">R Core Team, 2017</xref>; <xref ref-type="bibr" rid="B73">RStudio Team, 2015</xref>). The following R packages were employed for model development: random Forest, C50, gbm, RWeka, kernlab, earth, rpart, glmnet, XGBoost, LightGBM, and cat boost. Heatmaps were visualized using the pheatmap package (version 2.6.2) (<xref ref-type="bibr" rid="B9">Browne, 2000</xref>; <xref ref-type="bibr" rid="B32">Gu, 2022</xref>).</p>
<p>To train and evaluate each Mach-L model, an 80/20 train-test split was used. The training set (80%) was used to construct models, while the testing set (20%) evaluated predictive performance. Hyperparameter tuning was conducted using 10-fold cross-validation (CV) to ensure optimal performance for each algorithm. The final model for each method was selected based on the best-performing configuration. Cross-validation procedures were executed using the caret package (version 6.0-93) (<xref ref-type="bibr" rid="B41">Kuhn, 2022</xref>).</p>
<p>In order to understand the directions and impacts of the variables, XGboost SHAP was applied using the following Python packages: SHAP, the core package for computing and visualizing SHAP values, provides interpretability for model predictions and feature importance. Pandas, a powerful library for data manipulation and preprocessing, was used to manage datasets, clean data, and prepare inputs for SHAP analysis. NumPy, a fundamental package for numerical computations, supported array operations and numerical calculations required by SHAP. Matplotlib, a plotting library for creating static, interactive, and animated visualizations, was employed to generate SHAP plots, including summary plots, bar plots, and waterfall plots.te feature contributions to specific predictions.</p>
</sec>
<sec id="s2-4">
<title>Performance evaluation metrics</title>
<p>To comprehensively evaluate the predictive performance of the Mach-L, we employed a range of widely accepted performance measures, as recommended in previous studies (<xref ref-type="bibr" rid="B21">Dias Canedo and Cordeiro Mendes, 2020</xref>; <xref ref-type="bibr" rid="B37">Hussain et al., 2021</xref>; <xref ref-type="bibr" rid="B84">Tomer and Sharma, 2022</xref>). Specifically, the following metrics were utilized in our analysis: accuracy (ACC), sensitivity (Sens), and specificity (Spec). These metrics provide an overall understanding of the model&#x2019;s classification capabilities.</p>
<p>However, when dealing with imbalanced datasets, traditional metrics such as ACC, Sens, and Spec can be misleading, as they tend to be disproportionately influenced by the majority class distribution. To mitigate this issue, we additionally calculated balanced accuracy (BA) and area under the receiver operating characteristic curve (AUC)&#x2014;both of which are considered more robust and reliable indicators for evaluating model performance under class imbalance conditions (<xref ref-type="bibr" rid="B22">di Biase et al., 2020</xref>; <xref ref-type="bibr" rid="B33">Hashim et al., 2021</xref>).<list list-type="simple">
<list-item>
<p>&#x2022;Balanced Accuracy (BA) accounts for imbalanced data by averaging sensitivity and specificity.</p>
</list-item>
<list-item>
<p>&#x2022;AUC provides a threshold-independent measure of a model&#x2019;s ability to distinguish between classes.</p>
</list-item>
</list>
</p>
<p>The definitions and formulas for all performance metrics used in this study are detailed in (<xref ref-type="bibr" rid="B81">Tharwat, 2021</xref>).</p>
<p>To assess the impact of volatile organic compounds (VOCs) on model performance, we compared each Mach-L model&#x2019;s predictive ability with and without VOC features. We applied DeLong&#x2019;s test for pairwise comparison of AUC values between these two scenarios across all models (<xref ref-type="bibr" rid="B20">DeLong et al., 1988</xref>), allowing for a statistically grounded evaluation of VOCs&#x2019; contribution to predictive improvement.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<p>A total of 1,501 participants were included in the present study. <xref ref-type="table" rid="T1">Table 1</xref> presents the demographic and clinical characteristics of the participants, stratified by the presence or absence of non-alcoholic fatty liver disease (NAFLD).</p>
<p>As expected, participants diagnosed with NAFLD exhibited significantly higher values across several variables, including age, body mass index (BMI), blood pressure, and various biochemical markers, compared to those without NAFLD. The only exceptions were estimated glomerular filtration rate (eGFR) and high-density lipoprotein cholesterol (HDL-C), which did not follow the same trend.</p>
<p>Among all examined variables, the most influential predictors for identifying NAFLD were found to be: BMI, Triglycerides (TG), Uric acid (UA), Fasting plasma glucose (FPG), Gamma-glutamyl transferase (GGT), Gender, Low-density lipoprotein cholesterol (LDL-C) and Sleeping hours.</p>
<p>In parallel, VOC profiling using 10 different machine learning (Mach-L) techniques identified 10 key VOCs as significant predictors for NAFLD. Ranked from most to least important, these compounds are: 2-Propanol, Acetone, Butyl 2-methylbutanoate, Diethylethanolamine, Urethane, &#x3b2; -Caryophyllene, Furfural, Tridecane, 4-Methyloctanoic acid and (S)-2-Methyl-1-butanol.</p>
<p>
<xref ref-type="table" rid="T2">Table 2</xref> displays the comparative concentrations of these 10 VOCs in subjects with and without NAFLD, along with their corresponding rankings based on variable importance across the Mach-L models.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>t-test comparing volatile organic compounds in subjects with and without NAFLD.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Characteristic (mean &#xb1; SD)</th>
<th align="center">NAFLD</th>
<th align="center">Control groups</th>
<th align="center">P value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">n (%)</td>
<td align="center">848 (56.50%)</td>
<td align="center">653 (43.50%)</td>
<td align="left"/>
</tr>
<tr>
<td align="left">2-propanol</td>
<td align="center">61.28 &#xb1; 205.46</td>
<td align="left">71.42 &#xb1; 161.10</td>
<td align="center">0.284</td>
</tr>
<tr>
<td align="left">Acetone</td>
<td align="center">1053.72 &#xb1; 4885.64</td>
<td align="left">1221.07 &#xb1; 3008.48</td>
<td align="center">0.414</td>
</tr>
<tr>
<td align="left">butyl 2-methylbutanoate</td>
<td align="center">0.13 &#xb1; 0.68</td>
<td align="left">0.13 &#xb1; 0.52</td>
<td align="center">0.955</td>
</tr>
<tr>
<td align="left">diethylethanolamine</td>
<td align="center">2.45 &#xb1; 5.73</td>
<td align="left">3.03 &#xb1; 9.20</td>
<td align="center">0.158</td>
</tr>
<tr>
<td align="left">urethane</td>
<td align="center">18.24 &#xb1; 29.31</td>
<td align="left">20.72 &#xb1; 64.05</td>
<td align="center">0.360</td>
</tr>
<tr>
<td align="left">beta-caryophyllene</td>
<td align="center">0.01 &#xb1; 0.10</td>
<td align="left">0.02 &#xb1; 0.15</td>
<td align="center">0.296</td>
</tr>
<tr>
<td align="left">furfural</td>
<td align="center">4.69 &#xb1; 9.11</td>
<td align="left">5.05 &#xb1; 15.38</td>
<td align="center">0.599</td>
</tr>
<tr>
<td align="left">tridecane</td>
<td align="center">1.89 &#xb1; 7.48</td>
<td align="left">1.08 &#xb1; 3.62</td>
<td align="center">0.006</td>
</tr>
<tr>
<td align="left">4-methyloctanoic acid</td>
<td align="center">0.12 &#xb1; 0.74</td>
<td align="left">0.17 &#xb1; 0.74</td>
<td align="center">0.190</td>
</tr>
<tr>
<td align="left">(S)-2-methyl-1-butanol</td>
<td align="center">3.85 &#xb1; 8.75</td>
<td align="left">4.90 &#xb1; 37.47</td>
<td align="center">0.485</td>
</tr>
<tr>
<td align="left">methanamide</td>
<td align="center">10.32 &#xb1; 16.59</td>
<td align="left">12.21 &#xb1; 74.70</td>
<td align="center">0.528</td>
</tr>
<tr>
<td align="left">1-nonene</td>
<td align="center">6.51 &#xb1; 16.03</td>
<td align="left">5.23 &#xb1; 8.66</td>
<td align="center">0.049</td>
</tr>
<tr>
<td align="left">isobutane</td>
<td align="center">160.08 &#xb1; 392.34</td>
<td align="left">165.93 &#xb1; 510.95</td>
<td align="center">0.808</td>
</tr>
<tr>
<td align="left">trimethylamine</td>
<td align="center">87.84 &#xb1; 306.13</td>
<td align="left">104.05 &#xb1; 242.21</td>
<td align="center">0.252</td>
</tr>
<tr>
<td align="left">6-methyl-5-hepten-2-one</td>
<td align="center">1.92 &#xb1; 2.50</td>
<td align="left">1.93 &#xb1; 3.19</td>
<td align="center">0.911</td>
</tr>
<tr>
<td align="left">pyridine</td>
<td align="center">1.60 &#xb1; 2.75</td>
<td align="left">1.49 &#xb1; 2.51</td>
<td align="center">0.414</td>
</tr>
<tr>
<td align="left">benzoic acid</td>
<td align="center">0.06 &#xb1; 0.22</td>
<td align="left">0.08 &#xb1; 0.28</td>
<td align="center">0.129</td>
</tr>
<tr>
<td align="left">3-buten-2-one</td>
<td align="center">14.13 &#xb1; 27.59</td>
<td align="left">15.42 &#xb1; 55.93</td>
<td align="center">0.587</td>
</tr>
<tr>
<td align="left">propyl acetate</td>
<td align="center">10.98 &#xb1; 14.32</td>
<td align="left">15.81 &#xb1; 116.80</td>
<td align="center">0.293</td>
</tr>
<tr>
<td align="left">propyne</td>
<td align="center">0.97 &#xb1; 3.55</td>
<td align="left">0.68 &#xb1; 1.77</td>
<td align="center">0.035</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Data are presented as means &#xb1; standard deviation (SD) or numbers (%) as in the case; P values of excess statistically significant are from the t-test comparing subjects with and without NAFLD. All the statistical tests of independence were two-sided. Abbreviations: NAFLD, non-alcoholic fatty liver disease.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<sec id="s3-1">
<title>Model performance evaluation</title>
<p>The predictive performance of all 10 machine learning (Mach-L) methods is summarized in <xref ref-type="table" rid="T3">Table 3</xref>. Across all methods, Model 2&#x2014;which incorporated volatile organic compounds (VOCs)&#x2014;demonstrated superior performance compared to Model 1, which only included demographic, biochemical, and lifestyle variables. Specifically, accuracy (ACC), sensitivity (Sens), specificity (Spec), BA, and AUC were all improved in Model 2.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Results of machine learning in Model 1 (without VOCs) and Model 2 (with VOCs).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="center">Methods</th>
<th colspan="2" align="center">ACC</th>
<th colspan="2" align="center">Sens</th>
<th colspan="2" align="center">Spec</th>
<th colspan="2" align="center">AUC</th>
<th colspan="2" align="center">BA</th>
</tr>
<tr>
<th align="center">Model<break/>1</th>
<th align="center">Model<break/>2</th>
<th align="center">Model<break/>1</th>
<th align="center">Model<break/>2</th>
<th align="center">Model 1</th>
<th align="center">Model 2</th>
<th align="center">Model 1</th>
<th align="center">Model<break/>2</th>
<th align="center">Model<break/>1</th>
<th align="center">Model 2</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">RF</td>
<td align="center">0.734</td>
<td align="center">0.777</td>
<td align="center">0.639</td>
<td align="center">0.858</td>
<td align="center">0.799</td>
<td align="center">0.713</td>
<td align="center">0.777</td>
<td align="center">0.848</td>
<td align="center">0.719</td>
<td align="center">0.785</td>
</tr>
<tr>
<td align="left">C5.0</td>
<td align="center">0.691</td>
<td align="center">0.688</td>
<td align="center">0.762</td>
<td align="center">0.843</td>
<td align="center">0.643</td>
<td align="center">0.563</td>
<td align="center">0.683</td>
<td align="center">0.765</td>
<td align="center">0.702</td>
<td align="center">0.703</td>
</tr>
<tr>
<td align="left">SGB</td>
<td align="center">0.718</td>
<td align="center">0.784</td>
<td align="center">0.705</td>
<td align="center">0.769</td>
<td align="center">0.726</td>
<td align="center">0.796</td>
<td align="center">0.773</td>
<td align="center">0.854</td>
<td align="center">0.716</td>
<td align="center">0.783</td>
</tr>
<tr>
<td align="left">MARS</td>
<td align="center">0.731</td>
<td align="center">0.781</td>
<td align="center">0.680</td>
<td align="center">0.769</td>
<td align="center">0.765</td>
<td align="center">0.790</td>
<td align="center">0.768</td>
<td align="center">0.846</td>
<td align="center">0.723</td>
<td align="center">0.780</td>
</tr>
<tr>
<td align="left">CART</td>
<td align="center">0.714</td>
<td align="center">0.781</td>
<td align="center">0.598</td>
<td align="center">0.716</td>
<td align="center">0.793</td>
<td align="center">0.832</td>
<td align="center">0.696</td>
<td align="center">0.781</td>
<td align="center">0.696</td>
<td align="center">0.774</td>
</tr>
<tr>
<td align="left">Lasso</td>
<td align="center">0.718</td>
<td align="center">0.787</td>
<td align="center">0.689</td>
<td align="center">0.754</td>
<td align="center">0.737</td>
<td align="center">0.814</td>
<td align="center">0.768</td>
<td align="center">0.866</td>
<td align="center">0.713</td>
<td align="center">0.784</td>
</tr>
<tr>
<td align="left">Ridge</td>
<td align="center">0.741</td>
<td align="center">0.744</td>
<td align="center">0.631</td>
<td align="center">0.881</td>
<td align="center">0.816</td>
<td align="center">0.635</td>
<td align="center">0.780</td>
<td align="center">0.832</td>
<td align="center">0.723</td>
<td align="center">0.758</td>
</tr>
<tr>
<td align="left">XGBoost</td>
<td align="center">0.688</td>
<td align="center">0.791</td>
<td align="center">0.885</td>
<td align="center">0.828</td>
<td align="center">0.553</td>
<td align="center">0.761</td>
<td align="center">0.784</td>
<td align="center">0.861</td>
<td align="center">0.719</td>
<td align="center">0.794</td>
</tr>
<tr>
<td align="left">CatBoost</td>
<td align="center">0.744</td>
<td align="center">0.787</td>
<td align="center">0.697</td>
<td align="center">0.769</td>
<td align="center">0.777</td>
<td align="center">0.802</td>
<td align="center">0.779</td>
<td align="center">0.860</td>
<td align="center">0.737</td>
<td align="center">0.786</td>
</tr>
<tr>
<td align="left">LightGBM</td>
<td align="center">0.761</td>
<td align="center">0.787</td>
<td align="center">0.697</td>
<td align="center">0.866</td>
<td align="center">0.805</td>
<td align="center">0.725</td>
<td align="center">0.792</td>
<td align="center">0.860</td>
<td align="center">0.751</td>
<td align="center">0.795</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>VOC, volatile organic compound; ACC, accuracy; Sens, sensitivity; Spec, specificity; AUC, area under curve; BA, balanced accuracy; Model 1, without VOCs; Model 2, with VOCs; RF, random forest; C5.0, C5.0 decision trees; SGB, stochastic gradient boosting; MARS, multivariate adaptive regression splines; CART, classification and regression tree; Lasso, least absolute shrinkage and selection operator; Ridge, ridge regression; XGBoost, extreme gradient boosting; CatBoost, gradient boosting with categorical features support; LightGBM, light gradient boosting machine.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>These findings suggest that the inclusion of VOCs significantly enhanced the predictive accuracy of the models in identifying individuals with NAFLD. The confusion matrices for Models 1 and 2 are presented in <xref ref-type="fig" rid="F2">Figure 2</xref>, while <xref ref-type="fig" rid="F3">Figure 3</xref> illustrates the respective AUC curves for each model. Additionally, the heatmap of the top 10 VOCs identified across the Mach-L algorithms is shown in <xref ref-type="fig" rid="F4">Figure 4</xref>, highlighting their relative importance in the classification task.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>The Confusion matrix of Model 1 and 2 for each machine learning methods. Model 1, without VOCs; Model 2, with VOCs; RF, random forest; C5.0, C5.0 decision trees; SGB, stochastic gradient boosting; MARS, multivariate adaptive regression splines; CART, classification and regression tree; Lasso, least absolute shrinkage and selection operator; Ridge, ridge regression; XGBoost, extreme gradient boosting; CatBoost, gradient boosting with categorical features support; LightGBM, light gradient boosting machine. <bold>(a)</bold> Model 1 o RF. <bold>(b)</bold> Model 2 o RF. <bold>(c)</bold> Model 1 of C5.0. <bold>(d)</bold> Model 2 of C5.0. <bold>(e)</bold> Model 1 of SGB. <bold>(f)</bold> Model 2 of SGB. <bold>(g)</bold> Model 1 of MARS. <bold>(h)</bold> Model 2 of MARS. <bold>(i)</bold> Model 1 of CART. <bold>(j)</bold> Model 2 of CART. <bold>(k)</bold> Model 1 of Lasso. <bold>(l)</bold> Model 2 of Lasso. <bold>(m)</bold> Model 1 of Ridge. <bold>(n)</bold> Model 2 of Ridge. <bold>(o)</bold> Model 1 of XGBoost. <bold>(p)</bold> Model 2 of XGBoost. <bold>(q)</bold> Model 1 of CatBoost. <bold>(r)</bold> Model 2 of CatBoost. <bold>(s)</bold> Model 1 of LightGBM. <bold>(t)</bold> Model 2 of LightGBM.</p>
</caption>
<graphic xlink:href="fmolb-12-1631265-g002.tif">
<alt-text content-type="machine-generated">Confusion matrices compare two models (Model 1 and model 2) for different algorithms (RF, C5.0, SGB, MARS, CART, Lasso, Ridge,XGBoost, CatBoost, and LightGBM). Each matrix shows true positives, false positives, true negatives, and false negatives for analysis.</alt-text>
</graphic>
</fig>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>The area under receiver operation curve in model 1 and 2 for all the machine learning methods. Model 1, without VOCs; Model 2, with VOCs; RF, random forest; C5.0, C5.0 decision trees; SGB, stochastic gradient boosting; MARS, multivariate adaptive regression splines; CART, classification and regression tree; Lasso, least absolute shrinkage and selection operator; Ridge, ridge regression; XGBoost, extreme gradient boosting; CatBoost, gradient boosting with categorical features support; LightGBM, light gradient boosting machine.</p>
</caption>
<graphic xlink:href="fmolb-12-1631265-g003.tif">
<alt-text content-type="machine-generated">Two ROC curve plots comparing model performance are shown. Model 1 includes several algorithms with their AUC values, such as RF (0.777), C5.0 (0.683), and XGBoost (0.784). Model 2 displays similar algorithms with AUC values, including RF (0.848), C5.0 (0.765), and XGBoost (0.861). Each plot assesses sensitivity versus one minus specificity.</alt-text>
</graphic>
</fig>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Heatmap of the top 10 volatile organic compounds identified across the machine learning methods.</p>
</caption>
<graphic xlink:href="fmolb-12-1631265-g004.tif">
<alt-text content-type="machine-generated">Heatmap displaying hierarchical clustering of various biomarkers such as albumin, uric acid, and body mass index, among others. Color gradients represent Row Z-Scores, ranging from 0 to 0.8. Additional categories include sleeping hours, gender, and NAFLD status, with corresponding color codes.</alt-text>
</graphic>
</fig>
<p>
<xref ref-type="table" rid="T4">Table 4</xref> presents the pairwise comparisons of AUC values for the 10 Mach-L methods, evaluating the improvement in predictive performance with the inclusion of VOCs compared to models without VOCs. The results indicate that for all methods, the inclusion of VOCs led to a statistically significant improvement in model performance, as evidenced by p-values less than 0.05 across all comparisons. These findings suggest that incorporating VOC data into the Mach-L models for NAFLD diagnosis results in significantly enhanced predictive accuracy compared to models that exclude VOCs.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Pairwise comparisons of the area under curve values between in Model 1 (without VOCs) and Model 2 (with VOCs) using DeLong&#x2019;s test.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Methods</th>
<th align="center">Model 1</th>
<th align="center">Model 2</th>
<th align="center">Difference Model 1 and Model 2</th>
<th align="center">
<italic>p</italic>-value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">RF</td>
<td align="center">0.777</td>
<td align="center">0.848</td>
<td align="center">7.10%</td>
<td align="center">&#x2212;2.050 (0.040)</td>
</tr>
<tr>
<td align="left">C5.0</td>
<td align="center">0.683</td>
<td align="center">0.765</td>
<td align="center">8.20%</td>
<td align="center">&#x2212;1.988 (0.047)</td>
</tr>
<tr>
<td align="left">SGB</td>
<td align="center">0.773</td>
<td align="center">0.854</td>
<td align="center">8.10%</td>
<td align="center">&#x2212;2.384 (0.017)</td>
</tr>
<tr>
<td align="left">MARS</td>
<td align="center">0.768</td>
<td align="center">0.846</td>
<td align="center">7.80%</td>
<td align="center">&#x2212;2.159 (0.031)</td>
</tr>
<tr>
<td align="left">CART</td>
<td align="center">0.696</td>
<td align="center">0.781</td>
<td align="center">8.50%</td>
<td align="center">&#x2212;2.304 (0.021)</td>
</tr>
<tr>
<td align="left">Lasso</td>
<td align="center">0.768</td>
<td align="center">0.866</td>
<td align="center">9.80%</td>
<td align="center">&#x2212;2.846 (0.004)</td>
</tr>
<tr>
<td align="left">Ridge</td>
<td align="center">0.780</td>
<td align="center">0.832</td>
<td align="center">5.20%</td>
<td align="center">&#x2212;1.471 (0.041)</td>
</tr>
<tr>
<td align="left">XGBoost</td>
<td align="center">0.784</td>
<td align="center">0.861</td>
<td align="center">7.70%</td>
<td align="center">&#x2212;2.278 (0.023)</td>
</tr>
<tr>
<td align="left">CatBoost</td>
<td align="center">0.779</td>
<td align="center">0.860</td>
<td align="center">8.10%</td>
<td align="center">&#x2212;2.403 (0.016)</td>
</tr>
<tr>
<td align="left">LightGBM</td>
<td align="center">0.792</td>
<td align="center">0.860</td>
<td align="center">6.80%</td>
<td align="center">&#x2212;2.014 (0.044)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>VOC, volatile organic compound; Model 1, without VOCs; Model 2, with VOCs. The numbers in table are the corresponding p-values. <italic>p</italic> &#x3c; 0.05 was considered statistically significant.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>
<xref ref-type="table" rid="T5">Table 5</xref> displays the most important predictive factors identified by the Mach-L methods, encompassing demographic, biochemical, lifestyle, and VOC-related variables. In total, 25 factors were selected, including the top 10 VOCs. Among the non-VOC variables, BMI emerged as the most influential predictor, followed by triglycerides (TG), uric acid (UA), fasting plasma glucose (FPG), &#x3b3; -glutamyl transferase (&#x3b3; -GT), gender, GPT, LDL-cholesterol, sleep duration, albumin, total bilirubin, alkaline phosphatase, GOT, HDL-cholesterol, and diastolic blood pressure (DBP). Notably, beginning from the 10th rank in overall importance, 2-propanol was the first VOC to appear. The complete list of VOCs identified is detailed in the Methods section.</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>The variables selected and the mean and rank of important values by ten machine learning methods.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Variables</th>
<th align="center">RF</th>
<th align="center">C5.0</th>
<th align="center">SGB</th>
<th align="center">MARS</th>
<th align="center">CART</th>
<th align="center">Lasso</th>
<th align="center">Ridge</th>
<th align="center">XGBoost</th>
<th align="center">Catboost</th>
<th align="center">LightGBM</th>
<th align="center">Mean</th>
<th align="center">ROI</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Body mass index (kg/m<sup>2</sup>)</td>
<td align="center">100</td>
<td align="center">100</td>
<td align="center">100</td>
<td align="center">100</td>
<td align="center">100</td>
<td align="center">100</td>
<td align="center">100</td>
<td align="center">100</td>
<td align="center">100</td>
<td align="center">100</td>
<td align="center">100.00</td>
<td align="center">1</td>
</tr>
<tr>
<td align="left">Triglyceride (mg/dL)</td>
<td align="center">53.56</td>
<td align="center">100</td>
<td align="center">46.48</td>
<td align="center">52.75</td>
<td align="center">87.96</td>
<td align="center">3.34</td>
<td align="center">2.8</td>
<td align="center">52.45</td>
<td align="center">64.16</td>
<td align="center">33.9</td>
<td align="center">49.74</td>
<td align="center">2</td>
</tr>
<tr>
<td align="left">Uric acid (mg/dL)</td>
<td align="center">7.06</td>
<td align="center">32.42</td>
<td align="center">2.27</td>
<td align="center">30.95</td>
<td align="center">39.63</td>
<td align="center">22.12</td>
<td align="center">80</td>
<td align="center">0</td>
<td align="center">1.43</td>
<td align="center">4.42</td>
<td align="center">22.03</td>
<td align="center">3</td>
</tr>
<tr>
<td align="left">FPG (mg/dL)</td>
<td align="center">5.61</td>
<td align="center">51.5</td>
<td align="center">3.3</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">3.76</td>
<td align="center">8</td>
<td align="center">2.31</td>
<td align="center">7.43</td>
<td align="center">1.18</td>
<td align="center">8.31</td>
<td align="center">4</td>
</tr>
<tr>
<td align="left">&#x3b3;-GT (U/L)</td>
<td align="center">10.34</td>
<td align="center">0</td>
<td align="center">6.35</td>
<td align="center">0</td>
<td align="center">47.7</td>
<td align="center">0</td>
<td align="center">1</td>
<td align="center">6.5</td>
<td align="center">6.72</td>
<td align="center">2.7</td>
<td align="center">8.13</td>
<td align="center">5</td>
</tr>
<tr>
<td align="left">Gender</td>
<td align="center">0.07</td>
<td align="center">1.17</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">67</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">6.82</td>
<td align="center">6</td>
</tr>
<tr>
<td align="left">GPT (U/L)</td>
<td align="center">7.62</td>
<td align="center">0</td>
<td align="center">4.22</td>
<td align="center">0</td>
<td align="center">38.8</td>
<td align="center">1.44</td>
<td align="center">4.3</td>
<td align="center">1.57</td>
<td align="center">4.16</td>
<td align="center">1.69</td>
<td align="center">6.38</td>
<td align="center">7</td>
</tr>
<tr>
<td align="left">LDL-cholesterol (mg/dL)</td>
<td align="center">5.4</td>
<td align="center">19.75</td>
<td align="center">3.95</td>
<td align="center">14.61</td>
<td align="center">8.33</td>
<td align="center">1.33</td>
<td align="center">2.8</td>
<td align="center">1.31</td>
<td align="center">2.63</td>
<td align="center">2.64</td>
<td align="center">6.28</td>
<td align="center">8</td>
</tr>
<tr>
<td align="left">Sleep time</td>
<td align="center">0.74</td>
<td align="center">11.17</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">39</td>
<td align="center">0</td>
<td align="center">0.36</td>
<td align="center">0</td>
<td align="center">5.13</td>
<td align="center">9</td>
</tr>
<tr>
<td align="left">2-propanol</td>
<td align="center">1.63</td>
<td align="center">35.92</td>
<td align="center">2.04</td>
<td align="center">0</td>
<td align="center">7.95</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0.43</td>
<td align="center">2.75</td>
<td align="center">0</td>
<td align="center">5.07</td>
<td align="center">10</td>
</tr>
<tr>
<td align="left">Albumin (g/dL)</td>
<td align="center">0.97</td>
<td align="center">4.67</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">42</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">4.76</td>
<td align="center">11</td>
</tr>
<tr>
<td align="left">Acetone</td>
<td align="center">1.4</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">35.85</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0.33</td>
<td align="center">1.29</td>
<td align="center">3.89</td>
<td align="center">12</td>
</tr>
<tr>
<td align="left">Butyl 2-methylbutanoate</td>
<td align="center">0.26</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">32</td>
<td align="center">0</td>
<td align="center">4.31</td>
<td align="center">0</td>
<td align="center">3.66</td>
<td align="center">13</td>
</tr>
<tr>
<td align="left">Total bilirubin (mg/dL)</td>
<td align="center">3.35</td>
<td align="center">17.33</td>
<td align="center">2.09</td>
<td align="center">8.83</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">1.86</td>
<td align="center">1.99</td>
<td align="center">3.55</td>
<td align="center">14</td>
</tr>
<tr>
<td align="left">AP (U/L)</td>
<td align="center">2.96</td>
<td align="center">22.92</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0.08</td>
<td align="center">2.1</td>
<td align="center">0.47</td>
<td align="center">1.07</td>
<td align="center">1.38</td>
<td align="center">3.10</td>
<td align="center">15</td>
</tr>
<tr>
<td align="left">Diethylethanolamine</td>
<td align="center">1.21</td>
<td align="center">0</td>
<td align="center">3.73</td>
<td align="center">21.85</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">2.19</td>
<td align="center">1.26</td>
<td align="center">3.02</td>
<td align="center">16</td>
</tr>
<tr>
<td align="left">urethane</td>
<td align="center">0.75</td>
<td align="center">4.08</td>
<td align="center">0</td>
<td align="center">24.32</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">2.92</td>
<td align="center">17</td>
</tr>
<tr>
<td align="left">GOT (U/L)</td>
<td align="center">1.3</td>
<td align="center">0.67</td>
<td align="center">0</td>
<td align="center">21.85</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0.11</td>
<td align="center">0</td>
<td align="center">4.42</td>
<td align="center">0.24</td>
<td align="center">2.86</td>
<td align="center">18</td>
</tr>
<tr>
<td align="left">HDL-cholesterol (mg/dL)</td>
<td align="center">2.56</td>
<td align="center">17.08</td>
<td align="center">2.09</td>
<td align="center">2.37</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0.93</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0.6</td>
<td align="center">2.56</td>
<td align="center">19</td>
</tr>
<tr>
<td align="left">&#x3b2;-caryophyllene</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">25</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">2.50</td>
<td align="center">20</td>
</tr>
<tr>
<td align="left">DBP (mmHg)</td>
<td align="center">3.19</td>
<td align="center">13.58</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">1.33</td>
<td align="center">4.8</td>
<td align="center">0</td>
<td align="center">1.33</td>
<td align="center">0.53</td>
<td align="center">2.48</td>
<td align="center">21</td>
</tr>
<tr>
<td align="left">Furfural</td>
<td align="center">0.87</td>
<td align="center">22.42</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">2.33</td>
<td align="center">22</td>
</tr>
<tr>
<td align="left">Tridecane</td>
<td align="center">0.58</td>
<td align="center">15.08</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">4.7</td>
<td align="center">0</td>
<td align="center">2.05</td>
<td align="center">0.07</td>
<td align="center">2.25</td>
<td align="center">23</td>
</tr>
<tr>
<td align="left">4-methyloctanoic acid</td>
<td align="center">0.34</td>
<td align="center">21.67</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">2.20</td>
<td align="center">24</td>
</tr>
<tr>
<td align="left">(S)-2-methyl-1-butanol</td>
<td align="center">0.62</td>
<td align="center">21</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0.04</td>
<td align="center">0</td>
<td align="center">2.17</td>
<td align="center">25</td>
</tr>
<tr>
<td align="left">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
<td align="center">&#x2026;</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Abbreviations: ROI, rank of importance; FPG, fasting plasma glucose; &#x3b3;-GT, &#x3b3;-glutamyl transferase; GPT, serum glutamic pyruvic transaminase; AP, alkaline phosphatase; GOT, serum glutamic oxaloacetic transaminase; DBP, diastolic blood pressure.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The Bee Swarm plot derived from the XGBoost SHAP was shown in <xref ref-type="fig" rid="F5">Figure 5</xref>. From top to the bottom listed the features selected and the higher horizontal feature indicates it is more important. Each circle represents a participant&#x2019;s value impact of that feature. The red color has stronger impact whilst the blue one has less. Thus, this figure shows the direction of impact of each participants. Finally, <xref ref-type="fig" rid="F6">Figure 6</xref> shows the absolute strengths each feature from the highest to the lowest.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>The Bee Swarm plot derived from Shapley addictive explanation of eXtreme Gradient Boosting. Note: BMI: body mass index; TG, Triglycerides; LDL-C, Low density lipoprotein cholesterol; GPT, Serum glutamic pyruvic transaminase; FPG, Fasting plasma glucose; T-Bili, Total bilirubin; GOT, Serum glutamic oxaloacetic transaminase; UA, Uric acid; SBP, Systolic blood pressure; HDL-C, High density lipoprotein cholesterol; AFP, Alpha-fetoprotein; eGFR, estimated Glomerular filtration rate; &#x3b3;-GT, Gamma glutamyl transpeptidase.</p>
</caption>
<graphic xlink:href="fmolb-12-1631265-g005.tif">
<alt-text content-type="machine-generated">Dot plot showing SHAP values for various features impacting a model's output. Features include BMI, TG, and Age. Blue to pink gradient indicates low to high feature values. BMI shows the widest range of impact.</alt-text>
</graphic>
</fig>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>The absolute Shapley addictive explanation values of each feature. Note: BMI, body mass index; TG, Triglycerides; LDL-C, Low density lipoprotein cholesterol; GPT, Serum glutamic pyruvic transaminase; FPG, Fasting plasma glucose; T-Bili, Total bilirubin; GOT, Serum glutamic oxaloacetic transaminase; UA, Uric acid; SBP, Systolic blood pressure; HDL-C, High density lipoprotein cholesterol; AFP, Alpha-fetoprotein; eGFR, estimated Glomerular filtration rate; &#x3b3;-GT, Gamma glutamyl transpeptid.</p>
</caption>
<graphic xlink:href="fmolb-12-1631265-g006.tif">
<alt-text content-type="machine-generated">Bar chart showing mean SHAP values indicating the impact of features on model output. BMI has the highest impact, followed by TG, 2-propanol, LDL-C, and Age. Other features have progressively smaller impacts.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>To the best of our knowledge, this study represents the largest cohort to date in the field of breath-based diagnostics for NAFLD, with 1,501 participants included. Previous related studies typically involved fewer than 100 subjects (<xref ref-type="bibr" rid="B31">Grewal and Mahmood, 2009</xref>; <xref ref-type="bibr" rid="B13">Chen et al., 2015</xref>), thereby limiting the generalizability and statistical power of their findings. Additionally, those studies primarily employed traditional statistical methods, which often fail to capture non-linear relationships among complex variables. In contrast, our study applied 10 different Mach-L algorithms, demonstrating that the inclusion of 341 VOCs in Model 1 led to a notable improvement in AUC, ranging from 5.20% to 9.80%, across different modeling approaches.</p>
<p>Volatile organic compounds (VOCs)&#x2014;produced through endogenous metabolism, microbiota activity, and various cellular processes&#x2014;hold significant potential as non-invasive biomarkers for disease detection. One of the greatest strengths of VOC-based diagnostics lies in their non-invasive nature, making them ideal for monitoring chronic conditions, tracking disease progression, and conducting large-scale population screening where invasive procedures are impractical. Furthermore, VOCs may offer early indicators of disease, enabling prompt diagnosis and intervention. This is particularly crucial for diseases like cancer and metabolic disorders, where early detection significantly enhances treatment outcomes.</p>
<p>By constructing a quantitative VOCs library from both sub-healthy and diseased individuals, predictive models and diagnostic algorithms can be refined to detect diseases at earlier stages. Importantly, the combination of VOC data with traditional clinical parameters and biomarkers enhances the accuracy and robustness of predictive models. Thus, the integration of quantitative VOC analysis has great potential to advance preventive medicine and revolutionize early disease detection.</p>
<p>Nevertheless, for VOCs to be effectively implemented in clinical practice, further research and validation are essential. Our present study lays a solid foundation for enhancing non-invasive prediction of NAFLD, and additional studies based on these findings are currently underway. Compared to previous research utilizing breathomics in NAFLD patients (<xref ref-type="table" rid="T6">Table 6</xref>) (<xref ref-type="bibr" rid="B2">Akesson, 1977</xref>; <xref ref-type="bibr" rid="B3">Alkhouri et al., 2014</xref>; <xref ref-type="bibr" rid="B11">Calabrese et al., 2023</xref>), our study offers a more comprehensive investigation, not only due to its larger sample size, but also through the simultaneous consideration of VOCs and clinical data, and the application of multiple machine learning algorithms for predictive modeling&#x2014;an approach not previously explored in this field. However, it should be noted that, at this stage, due to two reasons the application of VOC in clinical practice is not practical; first, the sensitivity and specificity are not high enough; second, the cost of VOCs is still high.</p>
<table-wrap id="T6" position="float">
<label>TABLE 6</label>
<caption>
<p>Analysis pipelines of studies using breath-based VOCs towards non-alcoholic fatty liver prediction.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Technique</th>
<th align="left">Sample size</th>
<th align="left">&#x23; Of VOCs</th>
<th align="center">Methods</th>
<th align="center">References</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">GC-MS</td>
<td align="center">46</td>
<td align="center">127</td>
<td align="left">Partial least square discriminant analysis</td>
<td align="left">
<xref ref-type="bibr" rid="B11">Calabrese et al., 2023</xref>
</td>
</tr>
<tr>
<td align="left">SIFT-MS</td>
<td align="center">60</td>
<td align="center">14</td>
<td align="left">Canonical discriminant analysis</td>
<td align="left">
<xref ref-type="bibr" rid="B3">Alkhouri et al., 2014</xref>
</td>
</tr>
<tr>
<td align="left">GC-MS</td>
<td align="center">60</td>
<td align="center">220</td>
<td align="left">Univariate analysis</td>
<td align="left">
<xref ref-type="bibr" rid="B68">Raman et al., 2013</xref>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In the present study we did use XGBoost in order to examine the directions and impacts of each variable. The interpretation was given in the results section and, out of the 20 features, 6 different VOCs were selected and 2-propanol was the third important VOCS.</p>
<p>From the initial 341 VOCs analyzed, the top 10 most relevant compounds were identified using machine learning algorithms. Ranked by importance, these VOCs were: 2-propanol, acetone, butyl 2-methylbutanoate, diethylethanolamine, urethane, &#x3b2;-caryophyllene, furfural, tridecane, 4-methyloctanoic acid, and (S)-2-methyl-1-butanol.</p>
<p>The gold standard for diagnosing NAFLD remains liver biopsy (<xref ref-type="bibr" rid="B10">Brunt et al., 1999</xref>; <xref ref-type="bibr" rid="B40">Kleiner et al., 2005</xref>), yet this approach is invasive and carries a complication risk of approximately 0.5% (<xref ref-type="bibr" rid="B6">Bravo et al., 2001</xref>; <xref ref-type="bibr" rid="B62">Piccinino et al., 1986</xref>). Alternative, less invasive methods such as the Fibrosis-4 Index, which incorporates age, liver enzymes, and platelet count, have shown a positive predictive value (PPV) of around 80% (<xref ref-type="bibr" rid="B5">Author Anonymous, 2025</xref>). Likewise, ultrasound has demonstrated high sensitivity and specificity (84.8% and 93.6%, respectively) in detecting moderate to severe steatosis. Given this, one might argue that VOC analysis is more labor-intensive and costly. However, the primary value of VOCs lies in their potential to uncover novel insights into NAFLD pathophysiology, which could eventually lead to new therapeutic targets. Importantly, this study did not establish a causal relationship between VOCs and NAFLD.</p>
<p>As expected, the top-ranking variables in our analysis were traditional risk factors, including BMI, triglycerides (TG), fasting plasma glucose (FPG), among others. The first VOC to appear in the list was 2-propanol. The well-established impact of traditional clinical variables should not be overlooked (<xref ref-type="bibr" rid="B36">Huh et al., 2022</xref>), but it must also be recognized that these factors may confound the identification of VOCs truly associated with NAFLD. To address this, our machine learning models adjusted for the effects of conventional predictors, allowing for a more accurate evaluation of VOC contributions.</p>
<p>Below is a brief discussion of the top 10 VOCs identified:</p>
<sec id="s4-1">
<title>2-Propanol</title>
<p>Lu et al. demonstrated that subchronic exposure to 2-propanol in mice induced NAFLD through dysregulation of the AMPK signaling pathway (<xref ref-type="bibr" rid="B49">Lu et al., 2015</xref>). Interestingly, in our study, 2- propanol levels were lower in NAFLD subjects, suggesting possible upregulation of AMPK as a protective or compensatory modality (<xref ref-type="bibr" rid="B26">Fang et al., 2022</xref>). However, the specific mechanistic studies on 2-propanol and fatty liver are limited, its known hepatotoxicity and the findings from animal studies support the possibility that 2-propanol exposure can contribute to fatty liver development, especially with high or prolonged exposure (<xref ref-type="bibr" rid="B75">Satapathy et al., 2015</xref>; <xref ref-type="bibr" rid="B91">World HealthOrganizatiom-INTERNATIONAL P ROGRAMME ON CHEMICALSAFETY, 1990</xref>).</p>
</sec>
<sec id="s4-2">
<title>Acetone</title>
<p>Solga et al. previously reported that breath acetone was associated with NAFLD in morbidly obese patients undergoing bariatric surgery (<xref ref-type="bibr" rid="B78">Solga et al., 2006</xref>). This may reflect decreased d-3- hydroxybutyrate dehydrogenase activity or altered NADH levels, leading to acetone accumulation. There might be two mechanisms behind this relationship. First, enhancing ketogenesis reduces hepatic lipid accumulation in preclinical models. Exogenous ketones (e.g., &#x3b2;-hydroxybutyrate) show anti-inflammatory and antifibrotic effects, suggesting protective roles (<xref ref-type="bibr" rid="B42">Kwon et al., 2024</xref>). Second, while elevated acetone may indicate metabolic stress in early NAFLD, targeted ketone supplementation or ketogenic diets could mitigate steatosis and inflammation in specific contexts (<xref ref-type="bibr" rid="B42">Kwon et al., 2024</xref>). Our findings were consistent, with higher acetone levels in NAFLD subjects, though the difference was not statistically significant.</p>
</sec>
<sec id="s4-3">
<title>Butyl 2-methylbutanoate</title>
<p>This fatty acid ester, found naturally in apricots (Prunus armeniaca), has been associated with celiac disease and IBS (<xref ref-type="bibr" rid="B65">pubchem, 2025</xref>). Only one prior study has investigated its link to NAFLD, finding higher prevalence in NAFLD patients (<xref ref-type="bibr" rid="B68">Raman et al., 2013</xref>). It might have influences on NAFLD due to the gut microbiota alterations which correlates with elevated 2-butanone (a structurally related ketone), hinting at broader metabolic disruptions involving ester-like compounds (<xref ref-type="bibr" rid="B19">Del et al., 2016</xref>). In the same time, methyl tert-butyl ether, another ether compound, shows epidemiological links to NAFLD risk in humans, suggesting potential shared mechanisms for ester/ether-induced metabolic dysfunction (<xref ref-type="bibr" rid="B16">Cui et al., 2024</xref>). Additional research is needed to elucidate its pathophysiological role.</p>
</sec>
<sec id="s4-4">
<title>Diethylethanolamine</title>
<p>Akesson reported that diethylethanolamine promotes the conversion of phosphatidylethanolamine to phosphatidylcholine, a hepatoprotective compound (<xref ref-type="bibr" rid="B2">Akesson, 1977</xref>). However, at present, there is no direct evidence linking it to NAFLD. It is well known that alcohol metabolism produces acetaldehyde and reactive oxygen species that cause fatty liver. While diethylethanolamine is not an alcohol, its metabolism might theoretically produce reactive intermediates that could similarly affect hepatic cells (<xref ref-type="bibr" rid="B46">Liu, 2014</xref>). Our findings&#x2014;lower levels in NAFLD subjects&#x2014;support this mechanism and suggest its potential protective role.</p>
</sec>
<sec id="s4-5">
<title>Urethane</title>
<p>Studies in rats demonstrate that administration of carcinogenic doses of urethane leads to liver microsomal damage, including degranulation of liver microsomes, which impairs liver cell function and contributes to hepatic injury (<xref ref-type="bibr" rid="B17">Dani, 1983</xref>). In human, it is found that liver injury in workers exposed to N,N-dimethylformamide (DMF) (<xref ref-type="bibr" rid="B58">Nakasone et al., 2011</xref>; <xref ref-type="bibr" rid="B59">Nomiyama et al., 2001</xref>; <xref ref-type="bibr" rid="B71">Redlich et al., 1988</xref>), urethane levels were higher in the control group in our study. While this may indicate resistance to hepatic injury, further evidence is required to substantiate this hypothesis.</p>
</sec>
<sec id="s4-6">
<title>&#x3b2;-caryophyllene</title>
<p>This anti-inflammatory, plant-derived compound activates CB2 receptors, reducing oxidative stress and hepatic injury in mice models (<xref ref-type="bibr" rid="B88">Varga et al., 2018</xref>). In the same time, it could reduce intracellular lipid accumulation, primarily by lower saturated fatty acids and modifying the lipid profile toward less harmful species (<xref ref-type="bibr" rid="B76">Scandiffio et al., 2023</xref>). Our findings align with this, supporting its potential therapeutic use.</p>
</sec>
<sec id="s4-7">
<title>Furfural</title>
<p>Interestingly, furfural has a complex relationship with liver health. In low dose, it could improve mitochondrial function, reduced reactive oxygen species, and restoration of the NAD<sup>&#x2b;</sup>/NADH redox balance, which is crucial for lipid metabolism and preventing fatty liver progression (<xref ref-type="bibr" rid="B14">Cheng et al., 2022</xref>). But when it is in high dose, a Maillard reaction product with antioxidant properties, furfural has demonstrated hepatocyte-protective effects in animal studies (<xref ref-type="bibr" rid="B64">Powell et al., 2014</xref>). This may explain its relevance in our NAFLD model.</p>
</sec>
<sec id="s4-8">
<title>Tridecane</title>
<p>There is currently no direct evidence or well-established research linking tridecane specifically to NAFLD or its progression. Tridecane is a hydrocarbon (alkane) commonly found in petroleum products and some environmental pollutants, but its direct impact on liver fat accumulation or liver metabolism has not been clearly documented. The only evidence is that tridecane has been associated with inflammation and lipid peroxidation, particularly in distinguishing NASH from non-NASH (<xref ref-type="bibr" rid="B82">The good scents company, 2025</xref>).</p>
</sec>
<sec id="s4-9">
<title>4-methyloctanoic acid</title>
<p>Although largely known for its use in food flavoring, this compound is a fatty acid and may reflect metabolic changes. The possible mechanisms include it is a BCFA involved in lipid metabolism; it can modulate gene expression related to fatty acid metabolism; and there is an indirect link to the NAVLD (<xref ref-type="bibr" rid="B96">Zhao et al., 2022</xref>; <xref ref-type="bibr" rid="B48">Liu et al., 2018</xref>; <xref ref-type="bibr" rid="B63">Pooya et al., 2012</xref>). We observed higher levels in non-NAFLD subjects, potentially due to better hepatic metabolism in healthier individuals (<xref ref-type="bibr" rid="B93">Yamaguchi et al., 2007</xref>).</p>
</sec>
<sec id="s4-10">
<title>(S)-2-methyl-1-butanol</title>
<p>Produced by <italic>Saccharomyces cerevisiae</italic>, this compound has antioxidant properties (<xref ref-type="bibr" rid="B90">Wilson et al., 2022</xref>; <xref ref-type="bibr" rid="B1">Agarwal et al., 2020</xref>; <xref ref-type="bibr" rid="B43">Landolfo et al., 2008</xref>), which may be linked to liver protection. In the same time, it is a fatty alcohol lipid molecule involved in metabolic pathways related to fatty acid and alcohol metabolism. It can be oxidized to 2-methylbutyrate, which then enters beta-oxidation to produce acetyl-CoA and propionyl-CoA, key intermediates in energy metabolism (<xref ref-type="bibr" rid="B83">Thompson et al., 2020</xref>). This indicates that (S)-2-methyl-1-butanol is metabolically linked to fatty acid catabolism through its conversion to fatty acid derivatives that feed into mitochondrial energy pathways. While no prior study has evaluated its relationship with NAFLD, our findings suggest it may play a role in hepatic defense mechanisms.</p>
</sec>
<sec id="s4-11">
<title>Limitations</title>
<p>Despite the strengths of our study&#x2014;including a large sample size and comprehensive VOC profiling&#x2014;there are important limitations. In the present study, we do have limitations. First, this is a cross-sectional study which is less persuasive than a longitudinal one. There is no conclusion of cause-effect relationship could be drawn. However, since some of these participants will continue to have a health check up in our clinic, in the future, we believe that we will have a longitudinal study. Second, the participants were only limited to Taiwanese. It should be exercised to another ethnic group with cautious. In the future, since these participants will remain to be followed up in the MJ clinic, longitudinal studies could be done by using the present results of VOCs to predict future diseases. In the same time, we will separate these participants into two groups; one for selecting the VOCs, the rest will be treated as a validation group.</p>
</sec>
</sec>
<sec sec-type="conclusion" id="s5">
<title>Conclusion</title>
<p>Using 10 different Mach-L algorithms, we identified the relative importance of both clinical parameters and volatile organic compounds (VOCs) in predicting non-alcoholic fatty liver disease (NAFLD) within a cohort of 1,501 participants. Among clinical variables, the most influential features included body mass index (BMI), triglycerides (TG), uric acid (UA), fasting plasma glucose (FPG), &#x3b3;-glutamyltransferase (&#x3b3;-GT), gender, low-density lipoprotein cholesterol (LDL-C), and sleep duration.</p>
<p>In addition to traditional clinical predictors, 2-propanol emerged as the most influential VOC, followed in descending order by acetone, butyl 2-methylbutanoate, diethylethanolamine, urethane, &#x3b2;-caryophyllene, furfural, tridecane, 4-methyloctanoic acid, and (S)-2-methyl-1- butanol. The potential biological relevance and mechanisms of action of these VOCs were discussed in relation to liver metabolism and disease pathology.</p>
<p>While this study offers new insights into the role of VOCs as non-invasive biomarkers for NAFLD, its cross-sectional design limits the ability to determine causality. Future research should aim to conduct longitudinal studies to further elucidate the cause-effect relationships between VOCs and the development or progression of NAFLD.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, upon reasonable request.</p>
</sec>
<sec sec-type="ethics-statement" id="s7">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Institutional Review Board of National Yang Ming Chiao Tung University, Taiwan (IRB No. NCTU-REC-109-074E). The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>C-HS: Conceptualization, Investigation, Writing &#x2013; original draft. R-HH: Resources, Validation, Writing &#x2013; original draft. Y-KL: Conceptualization, Project administration, Writing &#x2013; review and editing. T-WC: Resources, Writing &#x2013; review and editing. DP: Data curation, Supervision, Writing &#x2013; review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s9">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work was financially supported by the project MOST 109-2634-F-009-028 and the Center for Emergent Functional Matter Science of National Yang Ming Chiao Tung University from The Featured Areas Research Center Program within the framework of the Higher Education Sprout Project by the Ministry of Education (MOE) in Taiwan. This work was also financially supported by grants from the Tri-Service General Hospital (Award numbers: TSGH-E-113257, TSGH-E-114259), Ministry of National Defense, Medical Affairs Bureau (Award number: MND-MAB-D-113083, MND-MAB-D-114107), Teh-Tzer Study Group for Human Medical Research Foundation (Award number: B1141005). The funding sources had no role in the study design, in the collection, analysis, and interpretation of data, in the writing of the report, and in the decision to submit the article for publication.</p>
</sec>
<ack>
<p>The authors acknowledge the research collaboration and technical service supported by National Human Microbiome Core Facility, Taiwan (NSTC 112-2740-B-A49-002).</p>
</ack>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s11">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s12">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Agarwal</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Patel</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>More</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sapara</surname>
<given-names>K. K.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>V. K.</given-names>
</name>
<name>
<surname>Agarwal</surname>
<given-names>P. K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The AlRabring7 E3-Ub-ligase mediates AlRab7 ubiquitination and improves ionic and oxidative stress tolerance in <italic>Saccharomyces cerevisiae</italic>
</article-title>. <source>Plant Physiol. biochem.</source> <volume>151</volume>, <fpage>689</fpage>&#x2013;<lpage>704</lpage>. <pub-id pub-id-type="doi">10.1016/j.plaphy.2020.03.030</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Akesson</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>1977</year>). <article-title>Effects of analogles of ethanolamine and choline on phospholipid metabolism in rat hepatocytes</article-title>. <source>Biochem. J.</source> <volume>168</volume> (<issue>3</issue>), <fpage>401</fpage>&#x2013;<lpage>408</lpage>. <pub-id pub-id-type="doi">10.1042/bj1680401</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alkhouri</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Cikach</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Eng</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Moses</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Patel</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Analysis of breath volatile organic compounds as a noninvasive tool to diagnose nonalcoholic fatty liver disease in children</article-title>. <source>Eur. J. Gastroenterol. Hepatol.</source> <volume>26</volume> (<issue>1</issue>), <fpage>82</fpage>&#x2013;<lpage>87</lpage>. <pub-id pub-id-type="doi">10.1097/MEG.0b013e3283650669</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arkoudis</surname>
<given-names>N. A.</given-names>
</name>
<name>
<surname>Papadakos</surname>
<given-names>S. P.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Machine learning applications in healthcare clinical practice and research</article-title>. <source>World J. Clin. Cases</source> <volume>13</volume> (<issue>1</issue>), <fpage>99744</fpage>. <pub-id pub-id-type="doi">10.12998/wjcc.v13.i1.99744</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="web">
<collab>Author Anonymous</collab> (<year>2025</year>). <article-title>Hepatology</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="http://gihep.com/calculators/hepatology/fbrosis-4-score/">http://gihep.com/calculators/hepatology/fbrosis-4-score/</ext-link>.</comment>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bravo</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Sheth</surname>
<given-names>S. G.</given-names>
</name>
<name>
<surname>Chopra</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Liver biopsy</article-title>. <source>N. Engl. J. Med.</source> <volume>344</volume> (<issue>7</issue>), <fpage>495</fpage>&#x2013;<lpage>500</lpage>. <pub-id pub-id-type="doi">10.1056/NEJM200102153440706</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Olshen</surname>
</name>
</person-group> (<year>2001</year>). <article-title>Random forests</article-title>. <source>Mach. Learn</source> <volume>45</volume> (<issue>1</issue>), <fpage>5</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Friedman</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Olshen</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Stone</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>1984</year>). <article-title>Classification and regression trees</article-title>. <source>Wadsworth Int. Group.</source> <fpage>237</fpage>&#x2013;<lpage>251</lpage>. <pub-id pub-id-type="doi">10.1201/9781315139470</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Browne</surname>
<given-names>M. W.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Cross-validation methods</article-title>. <source>J. Math. Psychol.</source> <volume>44</volume> (<issue>1</issue>), <fpage>108</fpage>&#x2013;<lpage>132</lpage>. <pub-id pub-id-type="doi">10.1006/jmps.1999.1279</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brunt</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Janney</surname>
<given-names>C. G.</given-names>
</name>
<name>
<surname>Di Bisceglie</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Neuschwander-Tetri</surname>
<given-names>B. A.</given-names>
</name>
<name>
<surname>Bacon</surname>
<given-names>B. R.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Nonalcoholic steatohepatitis: a proposal for grading and staging the histological lesions</article-title>. <source>Am. J. Gastroenterol.</source> <volume>94</volume> (<issue>9</issue>), <fpage>2467</fpage>&#x2013;<lpage>2474</lpage>. <pub-id pub-id-type="doi">10.1111/j.1572-0241.1999.01377.x</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Calabrese</surname>
<given-names>F. M.</given-names>
</name>
<name>
<surname>Celano</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Bonfiglio</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Campanella</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Franco</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Annunziato</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Synergistic effect of diet and physical activity on a NAFLD cohort: metabolomics profile and clinical variable evaluation</article-title>. <source>Nutrients</source> <volume>15</volume> (<issue>11</issue>), <fpage>2457</fpage>. <pub-id pub-id-type="doi">10.3390/nu15112457</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>C. H.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>M. H.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Nien</surname>
<given-names>C. K.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Yeh</surname>
<given-names>Y. H.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>Prevalence and risk factors of nonalcoholic fatty liver disease in an adult population of Taiwan: metabolic significance of nonalcoholic fatty liver disease in nonobese adults</article-title>. <source>J. Clin. Gastroenterol.</source> <volume>40</volume> (<issue>8</issue>), <fpage>745</fpage>&#x2013;<lpage>752</lpage>. <pub-id pub-id-type="doi">10.1097/00004836-200609000-00016</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Torralba</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Embree</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zengler</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>St&#xe4;rkel</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Supplementation of saturated long-chain fatty acids maintains intestinal eubiosis and reduces ethanol-induced liver injury in mice</article-title>. <source>Gastroenterology</source> <volume>148</volume> (<issue>1</issue>), <fpage>203</fpage>&#x2013;<lpage>214.e16</lpage>. <pub-id pub-id-type="doi">10.1053/j.gastro.2014.09.014</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cheng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Furfural produces dose-dependent attenuating effects on ethanol-induced toxicity in the liver</article-title>. <source>Front. Pharmacol.</source> <volume>13</volume>, <fpage>906933</fpage>. <pub-id pub-id-type="doi">10.3389/fphar.2022.906933</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chung</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Akter</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Shin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>T. G.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Diagnosis by volatile organic compounds in exhaled breath in exhaled breath from patients with gastric and colorectal cancers</article-title>. <source>Int. J. Mol. Sci.</source> <volume>24</volume> (<issue>1</issue>), <fpage>129</fpage>. <pub-id pub-id-type="doi">10.3390/ijms24010129</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Cui</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <source>Methyl tert-Butyl ether may be a potential environmental pathogenic factor for nonalcoholic fatty liver disease: results from NHANES 2017&#x2013;2020</source>. <publisher-loc>Washington, DC</publisher-loc>: <publisher-name>ACS publication</publisher-name>. <pub-id pub-id-type="doi">10.1021/envhealth.4c00140</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dani</surname>
<given-names>H. M.</given-names>
</name>
</person-group> (<year>1983</year>). <article-title>Effects of toxic doses of urethane on rat liver and lung microsomes</article-title>. <source>Toxicol. Lett.</source> <volume>15</volume> (<issue>1</issue>), <fpage>61</fpage>&#x2013;<lpage>64</lpage>. <pub-id pub-id-type="doi">10.1016/0378-4274(83)90170-4</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dasarathy</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dasarathy</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Khiyami</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Joseph</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lopez</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>McCullough</surname>
<given-names>A. J.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Validity of real time ultrasound in the diagnosis of hepatic steatosis: a prospective study</article-title>. <source>J. Hepatol.</source> <volume>51</volume> (<issue>6</issue>), <fpage>1061</fpage>&#x2013;<lpage>1067</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhep.2009.09.001</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Del</surname>
<given-names>C. F.</given-names>
</name>
<name>
<surname>Nobili</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Vernocchi</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Russo</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>De</surname>
<given-names>S. C.</given-names>
</name>
<name>
<surname>Gnani</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Gut microbiota profiling of pediatric nonalcoholic fatty liver disease and obese patients unveiled by an integrated meta&#x2010;omics&#x2010;based approach</article-title>. <source>Hepatology</source> <volume>65</volume> (<issue>2</issue>), <fpage>451</fpage>&#x2013;<lpage>464</lpage>. <pub-id pub-id-type="doi">10.1002/hep.28572</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DeLong</surname>
<given-names>E. R.</given-names>
</name>
<name>
<surname>DeLong</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Clarke-Pearson</surname>
<given-names>D. L.</given-names>
</name>
</person-group> (<year>1988</year>). <article-title>Comparing the areas under two or more correlated receiver operating characteristic curves: a nonparametric approach</article-title>. <source>Biometrics</source> <volume>44</volume> (<issue>3</issue>), <fpage>837</fpage>&#x2013;<lpage>845</lpage>. <pub-id pub-id-type="doi">10.2307/2531595</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dias Canedo</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Cordeiro Mendes</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Software requirements classification using machine learning algorithms</article-title>. <source>Entropy</source> <volume>22</volume> (<issue>9</issue>), <fpage>1057</fpage>. <pub-id pub-id-type="doi">10.3390/e22091057</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>di Biase</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Di Santo</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Caminiti</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>De Liso</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Shah</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Ricci</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Gait analysis in parkinson&#x27;s disease: an overview of the Most accurate markers for diagnosis and symptoms monitoring</article-title>. <source>Sensors</source> <volume>20</volume> (<issue>12</issue>), <fpage>3529</fpage>. <pub-id pub-id-type="doi">10.3390/s20123529</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dorogush</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Ershov</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Gulin</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>CatBoost: gradient boosting with categorical features support</article-title>. <source>arXiv</source>. <pub-id pub-id-type="doi">10.48550/arXiv.1810.11363</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Duan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Yue</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2025</year>). <article-title>The association analysis between exposure to volatile organic compounds and fatty liver disease in US adults</article-title>. <source>Dig. Liver Dis.</source> <volume>57</volume> (<issue>2</issue>), <fpage>535</fpage>&#x2013;<lpage>541</lpage>. <pub-id pub-id-type="doi">10.1016/j.dld.2024.09.027</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dusanter</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Holzinger</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Klein</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Salameh</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Jamar</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Measurement guidelines for VOC analysis by PTR-MS</article-title>. <source>ACTRIS</source>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.actris.eu/sites/default/files/inline-files/PTRMS%20SOP%20(April2025).pdf">https://www.actris.eu/sites/default/files/inline-files/PTRMS%20SOP%20(April2025).pdf</ext-link>.</comment>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Qu</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Lei</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>The AMPK pathway in fatty liver disease</article-title>. <source>Front. Physiol.</source> <volume>13</volume>, <fpage>970292</fpage>. <pub-id pub-id-type="doi">10.3389/fphys.2022.970292</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="book">
<collab>Final Report</collab> (<year>2012</year>). <source>Analytical methodology development and evaluation</source>. <publisher-loc>Sydney NSW Australia</publisher-loc>: <publisher-name>University of New South Wales</publisher-name>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://water360.com.au/wp-content/uploads/2022/02/Analytical-Methodology-Development-Report-Final.pdf">https://water360.com.au/wp-content/uploads/2022/02/Analytical-Methodology-Development-Report-Final.pdf</ext-link>.</comment>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Friedman</surname>
<given-names>J. H.</given-names>
</name>
</person-group> (<year>1991</year>). <article-title>Multivariate adaptive regression splines</article-title>. <source>Ann. Stat.</source> <volume>19</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>67</lpage>. <pub-id pub-id-type="doi">10.1214/aos/1176347963</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Friedman</surname>
<given-names>J. H.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Greedy function approximation: a gradient boosting machine</article-title>. <source>Ann. Stat.</source> <volume>29</volume> (<issue>5</issue>), <fpage>1189</fpage>&#x2013;<lpage>1232</lpage>. <pub-id pub-id-type="doi">10.1214/aos/1013203451</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ghevariya</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Sandar</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Patel</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Ghevariya</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Shah</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Aron</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Knowing what&#x27;s out there: awareness of non-alcoholic fatty liver disease</article-title>. <source>Front. Med.</source> <volume>1</volume>, <fpage>4</fpage>. <pub-id pub-id-type="doi">10.3389/fmed.2014.00004</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grewal</surname>
<given-names>R. K.</given-names>
</name>
<name>
<surname>Mahmood</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Ethanol induced changes in glycosylation of mucins in rat intestine</article-title>. <source>Ann. Gastroenterol.</source> <volume>22</volume>, <fpage>178</fpage>&#x2013;<lpage>183</lpage>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="http://www.annalsgastro.gr/index.php/annalsgastro/article/view/746">http://www.annalsgastro.gr/index.php/annalsgastro/article/view/746</ext-link>.</comment>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gu</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Make complex heatmaps</article-title>. <source>R. Package Version</source> <volume>2</volume> (<issue>6.2</issue>). <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://github.com/jokergoo/ComplexHeatmap">https://github.com/jokergoo/ComplexHeatmap</ext-link> (Accessed on May 11, 2024)</comment>.</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hashim</surname>
<given-names>I. C.</given-names>
</name>
<name>
<surname>Shariff</surname>
<given-names>A. R. M.</given-names>
</name>
<name>
<surname>Bejo</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Muharam</surname>
<given-names>F. M.</given-names>
</name>
<name>
<surname>Ahmad</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Machine-learning approach using SAR data for the classification of oil palm trees that are Non- infected and infected with the basal stem rot disease</article-title>. <source>Agronomy</source> <volume>11</volume>, <fpage>532</fpage>. <pub-id pub-id-type="doi">10.3390/agronomy11030532</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wainwright</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2015</year>). <source>Statistical learning with sparsity: the lasso and generalizations</source>. <publisher-loc>Boca Raton, FL, USA</publisher-loc>: <publisher-name>CRC Press</publisher-name>.</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoerl</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Kennard</surname>
<given-names>R. W.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Ridge regression: biased estimation for nonorthogonal problems</article-title>. <source>Technometrics</source> <volume>42</volume> (<issue>1</issue>), <fpage>80</fpage>&#x2013;<lpage>86</lpage>. <pub-id pub-id-type="doi">10.2307/1271436</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huh</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Cho</surname>
<given-names>Y. J.</given-names>
</name>
<name>
<surname>Nam</surname>
<given-names>G. E.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Recent epidemiology and risk factors of nonalcoholic fatty liver disease</article-title>. <source>J. Obes. Metab. Syndr.</source> <volume>31</volume> (<issue>1</issue>), <fpage>17</fpage>&#x2013;<lpage>27</lpage>. <pub-id pub-id-type="doi">10.7570/jomes22021</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hussain</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>H. E.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>H. J.</given-names>
</name>
<name>
<surname>Aich</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Saqlain</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>H. C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Forecast the exacerbation in patients of chronic obstructive pulmonary disease with clinical indicators using machine learning techniques</article-title>. <source>Diagnostics</source> <volume>11</volume> (<issue>5</issue>), <fpage>829</fpage>. <pub-id pub-id-type="doi">10.3390/diagnostics11050829</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ke</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Finley</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). &#x201c;<article-title>Lightgbm: a highly efficient gradient boosting decision tree</article-title>,&#x201d; in <source>Advances in neural information processing systems</source>. Editors <person-group person-group-type="editor">
<name>
<surname>Guyon</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Luxburg</surname>
<given-names>U. V.</given-names>
</name>
<name>
<surname>Bengio</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wallach</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Fergus</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Vishwanathan</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<publisher-loc>New York</publisher-loc>: <publisher-name>Curran Associates</publisher-name>), <fpage>3146</fpage>&#x2013;<lpage>3154</lpage>.</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Keogh</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Riches</surname>
<given-names>J. C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>The use of breath analysis in the management of lung cancer: is it ready for primetime?</article-title> <source>Curr. Oncol.</source> <volume>29</volume> (<issue>10</issue>), <fpage>7355</fpage>&#x2013;<lpage>7378</lpage>. <pub-id pub-id-type="doi">10.3390/curroncol29100578</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kleiner</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Brunt</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Van Natta</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Behling</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Contos</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Cummings</surname>
<given-names>O. W.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>Design and validation of a histological scoring system for nonalcoholic fatty liver disease</article-title>. <source>Hepatology</source> <volume>41</volume> (<issue>6</issue>), <fpage>1313</fpage>&#x2013;<lpage>1321</lpage>. <pub-id pub-id-type="doi">10.1002/hep.20701</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kuhn</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Caret: classification and regression training</article-title>. <source>R. Package Version</source> <volume>6</volume>, <fpage>93</fpage>. <pub-id pub-id-type="doi">10.32614/CRAN.package.caret</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kwon</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jeyaratnam</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>K. H.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Targeting ketone body metabolism to treat fatty liver disease</article-title>. <source>J. Pharm. and Pharm. Sci.</source> <volume>27</volume>, <fpage>13375</fpage>. <pub-id pub-id-type="doi">10.3389/jpps.2024.13375</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Landolfo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Politi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Angelozzi</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Mannazzu</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>ROS accumulation and oxidative damage to cell structures in <italic>Saccharomyces cerevisiae</italic> wine strains during fermentation of high-sugar-containing medium</article-title>. <source>Biochim. Biophys. Acta</source> <volume>1780</volume> (<issue>6</issue>), <fpage>892</fpage>&#x2013;<lpage>898</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbagen.2008.03.008</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lang</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Beier</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Interaction of volatile organic compounds and underlying liver disease: a new paradigm for risk</article-title>. <source>Biol. Chem.</source> <volume>399</volume> (<issue>11</issue>), <fpage>1237</fpage>&#x2013;<lpage>1248</lpage>. <pub-id pub-id-type="doi">10.1515/hsz-2017-0324</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>C. S.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>S. O.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>L. Y.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Prevalence of HFE mutations and relation to serum iron status in patients with chronic hepatitis C and patients with nonalcoholic fatty liver disease in Taiwan in review fatty liver diseasein Taiwan</article-title>. <source>World J. Gastroenterol.</source> <volume>11</volume> (<issue>25</issue>), <fpage>3905</fpage>&#x2013;<lpage>3908</lpage>. <pub-id pub-id-type="doi">10.3748/wjg.v11.i25.3905</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Ethanol and liver: recent insights into the mechanisms of ethanol-induced fatty liver</article-title>. <source>World J. gastroenterology WJG</source> <volume>20</volume> (<issue>40</issue>), <fpage>14672</fpage>&#x2013;<lpage>14685</lpage>. <pub-id pub-id-type="doi">10.3748/wjg.v20.i40.14672</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Qiu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Single-chemical and mixture effects of multiple volatile organic compounds exposure on liver injury and risk of non-alcoholic fatty liver disease in a representative general adult population</article-title>. <source>Chemosphere</source> <volume>339</volume>, <fpage>139753</fpage>. <pub-id pub-id-type="doi">10.1016/j.chemosphere.2023.139753</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Erdene</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mu</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Ao</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Effects of flavonoids from Allium mongolicum regel as a dietary additive on meat quality and composition of fatty acids related to flavor in lambs</article-title>. <source>Can. J. Animal Sci.</source> <volume>99</volume> (<issue>1</issue>), <fpage>15</fpage>&#x2013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.1139/cjas-2018-0008</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Nonalcoholic fatty liver disease induced by 13-week oral administration of 1,3-dichloro-2- propanol in C57BL/6J mice</article-title>. <source>Environ. Toxicol. Pharmacol.</source> <volume>39</volume> (<issue>3</issue>), <fpage>1115</fpage>&#x2013;<lpage>1121</lpage>. <pub-id pub-id-type="doi">10.1016/j.etap.2015.04.007</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Machado</surname>
<given-names>M. V.</given-names>
</name>
<name>
<surname>Cortez-Pinto</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Non-alcoholic fatty liver disease: what the clinician needs to know</article-title>. <source>World J. Gastroenterol.</source> <volume>20</volume> (<issue>36</issue>), <fpage>12956</fpage>&#x2013;<lpage>12980</lpage>. <pub-id pub-id-type="doi">10.3748/wjg.v20.i36.12956</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mahale</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Prabhu</surname>
<given-names>S. D.</given-names>
</name>
<name>
<surname>Nachiappan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fernandes</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ullal</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Clinical relevance of reporting fatty liver on ultrasound in asymptomatic patients during routine health checkups</article-title>. <source>J. Int. Med. Res.</source> <volume>46</volume> (<issue>11</issue>), <fpage>4447</fpage>&#x2013;<lpage>4454</lpage>. <pub-id pub-id-type="doi">10.1177/0300060518793039</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marateb</surname>
<given-names>H. R.</given-names>
</name>
<name>
<surname>Mansourian</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Faghihimani</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Amini</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Farina</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>A hybrid intelligent system for diagnosing microalbuminuria in type 2 diabetes patients without having to measure urinary albumin</article-title>. <source>Comput. Biol. Med.</source> <volume>45</volume>, <fpage>34</fpage>&#x2013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2013.11.006</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Markar</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Chin</surname>
<given-names>S. T.</given-names>
</name>
<name>
<surname>Romano</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wiggins</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Antonowicz</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Paraskeva</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Breath volatile organic compound profiling of colorectal cancer using selected ion flow-tube mass spectrometry</article-title>. <source>Ann. Surg.</source> <volume>269</volume> (<issue>5</issue>), <fpage>903</fpage>&#x2013;<lpage>910</lpage>. <pub-id pub-id-type="doi">10.1097/SLA.0000000000002539</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maurice</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Manousou</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Non-alcoholic fatty liver disease</article-title>. <source>Clin. Med.</source> <volume>18</volume> (<issue>3</issue>), <fpage>245</fpage>&#x2013;<lpage>250</lpage>. <pub-id pub-id-type="doi">10.7861/clinmedicine.18-3-245</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Meng</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Ke</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>Z. M.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>A Communication- efficient parallel algorithm for decision tree</article-title>, <comment>arXiv preprint arXiv:1611.01276. Adv</comment>. <pub-id pub-id-type="doi">10.48550/arXiv.1611.01276</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Miller</surname>
<given-names>D. D.</given-names>
</name>
<name>
<surname>Brown</surname>
<given-names>E. W.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Artificial intelligence in medical practice: the question to the answer?</article-title> <source>Am. J. Med.</source> <volume>131</volume> (<issue>2</issue>), <fpage>129</fpage>&#x2013;<lpage>133</lpage>. <pub-id pub-id-type="doi">10.1016/j.amjmed.2017.10.035</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moghimi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Marchetto</surname>
<given-names>P. M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Ensemble feature selection for plant phenotyping: a journey from hyperspectral to multispectral imaging</article-title>. <source>IEEE Access</source> <volume>6</volume>, <fpage>56870</fpage>&#x2013;<lpage>56884</lpage>. <pub-id pub-id-type="doi">10.1109/access.2018.2872801</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nakasone</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Binh</surname>
<given-names>P. N.</given-names>
</name>
<name>
<surname>Yamazaki</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Tanaka</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sakamoto</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Ashizawa</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Association between serum high-molecular-weight adiponectin level and the severity of chronic graft-versus-host disease in allogeneic stem cell transplantation recipients</article-title>. <source>Blood</source> <volume>117</volume> (<issue>12</issue>), <fpage>3469</fpage>&#x2013;<lpage>3472</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2010-10-316109</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nomiyama</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Uehara</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Miyauchi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Imamiya</surname>
<given-names>S .</given-names>
</name>
<name>
<surname>Tanaka</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Seki</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Causal relationship between a case of severe hepatic dysfunction and low exposure concentrations of N,N- dimethylformamide in the synthetics industry</article-title>. <source>Ind. Health</source> <volume>39</volume> (<issue>1</issue>), <fpage>33</fpage>&#x2013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.2486/indhealth.39.33</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nusinovici</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Tham</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Chak Yan</surname>
<given-names>M. Y.</given-names>
</name>
<name>
<surname>Wei Ting</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sabanayagam</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Logistic regression was as good as machine learning for predicting major chronic diseases</article-title>. <source>J. Clin. Epidemiol.</source> <volume>122</volume>, <fpage>56</fpage>&#x2013;<lpage>69</lpage>. <pub-id pub-id-type="doi">10.1016/j.jclinepi.2020.03.002</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pes</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Ensemble feature selection for high-dimensional data: a stability analysis across multiple domains</article-title>. <source>Neural Comput. Appl.</source> <volume>32</volume>, <fpage>5951</fpage>&#x2013;<lpage>5973</lpage>. <pub-id pub-id-type="doi">10.1007/s00521-019-04082-3</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Piccinino</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Sagnelli</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Pasquale</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Giusti</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>1986</year>). <article-title>Complications following percutaneous liver biopsy. A multicentre retrospective study on 68,276 biopsies</article-title>. <source>J. Hepatol.</source> <volume>2</volume> (<issue>2</issue>), <fpage>165</fpage>&#x2013;<lpage>173</lpage>. <pub-id pub-id-type="doi">10.1016/s0168-8278(86)80075-7</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pooya</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Blaise</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Garcia</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Giudicelli</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Alberto</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Gu&#xe9;ant-Rodriguez</surname>
<given-names>R. M.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Methyl donor deficiency impairs fatty acid oxidation through PGC-1&#x3b1; hypomethylation and decreased ER-&#x3b1;, ERR-&#x3b1;, and HNF-4&#x3b1; in the rat liver</article-title>. <source>J. hepatology</source> <volume>57</volume> (<issue>2</issue>), <fpage>344</fpage>&#x2013;<lpage>351</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhep.2012.03.028</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Powell</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Swet</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Kennedy</surname>
<given-names>K. L.</given-names>
</name>
<name>
<surname>Huynh</surname>
<given-names>T. T.</given-names>
</name>
<name>
<surname>McKillop</surname>
<given-names>I. H.</given-names>
</name>
<name>
<surname>Evans</surname>
<given-names>S. L.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Resveratrol attenuates hypoxic injury in a primary hepatocyte model of hemorrhagic shock and resuscitation</article-title>. <source>J. Trauma Acute Care Surg.</source> <volume>76</volume> (<issue>2</issue>), <fpage>409</fpage>&#x2013;<lpage>417</lpage>. <pub-id pub-id-type="doi">10.1097/TA.0000000000000096</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="web">
<collab>pubchem</collab> (<year>2025</year>). <article-title>Butyl 2-methylbutyrate</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://pubchem.ncbi.nlm.nih.gov/compound/Butyl-2-methylbutyrate#section=Associated-Disorders-and-Diseases">https://pubchem.ncbi.nlm.nih.gov/compound/Butyl-2-methylbutyrate&#x23;section&#x3d;Associated-Disorders-and-Diseases</ext-link>.</comment>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Quek</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chan</surname>
<given-names>K. E.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>Z. Y.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Lim</surname>
<given-names>W. H.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Global prevalence of non-alcoholic fatty liver disease and non-alcoholic steatohepatitis in the overweight and Obese population: a systematic review and meta-analysis</article-title>. <source>Lancet Gastroenterol. Hepatol.</source> <volume>8</volume> (<issue>1</issue>), <fpage>20</fpage>&#x2013;<lpage>30</lpage>. <pub-id pub-id-type="doi">10.1016/S2468-1253(22)00317-X</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Quinlan</surname>
<given-names>J. R.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Data mining tools See5 and C5.0</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="http://www.rulequest.com/see5-info.htML">http://www.rulequest.com/see5-info.htML</ext-link> (Accessed on August 3, 2020)</comment>.</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raman</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ahmed</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Gillevet</surname>
<given-names>P. M.</given-names>
</name>
<name>
<surname>Probert</surname>
<given-names>C. S.</given-names>
</name>
<name>
<surname>Ratcliffe</surname>
<given-names>N. M.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Fecal microbiome and volatile organic compound metabolome in obese humans with nonalcoholic fatty liver disease</article-title>. <source>Clin. Gastroenterol. Hepatol.</source> <volume>11</volume> (<issue>7</issue>), <fpage>868</fpage>&#x2013;<lpage>75.e753</lpage>. <pub-id pub-id-type="doi">10.1016/j.cgh.2013.02.015</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ratiu</surname>
<given-names>I. A.</given-names>
</name>
<name>
<surname>Ligor</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Bocos-Bintintan</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Mayhew</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Buszewski</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Volatile organic compounds in exhaled breath as fingerprints of lung cancer, asthma and COPD</article-title>. <source>J. Clin. Med.</source> <volume>10</volume> (<issue>1</issue>), <fpage>32</fpage>. <pub-id pub-id-type="doi">10.3390/jcm10010032</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="book">
<collab>R Core Team</collab> (<year>2017</year>). <source>R: a language and environment for statistical computing</source>. <publisher-loc>Vienna, Austria</publisher-loc>: <publisher-name>R Foundation for Statistical Computing</publisher-name>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="http://www.R-project.org">http://www.R-project.org</ext-link> (Accessed on January 21, 2023)</comment>.</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Redlich</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Beckett</surname>
<given-names>W. S.</given-names>
</name>
<name>
<surname>Sparer</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Barwick</surname>
<given-names>K. W.</given-names>
</name>
<name>
<surname>Riely</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Miller</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>1988</year>). <article-title>Liver disease associated with occupational exposure to the solvent dimethylformamide</article-title>. <source>Ann. Intern Med.</source> <volume>108</volume> (<issue>5</issue>), <fpage>680</fpage>&#x2013;<lpage>686</lpage>. <pub-id pub-id-type="doi">10.7326/0003-4819-108-5-680</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="book">
<collab>RI-URBANS</collab> (<year>2024</year>). &#x201c;<article-title>Research infrastructures services reinforcing air quality monitoring capacities in European Urban and industrial AreaS</article-title>&#x201d;. <publisher-name>European Union</publisher-name>: <publisher-name>RI-URBANS</publisher-name>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://riurbans.eu/wp-content/uploads/2024/07/ST5_VOCs.pdf">https://riurbans.eu/wp-content/uploads/2024/07/ST5_VOCs.pdf</ext-link>.</comment>
</citation>
</ref>
<ref id="B73">
<citation citation-type="web">
<collab>RStudio Team</collab> (<year>2015</year>). <article-title>RStudio: integrated development environment for R; RStudio: boston, MA, USA</article-title>. <comment>Available online at:: <ext-link ext-link-type="uri" xlink:href="http://www.rstudio.com/">http://www.rstudio.com/</ext-link> (Accessed on January 21, 2023)</comment>.</citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Samudrala</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Lammers</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Mandon</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Blanchet</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Schreuder</surname>
<given-names>T. H.</given-names>
</name>
<name>
<surname>Hopman</surname>
<given-names>M. T.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Breath acetone to monitor life style interventions in field conditions: an exploratory study</article-title>. <source>Obesity</source> <volume>22</volume> (<issue>4</issue>), <fpage>980</fpage>&#x2013;<lpage>983</lpage>. <pub-id pub-id-type="doi">10.1002/oby.20696</pub-id>
</citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Satapathy</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Kuwajima</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Nadelson</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Atiq</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Sanyal</surname>
<given-names>A. J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Drug-induced fatty liver disease: an overview of pathogenesis and management</article-title>. <source>Ann. hepatology</source> <volume>14</volume> (<issue>6</issue>), <fpage>789</fpage>&#x2013;<lpage>806</lpage>. <pub-id pub-id-type="doi">10.5604/16652681.1171749</pub-id>
</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scandiffio</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bonzano</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Cottone</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Shrestha</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bossi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>De Marchis</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Beta-caryophyllene modifies intracellular lipid composition in a cell model of hepatic steatosis by acting through CB2 and PPAR receptors</article-title>. <source>Int. J. Mol. Sci.</source> <volume>24</volume> (<issue>7</issue>), <fpage>6060</fpage>. <pub-id pub-id-type="doi">10.3390/ijms24076060</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shaffie</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Soliman</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Eledkawy</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>X. A.</given-names>
</name>
<name>
<surname>Nantz</surname>
<given-names>M. H.</given-names>
</name>
<name>
<surname>Giridharan</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Lung cancer diagnosis system based on volatile organic compounds (VOCs) profile measured in exhaled breath in review profile measured in exhaled breath</article-title>. <source>Appl. Sci.</source> <volume>12</volume> (<issue>14</issue>), <fpage>7165</fpage>. <pub-id pub-id-type="doi">10.3390/app12147165</pub-id>
</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Solga</surname>
<given-names>S. F.</given-names>
</name>
<name>
<surname>Alkhuraishe</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cope</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Tabesh</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Clark</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Torbenson</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>Breath biomarkers and non-alcoholic fatty liver disease: preliminary observations</article-title>. <source>Biomarkers</source> <volume>11</volume> (<issue>2</issue>), <fpage>174</fpage>&#x2013;<lpage>183</lpage>. <pub-id pub-id-type="doi">10.1080/13547500500421070</pub-id>
</citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>&#x160;pan&#x11b;l</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Quantification of volatile metabolites in exhaled breath by selected ion flow tube mass spectrometry, SIFT-MS</article-title>. <source>Clin. Mass Spectrom.</source> <volume>16</volume>, <fpage>18</fpage>&#x2013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.1016/j.clinms.2020.02.001</pub-id>
</citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sukaram</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Apiparakoon</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tiyarattanachai</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ariyaskul</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Kulkraisri</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Marukatat</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>VOCs from exhaled breath for the diagnosis of hepatocellular carcinoma</article-title>. <source>Diagnostics</source> <volume>13</volume> (<issue>2</issue>), <fpage>257</fpage>. <pub-id pub-id-type="doi">10.3390/diagnostics13020257</pub-id>
</citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tharwat</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Classification assessment methods</article-title>. <source>Appl. Comput. Inf.</source> <volume>17</volume>, <fpage>168</fpage>&#x2013;<lpage>192</lpage>. <pub-id pub-id-type="doi">10.1016/j.aci.2018.08.003</pub-id>
</citation>
</ref>
<ref id="B82">
<citation citation-type="web">
<collab>The good scents company</collab> (<year>2025</year>). <article-title>4-methyloctanoic acid</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="http://www.thegoodscentscompany.com/data/rw1036901.htML">http://www.thegoodscentscompany.com/data/rw1036901.htML</ext-link>.</comment>
</citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thompson</surname>
<given-names>M. G.</given-names>
</name>
<name>
<surname>Incha</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Pearson</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sharpless</surname>
<given-names>W. A.</given-names>
</name>
<name>
<surname>Eiben</surname>
<given-names>C. B.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Fatty acid and alcohol metabolism in Pseudomonas putida: functional analysis using random barcode transposon sequencing</article-title>. <source>Applied and Environmental Microbiology</source> <volume>86</volume> (<issue>21</issue>), <fpage>e01665</fpage>&#x2013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.1128/AEM.01665-20</pub-id>
</citation>
</ref>
<ref id="B84">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tomer</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Sharma</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Detecting IoT attacks using an ensemble machine learning model</article-title>. <source>Future Internet</source> <volume>14</volume> (<issue>4</issue>), <fpage>102</fpage>. <pub-id pub-id-type="doi">10.3390/fi14040102</pub-id>
</citation>
</ref>
<ref id="B85">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tsou</surname>
<given-names>P. H.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Z. L.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>H. C.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>S. K.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Exploring volatile organic compounds in breath for high-accuracy prediction of lung cancer</article-title>. <source>Cancers</source> <volume>13</volume> (<issue>6</issue>), <fpage>1431</fpage>. <pub-id pub-id-type="doi">10.3390/cancers13061431</pub-id>
</citation>
</ref>
<ref id="B86">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tuli</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Basumatary</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Gill</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Kahani</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Arya</surname>
<given-names>R. C.</given-names>
</name>
<name>
<surname>Wander</surname>
<given-names>G. S.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>HealthFog: an ensemble deep learning based smart healthcare system for automatic diagnosis of heart diseases in integrated IoT and fog computing environments</article-title>. <source>Future Gener. Comput. Syst.</source> <volume>104</volume>, <fpage>187</fpage>&#x2013;<lpage>200</lpage>. <pub-id pub-id-type="doi">10.1016/j.future.2019.10.043</pub-id>
</citation>
</ref>
<ref id="B87">
<citation citation-type="book">
<collab>U.S. Environmental Protection Agency</collab> (<year>2014</year>). <source>Volatile organic compounds in various sample matrices using equilibrium headspace analysis</source>. <publisher-loc>Pennsylvania Avenue, NW</publisher-loc>: <publisher-name>U.S. Environmental Protection Agency</publisher-name>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.epa.gov/sites/default/files/2015-12/documents/5021a.pdf">https://www.epa.gov/sites/default/files/2015-12/documents/5021a.pdf</ext-link>.</comment>
</citation>
</ref>
<ref id="B88">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Varga</surname>
<given-names>Z. V.</given-names>
</name>
<name>
<surname>Matyas</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Erdelyi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Cinar</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Nieri</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chicca</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>&#x3b2;-Caryophyllene protects against alcoholic steatohepatitis by attenuating inflammation and metabolic dysregulation in mice</article-title>. <source>Br. J. Pharmacol.</source> <volume>175</volume> (<issue>2</issue>), <fpage>320</fpage>&#x2013;<lpage>334</lpage>. <pub-id pub-id-type="doi">10.1111/bph.13722</pub-id>
</citation>
</ref>
<ref id="B89">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname>
<given-names>Y. T.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>P. Y.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>C. Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>H. J.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J. S.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Non-alcoholic fatty liver disease among patients with sleep disorders: a nationwide study of Taiwan</article-title>. <source>BMC Gastroenterol.</source> <volume>20</volume> (<issue>1</issue>), <fpage>32</fpage>. <pub-id pub-id-type="doi">10.1186/s12876-020-1178-7</pub-id>
</citation>
</ref>
<ref id="B90">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wilson</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Oba</surname>
<given-names>P. M.</given-names>
</name>
<name>
<surname>Koziol</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Applegate</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Soto-Diaz</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Steelman</surname>
<given-names>A. J.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Effects of a <italic>Saccharomyces cerevisiae</italic> fermentation product-supplemented diet on circulating immune cells and oxidative stress markers of dogs</article-title>. <source>J. Anim. Sci.</source> <volume>100</volume> (<issue>9</issue>), <fpage>skac245</fpage>. <pub-id pub-id-type="doi">10.1093/jas/skac245</pub-id>
</citation>
</ref>
<ref id="B91">
<citation citation-type="web">
<collab>World Health Organizatiom-INTERNATIONAL PROGRAMME ON CHEMICAL SAFETY</collab> (<year>1990</year>). <article-title>Environmental health criteria 103 2-Propanol</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.inchem.org/documents/ehc/ehc/ehc103.htm">https://www.inchem.org/documents/ehc/ehc/ehc103.htm</ext-link>.</comment>
</citation>
</ref>
<ref id="B92">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Tsai</surname>
<given-names>S. P.</given-names>
</name>
<name>
<surname>Tsao</surname>
<given-names>C. K.</given-names>
</name>
<name>
<surname>Chiu</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Tsai</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>P. J.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Cohort profile: the Taiwan MJ cohort: half a million Chinese with repeated health surveillance data</article-title>. <source>Int. J. Epidemiol.</source> <volume>46</volume> (<issue>6</issue>), <fpage>1744</fpage>&#x2013;<lpage>1744g</lpage>. <pub-id pub-id-type="doi">10.1093/ije/dyw282</pub-id>
</citation>
</ref>
<ref id="B93">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yamaguchi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>McCall</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>X. X.</given-names>
</name>
<name>
<surname>Pandey</surname>
<given-names>S. K.</given-names>
</name>
<etal/>
</person-group> (<year>2007</year>). <article-title>Inhibiting triglyceride synthesis improves hepatic steatosis but exacerbates liver damage and fibrosis in Obese mice with nonalcoholic steatohepatitis</article-title>. <source>Hepatology</source> <volume>45</volume> (<issue>6</issue>), <fpage>1366</fpage>&#x2013;<lpage>1374</lpage>. <pub-id pub-id-type="doi">10.1002/hep.21655</pub-id>
</citation>
</ref>
<ref id="B94">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ye</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xiong</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Comparison of machine learning methods and conventional logistic regressions for predicting gestational diabetes using routine clinical data: a retrospective cohort study</article-title>. <source>J. Diabetes Res.</source> <volume>2020</volume>, <fpage>4168340</fpage>. <pub-id pub-id-type="doi">10.1155/2020/4168340</pub-id>
</citation>
</ref>
<ref id="B95">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Younossi</surname>
<given-names>Z. M.</given-names>
</name>
<name>
<surname>Koenig</surname>
<given-names>A. B.</given-names>
</name>
<name>
<surname>Abdelatif</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Fazel</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Henry</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wymer</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Global epidemiology of nonalcoholic fatty liver disease-meta-analytic assessment of prevalence, incidence, and outcomes</article-title>. <source>Hepatology</source> <volume>64</volume> (<issue>1</issue>), <fpage>73</fpage>&#x2013;<lpage>84</lpage>. <pub-id pub-id-type="doi">10.1002/hep.28431</pub-id>
</citation>
</ref>
<ref id="B96">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Khas</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Bai</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Ao</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Transcriptome analysis reveals candidate genes of the synthesis of branched-chain fatty acids related to mutton flavor in the lamb liver using Allium mongolicum regel extract</article-title>. <source>J. Animal Sci.</source> <volume>100</volume> (<issue>9</issue>), <fpage>skac256</fpage>. <pub-id pub-id-type="doi">10.1093/jas/skac256</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>