<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Immunol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Immunology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Immunol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1664-3224</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fimmu.2026.1775236</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Occupational silica exposure drives systemic immune dysregulation and tumor microenvironment susceptibility: evidence from a real-world study</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Hao</surname><given-names>Han</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Zhang</surname><given-names>Zaitian</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Zhang</surname><given-names>Hui</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2974875/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Luo</surname><given-names>Qiang</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2168769/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Zhao</surname><given-names>Jingyi</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1437223/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes">
<name><surname>Baishan</surname><given-names>Liu</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2339231/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>School of Public Health, North China University of Science and Technology</institution>, <city>Tangshan</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>Department of Orthopedics, First Affiliated Hospital of Hunan University of Medicine</institution>, <city>Huaihua</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff3"><label>3</label><institution>Department of Rheumatology and Immunology, Children&#x2019;s Hospital of Chongqing Medical University</institution>, <city>Chongqing</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff4"><label>4</label><institution>Institute of Traditional Chinese Medicine, Chengde Medical University</institution>, <city>Chengde</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff5"><label>5</label><institution>Department of Respiratory, Jiulongpo District People&#x2019;s Hospital of Chongqing</institution>, <city>Chongqing</city>,&#xa0;<country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Liu Baishan, <email xlink:href="mailto:spblbs@163.com">spblbs@163.com</email></corresp>
<fn fn-type="equal" id="fn003">
<label>&#x2020;</label>
<p>These authors have contributed equally to this work</p></fn>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-02">
<day>02</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>17</volume>
<elocation-id>1775236</elocation-id>
<history>
<date date-type="received">
<day>25</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>13</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>04</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Hao, Zhang, Zhang, Luo, Zhao and Baishan.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Hao, Zhang, Zhang, Luo, Zhao and Baishan</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-02">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Occupational exposure to carcinogenic dusts such as silica is a well-established risk factor for cancer. However, the molecular mechanisms linking early exposure to tumor-promoting microenvironmental changes remain poorly defined. Emerging evidence suggests that chronic immune dysregulation and remodeling of the tumor microenvironment (TME) may serve as critical intermediates.</p>
</sec>
<sec>
<title>Methods</title>
<p>We analyzed occupational health data from 5,482 industrial workers in Anhui Province, China. Explainable machine learning models were constructed using exposure profiles and hematological immune parameters to predict carcinoembryonic antigen (CEA) positivity, with feature contributions interpreted via SHAP values. Experimental validation involved silica-stimulated THP-1 monocytes and colorectal cancer (CRC) cell lines to assess inflammatory activation and paracrine regulation of CEA. Silica- and CRC-associated genes were integrated from public databases to construct protein&#x2013;protein interaction networks, identify hub genes, and evaluate prognostic significance using TCGA and GSE39582 datasets. Single-cell RNA sequencing (scRNA-seq) analysis was used to resolve cell type&#x2013;specific expression patterns.</p>
</sec>
<sec>
<title>Results</title>
<p>Among 14 algorithms tested, CatBoost exhibited the highest predictive performance for CEA positivity. SHAP analysis highlighted the monocyte-to-lymphocyte ratio and silica exposure as dominant contributors. Mediation analysis confirmed that systemic inflammation partially mediated the silica&#x2013;CEA association. <italic>In vitro</italic>, silica activated NF-&#x3ba;B&#x2013;dependent IL-6 secretion in THP-1 cells, and conditioned media dose-dependently upregulated CEA expression in CRC cells&#x2014;an effect attenuated by NF-&#x3ba;B inhibition or IL-6 neutralization. Multi-omics analysis identified 42 overlapping genes linking silica exposure to CRC, with enrichment in cytokine signaling, adhesion, and matrix remodeling pathways. A hub gene&#x2013;based risk score was significantly associated with overall survival. scRNA-seq analysis revealed elevated expression of inflammation- and adhesion-related genes in tumor-associated macrophages.</p>
</sec>
<sec>
<title>Conclusions</title>
<p>Occupational silica exposure induces macrophage-driven inflammatory signaling that promotes early CEA elevation and TME remodeling. Integrating machine learning with experimental and multi-omics validation provides a translational framework for identifying exposure-responsive biomarkers and immune-related cancer risk in occupational settings.</p>
</sec>
</abstract>
<kwd-group>
<kwd>carcinoembryonic antigen (CEA)</kwd>
<kwd>occupational exposure</kwd>
<kwd>silica dust</kwd>
<kwd>tumor microenvironment</kwd>
<kwd>tumor-associated macrophages</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. The Science and Technology Program of Chengde (Grant No. 202406A017), and the Innovation and Entrepreneurship Training Plan for Provincial College Students of Chengde Medical University 4 (No. 2024023), open project supported by Hebei (Chengde) Industrial Technology Institute of Chinese Medicinal Materials (No. CYKF202302).</funding-statement>
</funding-group>
<counts>
<fig-count count="8"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="34"/>
<page-count count="16"/>
<word-count count="8828"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Cancer Immunity and Immunotherapy</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Occupational carcinogens are an important but historically unrecognized component of the global cancer burden (<xref ref-type="bibr" rid="B1">1</xref>). With the increasing specialization and diversification of industrial chemicals, workers are exposed to more and more new complex toxins, which has raised concerns about the long-term health consequences of occupational exposure (<xref ref-type="bibr" rid="B2">2</xref>). Epidemiological evidence suggests that approximately 2% -8% of cancers can be attributed to occupational exposure, highlighting its significant impact on public health (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B3">3</xref>). In 2000, the World Health Organization&#x2019;s Comparative Risk Assessment (CRA) project provided the first global systematic estimate of the cancer burden caused by occupational exposure (<xref ref-type="bibr" rid="B1">1</xref>). On this basis, the International Agency for Research on Cancer (IARC) classifies nearly 200 carcinogens as Group 1 or 2A human carcinogens, many of which are commonly present in work environments (<xref ref-type="bibr" rid="B4">4</xref>).</p>
<p>Common occupational carcinogens include asbestos, crystalline silica, sawdust, polycyclic aromatic hydrocarbons, heavy metals, aromatic amines, organic solvents, and environmental pollutants such as formaldehyde and radon (<xref ref-type="bibr" rid="B4">4</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>). These drugs are causally associated with a range of malignant tumors, including lung cancer, mesothelioma, bladder cancer, leukemia, and skin cancer (<xref ref-type="bibr" rid="B5">5</xref>&#x2013;<xref ref-type="bibr" rid="B7">7</xref>). Importantly, the carcinogenic risk associated with occupational exposure not only reflects the inherent genetic toxicity of individual factors, but also factors such as the duration and intensity of exposure, co exposure, and long incubation periods (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B8">8</xref>). Occupational exposure occurs in different industries, including rubber and pigment manufacturing, textile production, mining, painting, insulation, and metal processing (<xref ref-type="bibr" rid="B5">5</xref>). Due to the fact that many occupational cancers only appear decades after initial exposure, early detection and attribution remain significant challenges (<xref ref-type="bibr" rid="B8">8</xref>). It is estimated that approximately 150000 deaths worldwide each year are related to historical occupational exposure to some recognized carcinogens (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B3">3</xref>). Despite regulatory measures such as bans, exposure restrictions, and monitoring systems, occupational cancer continues to exacerbate the global cancer burden and requires ongoing mechanism investigations and policy attention (<xref ref-type="bibr" rid="B5">5</xref>).</p>
<p>Traditional occupational cancer research emphasizes direct genetic toxicity mechanisms, including DNA damage and mutation accumulation caused by carcinogens (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B9">9</xref>). However, new evidence suggests that non genotoxic mechanisms also play a critical role in tumorigenesis by shaping the local tissue environment (<xref ref-type="bibr" rid="B10">10</xref>). Long term exposure to substances such as asbestos, benzo [a] pyrene, polycyclic aromatic hydrocarbons, and certain metals can cause persistent inflammation, oxidative stress, and immune dysfunction, leading to abnormal activation of stromal cells, immune cells, and endothelial cells (<xref ref-type="bibr" rid="B9">9</xref>&#x2013;<xref ref-type="bibr" rid="B11">11</xref>). These reactions contribute to the formation of a tumor microenvironment (TME) characterized by immune evasion, angiogenesis, extracellular matrix remodeling, and metabolic reprogramming (<xref ref-type="bibr" rid="B10">10</xref>&#x2013;<xref ref-type="bibr" rid="B12">12</xref>). Different exposure types may drive specific TME phenotypes; For example, the accumulation of silica and asbestos in lung tissue is associated with polarization of M2 macrophages and activation of fibroblasts, promoting fibrosis and lung cancer progression (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B13">13</xref>), while exposure to benzene and aromatic amines is associated with immune failure and epigenetic changes in bone marrow and bladder tissue, promoting an environment favorable for the development of leukemia or urothelial carcinoma (<xref ref-type="bibr" rid="B14">14</xref>).</p>
<p>In this context, identifying circulating biomarkers that reflect early exposure effects and TME remodeling has become a priority in occupational cancer research (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B10">10</xref>). Carcinoembryonic antigen (CEA) is one of the earliest discovered and most widely used tumor markers, showing sensitivity and clinical relevance in various cancers associated with occupational exposure (<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B16">16</xref>). CEA levels are generally low in normal adult tissues, but increase in epithelial malignancies such as lung cancer, gastric cancer, pancreatic cancer and bladder cancer; Its expression is not only related to tumor burden, but also to tumor immune microenvironment and tumor heterogeneity (<xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B17">17</xref>).</p>
<p>More and more evidence suggests that elevated CEA may be an early indicator of chronic inflammatory response and transformation processes in occupational exposure populations, and may reflect dynamic changes in TME caused by exposure (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B17">17</xref>). For example, exposure to asbestos or silica dust is associated with activation and M2 polarization of alveolar macrophages, which may be consistent with increased CEA expression and immunosuppressive environment (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B17">17</xref>), while benzene and its metabolites are associated with bone marrow suppression and immune failure, which is related to elevated circulating CEA (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B14">14</xref>). These findings suggest that CEA can not only serve as a static disease monitor, but also as a &#x2018;liquid sensor&#x2019; that captures the continuous process from exposure to TME regulation to malignant tumors, enabling early detection and risk stratification at the individual level (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B18">18</xref>).</p>
<p>In this context, we attempt to elucidate the relationship between occupational exposure and CEA in large worker cohorts. Firstly, we will apply interpretable machine learning to a comprehensive occupational dataset, jointly model heterogeneous exposures, quantify their contributions to CEA changes, and develop cross validated personalized risk prediction models. Secondly, guided by model insights, we conducted <italic>in vitro</italic> validation studies to investigate the biological link between key occupational exposure factors and tumorigenic microenvironment characteristics, such as macrophage activation.</p>
</sec>
<sec id="s2">
<title>Methods</title>
<p>The occupational health monitoring data comes from Anhui Province, China, including 5482 workers who participated in routine occupational health monitoring. Individuals with missing key data (CEA, immune parameters, or exposure records) were excluded. In addition, to minimize confounding, participants with a known history of malignant tumors, chronic liver diseases (e.g., cirrhosis, hepatic insufficiency), or documented acute or chronic infectious/inflammatory conditions at the time of examination were excluded based on medical records and clinician review. Workers with abnormal liver enzymes exceeding 3&#xd7; ULN were also excluded from the analysis. The exposure records in the workplace are systematically linked to standardized hematological test results, enabling a comprehensive assessment of environmental exposure and biological reactions. This study used a cross-sectional design. Each participant contributed a single record, selected from their most recent occupational health examination with complete data on exposure, blood parameters, and tumor markers.</p>
<p>Hematological parameters include platelet count, hematocrit (PCT), mean platelet volume (MPV), red blood cell count, hemoglobin concentration, mean corpuscular hemoglobin (MCH), mean corpuscular hemoglobin concentration (MCHC), and red blood cell distribution width. White blood cell related measurements include absolute counts and corresponding percentages of neutrophils, lymphocytes, monocytes, eosinophils, and basophils. In addition, composite inflammatory indicators were derived, including neutrophil to lymphocyte ratio (NLR), monocyte to lymphocyte ratio (MLR), and systemic immune inflammatory index (SII), to capture systemic inflammatory status.</p>
<p>Occupational exposure variables cover various common hazards in industrial environments. Exposure to particulate matter includes coal dust, crystalline silica dust, dust, other dust, other inorganic dust, welding fumes, cement dust, rock dust, gypsum dust, ceramic dust, limestone dust, marble dust, sawdust, plant dust, and organic dust. Gas exposure includes sulfur dioxide, nitrogen dioxide, carbon monoxide, carbon dioxide, nitrogen oxides, hydrogen sulfide, ammonia, methane, hydrogen cyanide, hydrogen, ozone, chlorine, and hydrogen chloride. Organic solvents and industrial chemicals include benzene, toluene, xylene, naphthalene, phenol, vinyl chloride, dichloroethane, methanol, ethanol, propanol, isopropanol, acetic acid, methyl acetate, ethyl acetate, ethylene glycol, pyridine, ether, dimethyl ether, dimethyl sulfate, and methylamine, as well as hydrazine, hydrazine hydrate, formaldehyde, acetylene, propane, and phosphine. Corrosive and reactive substances include sulfur trioxide, sulfuric acid, hydrochloric acid, nitric acid, sodium hydroxide, potassium hydroxide, sodium carbonate, sodium hypochlorite, polyacrylamide, hydrogen peroxide, disodium hydrogen phosphate, and ammonium sulfate. Heavy metals and highly toxic compounds include mercury iodide, trinitrophenol (picric acid), lead thiocyanate, sodium nitrite, and potassium antimony tartrate. It also recorded complex industrial mixtures, including coke oven emissions and coal tar. Physical occupational hazards include noise, high and low temperatures, arm vibration, ultraviolet radiation, and power frequency electric fields. Acid exposure, alkali exposure, and acid mist or anhydride exposure are recorded as independent occupational categories. Occupational exposure classification was based on a combination of workplace environmental monitoring data and individual job title or position records, as maintained by enterprise occupational health archives. Airborne concentrations of respirable dust and relevant toxicants (e.g., silica, benzene) were assessed through routine annual workplace sampling, and each worker&#x2019;s exposure status was determined using a 3-year rolling average where available. Exposure levels were evaluated against the national occupational exposure limits (OELs) defined in GBZ/T 229.1&#x2013;2010 (China). In cases where enterprises implemented stricter internal thresholds, these enterprise-specific limits were adopted accordingly. Workers were categorized as &#x2018;exceeding OEL&#x2019; if their exposure exceeded the applicable threshold based on their job function and monitored concentration.</p>
<p>All hematological parameters were measured using standardized protocols under routine occupational health examinations conducted by enterprise-affiliated medical centers. Certified clinical laboratories used automated hematology analyzers with internal and external quality controls. Environmental exposure monitoring followed the national occupational hygiene standard GBZ/T 192.1&#x2013;2007.</p>
<p>According to the official occupational health records of the company, all occupational exposure variables are encoded as binary indicators (yes/no). Only when long-term workplace monitoring confirms that the exposure level exceeds the corresponding national occupational exposure limit during the monitoring period, will workers be classified as contacts. This binary classification reflects a regulatory based exposure assessment framework that does not capture quantitative exposure intensity.</p>
<p>In addition to the occupational exposure variables and hematological parameters mentioned above, CEA is also listed as an exposure related biomarker. The serum CEA level is obtained from routine occupational health examinations and converted into a binary variable based on the clinical reference threshold of the enterprise. Individuals with CEA values exceeding the upper limit of the normal reference range are classified as CEA positive, while individuals within the reference range are classified as CEA negative. Consistent with the coding strategy used for occupational exposure, CEA is considered a binary variable in all subsequent analyses. Adopting this binary transformation to enhance robustness, reduce the influence of extreme values, and maintain consistency with the classification structure of occupational health monitoring data. CEA positivity was defined using a threshold of 5.0 ng/mL, consistent with the reference range applied by the enterprise clinical laboratory at the time of routine occupational health screening. This threshold aligns with commonly used cut-offs in clinical settings and laboratory assay guidelines. Due to data constraints, the same threshold was applied for all participants regardless of gender or smoking status. While some studies suggest adjusted ranges for specific populations, we treated CEA as a binary outcome using a unified standard and acknowledge this simplification as a study limitation.</p>
<p>This study has been reviewed and approved by the Ethics Committee of North China Institute of Science and Technology (Approval No.: 2024280).</p>
<sec id="s2_1">
<title>Explainable machine learning model</title>
<p>We utilized occupational health monitoring data from 5482 workers in a large industrial enterprise in Anhui Province, China, to construct a comprehensive analysis framework for studying the relationship between complex occupational exposure and CEA status. All variables recorded in the occupational health monitoring system are included as candidate features, thereby minimizing prior selection bias to the greatest extent possible. These variables encompass hematological parameters, composite inflammatory indices, and a wide range of occupational exposure indicators, enabling multi-level characterization of host physiology and environmental burden (<xref ref-type="bibr" rid="B19">19</xref>).</p>
<p>Hematological measurements capture the global hematopoietic and immune status, including platelet, red blood cell, and white blood cell indices, as well as the relative composition of major white blood cell subgroups. To further summarize systemic immune activation, derived inflammatory markers (NLR, MLR, and SII) were integrated to reflect chronic low-grade inflammation and immune imbalance.</p>
<p>Occupational exposure data covers a highly heterogeneous spectrum of hazards typical of industrial environments. Exposure to particulate matter includes coal dust, crystalline silica, and various inorganic and organic dust, reflecting long-term inhalation risks associated with mining, building materials, and manufacturing processes. Exposure to gaseous and inorganic chemicals includes sulfur and nitrogen oxides, carbon monoxide and carbon dioxide, hydrogen sulfide, ammonia, methane, ozone, chlorine, and related compounds, representing combustion related emissions and confined space exposure. Organic solvents and industrial chemicals encompass aromatic hydrocarbons, halogenated compounds, alcohols, ethers, esters, and other reactive intermediates commonly found in chemical production and material processing. In addition, the dataset also records occupational exposure to corrosive substances, highly toxic substances, and complex industrial mixtures such as coke oven emissions and coal tar. In addition to chemical and particulate hazards, occupational health monitoring systems also systematically record physical stress factors, including noise, extreme heat, arm vibration, ultraviolet radiation, and power frequency electric fields, which constitute sustained non chemical stress factors that can disrupt physiological homeostasis.</p>
<p>A total of 14 algorithms were implemented, covering different method families, including tree based ensemble models (random forest, gradient enhancement, adaptive enhancement, LightGBM, CatBoost), linear and regression based methods (logistic regression, LASSO, partial least squares), kernel and distance based methods (support vector machine with kernel function, k-nearest neighbor), probability and discriminant models (naive Bayes, discriminant analysis), and neural networks (multilayer perceptron). The dataset is randomly divided into a training set (70%) and a testing set (30%). Optimize hyperparameters through 5-fold cross validation using Bayesian optimization (Hyperopt). Evaluate model performance through sensitivity, specificity, and area under the operating characteristic curve (AUC) of the subjects (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B21">21</xref>). To evaluate robustness, 1000 guided resampling iterations were conducted to obtain the distribution of sensitivity and AUC, and to compare model performance.</p>
<p>Prior to model training, we addressed several key data processing considerations to ensure robustness and fairness. First, given the moderate imbalance between CEA-positive and CEA-negative cases, we applied class weighting schemes for algorithms that support weighted loss functions (e.g., CatBoost and logistic regression), and used stratified sampling throughout training and evaluation steps to maintain representative class distributions.</p>
<p>Second, we evaluated missingness across all features. Variables with less than 5% missing values were imputed using the mean for continuous variables and the mode for categorical variables, while features with greater than 20% missingness were excluded from modeling.</p>
<p>Lastly, during the 1000 iterations of guided resampling, we implemented stratified resampling to preserve the original CEA class proportions across both training and test subsets. This approach minimized bias introduced by artificial class distributions and supported reliable performance comparison across models.</p>
<p>To enhance interpretability, we applied SHAP to quantify the marginal contribution of each feature and characterize potential non-linear exposure&#x2013;response relationships. Model interpretability was visualized through SHAP summary plots (including beeswarm and bar plots to display global feature importance and direction of effects) and dependence plots (to illustrate non-linear patterns and potential feature interactions).</p>
</sec>
<sec id="s2_2">
<title>Cell lines and culture conditions</title>
<p>Human monocytic THP-1 cells were cultured in RPMI-1640 medium (Gibco, Thermo Fisher Scientific) supplemented with 10% fetal bovine serum (FBS; Gibco) and 1% penicillin&#x2013;streptomycin (100 U/mL penicillin and 100 &#x3bc;g/mL streptomycin; Gibco). Human colorectal cancer (CRC) cell lines HT29 and Caco-2 were maintained in high-glucose DMEM (Gibco) containing 10% FBS and 1% penicillin&#x2013;streptomycin. All cells were incubated at 37 &#xb0;C in a humidified atmosphere with 5% CO<sub>2</sub>. Specifically, the complete culture media composition was described for each cell line, including base medium (RPMI-1640 or high-glucose DMEM), 10% fetal bovine serum (FBS), and 1% penicillin&#x2013;streptomycin. THP-1 cells were seeded at 5 &#xd7; 10<sup>5</sup> cells per well in 24-well plates, while HT29 and Caco-2 cells were seeded at 1.5 &#xd7; 10<sup>5</sup> cells per well. After a 12-hour equilibration period, cells were exposed to SiO<sub>2</sub> for indicated durations: 6 hours for RNA extraction, and 24 hours for cytokine detection. For NF-&#x3ba;B inhibition, cells were pretreated with BAY 11-7082 (5 &#x3bc;M) for 1 hour prior to exposure, and the inhibitor was maintained throughout the stimulation period. Conditioned media (CM) were collected by sequential centrifugation (300 &#xd7; g, then 2,000 &#xd7; g), filtered through 0.22 &#x3bc;m membranes, and stored at &#x2212;80 &#xb0;C. For stimulation assays, CRC cells were treated with a 1:1 mixture of CM and fresh complete medium to ensure consistent serum and nutrient conditions. In this study, we also used 20&#x2013;50 nm amorphous SiO<sub>2</sub> nanoparticles as model particles to induce inflammatory responses; future studies will include respirable crystalline silica to better simulate occupational exposure conditions.</p>
</sec>
<sec id="s2_3">
<title>SiO<sub>2</sub> particle preparation and dispersion</title>
<p>Amorphous silica (SiO<sub>2</sub>) nanopowder (Sigma-Aldrich, 637238; nominal particle size 20&#x2013;50 nm) was suspended in sterile phosphate-buffered saline (PBS) to prepare a 10 mg/mL stock solution. Immediately prior to each exposure, the suspension was sonicated in an ice-water bath for 10 min to minimize particle agglomeration and ensure homogeneous dispersion.</p>
</sec>
<sec id="s2_4">
<title>NF-&#x3ba;B inhibition and IL-6 neutralization</title>
<p>NF-&#x3ba;B signaling was inhibited using BAY 11-7082 (Sigma-Aldrich, B5556). BAY 11&#x2013;7082 was dissolved in DMSO to generate a 10 mM stock solution and applied at a final concentration of 5 &#x3bc;M. Cells were pretreated with BAY 11&#x2013;7082 for 1 h before SiO<sub>2</sub> exposure, and the inhibitor was maintained throughout the exposure period.</p>
<p>For IL-6 neutralization experiments, a monoclonal anti-human IL-6 antibody (R&amp;D Systems, MAB206) was added at a final concentration of 2 &#x3bc;g/mL at the onset of stimulation.</p>
</sec>
<sec id="s2_5">
<title>SiO<sub>2</sub>-induced inflammatory activation of THP-1 monocytes</title>
<p>THP-1 cells were seeded in 24-well plates at a density of 5 &#xd7; 10<sup>5</sup> cells per well in 500 &#x3bc;L complete RPMI-1640 medium and allowed to equilibrate for 12 h. Cells were then exposed to vehicle or increasing concentrations of SiO<sub>2</sub> (25, 50, or 100 &#x3bc;g/mL). To evaluate the contribution of NF-&#x3ba;B signaling, cells exposed to the highest SiO<sub>2</sub> concentration were additionally co-treated with BAY 11-7082, and BAY 11&#x2013;7082 alone was included as an inhibitor control. The selected SiO<sub>2</sub> concentrations were determined in pilot experiments to establish a robust inflammatory response while preserving cell viability.</p>
</sec>
<sec id="s2_6">
<title>RNA extraction and quantitative real-time PCR</title>
<p>At 6 h after exposure, THP-1 cells were harvested for RNA isolation. Total RNA was extracted using TRIzol reagent (Invitrogen, Thermo Fisher Scientific) and quantified by NanoDrop spectrophotometry. Complementary DNA was synthesized using the PrimeScript RT reagent kit (Takara, RR037A). Quantitative PCR was performed using PowerUp SYBR Green Master Mix (Applied Biosystems, Thermo Fisher Scientific) on a QuantStudio 5 Real-Time PCR system. Cycling conditions consisted of an initial denaturation at 95 &#xb0;C for 2 min, followed by 40 cycles of 95 &#xb0;C for 15 s and 60 &#xb0;C for 60 s, with subsequent melt-curve analysis. Expression levels of IL6, TNFA, and IL1B were normalized to GAPDH and calculated using the 2<sup>-</sup>&#x394;&#x394;Ct method.</p>
</sec>
<sec id="s2_7">
<title>Cytokine measurement by ELISA</title>
<p>Culture supernatants were collected 24 h after exposure, centrifuged at 2,000 &#xd7; g for 10 min to remove cellular debris, and stored at &#x2212;80 &#xb0;C. IL-6 concentrations were quantified using a human IL-6 ELISA kit (R&amp;D Systems, DY206) according to the manufacturer&#x2019;s instructions. At this stage, only IL-6 was quantified at the protein level, as it was prioritized for its established role in inflammatory paracrine signaling and tumor-related CEA regulation. Protein-level analysis of IL-1&#x3b2; and TNF-&#x3b1; was not performed, but their mRNA induction was confirmed by RT-qPCR. Future experiments will expand protein validation to include additional cytokines.</p>
</sec>
<sec id="s2_8">
<title>Western blot analysis</title>
<p>Proteins were extracted using RIPA buffer (Cat:R0010, Solarbio) on ice for 30 minutes, then centrifuged at 12,000 rpm for 15 minutes at 4 &#xb0;C. The supernatant&#x2019;s protein concentration was measured with a BCA assay (Cat:PC0020, Solarbio). Equal protein amounts (20 &#x3bc;g per lane) were mixed with 5&#xd7; SDS buffer (Cat:LT101S, Epizyme Biotech), denatured at 100 &#xb0;C for 10 minutes, and separated by SDS-PAGE using a 5% stacking gel and an 12% separating gel (Cat:P1200, Solarbio), depending on target protein size, at 80 V for 30 minutes and 120 V for 60&#x2013;90 minutes.</p>
<p>Proteins were transferred to methanol-activated PVDF membranes via wet transfer at 100 V for 60 minutes on ice. Membranes were blocked with 5% non-fat milk in TBST for 1.5 hours at room temperature, then incubated with primary antibodies (Anti-NF-&#x3ba;B p65 Antibody, Cat:A00284-1, Boster) overnight at 4 &#xb0;C. After three 5-minute TBST washes, membranes were treated with HRP-conjugated secondary antibodies for 1 hour at room temperature. Following another three TBST washes, protein bands were visualized using ECL and quantified with ImageJ, using GAPDH (Anti-GAPDH Antibody, Cat:A00227-1, Boster) as a reference.</p>
</sec>
<sec id="s2_9">
<title>Direct exposure of CRC cells to SiO<sub>2</sub></title>
<p>HT29 and Caco-2 cells were seeded in 24-well plates at 1.5 &#xd7; 10<sup>5</sup> cells per well and allowed to adhere overnight. Cells were subsequently treated with vehicle or SiO<sub>2</sub> at low, medium, or high concentrations as defined above. Cells were harvested at 12 h for analysis of CEA (CEACAM5) mRNA expression, and culture supernatants were collected at 48 h for measurement of secreted CEA protein. CEA mRNA levels were quantified by RT&#x2013;qPCR using GAPDH as the reference gene, and secreted CEA concentrations were determined using a human CEA ELISA kit (Abcam, ab99992). Samples were diluted when necessary to fall within the linear range of the standard curve and were analyzed in duplicate.</p>
</sec>
<sec id="s2_10">
<title>Generation of THP-1 conditioned medium and CRC stimulation</title>
<p>To generate conditioned medium, THP-1 cells were treated with vehicle or increasing concentrations of SiO<sub>2</sub> as described above. After 24 h, culture supernatants were collected and sequentially clarified by centrifugation at 300 &#xd7; g for 5 min followed by 2,000 &#xd7; g for 10 min, and then filtered through a 0.22 &#x3bc;m sterile filter to remove residual cells, debris, and particles. Conditioned media were aliquoted and stored at &#x2212;80 &#xb0;C. HT29 and Caco-2 cells were stimulated with conditioned media using a fixed ratio of 50% conditioned medium and 50% fresh complete medium (final 10% FBS) to ensure equivalent nutrient and serum conditions across treatment groups. CEA mRNA expression was assessed at 12 h, and secreted CEA protein levels were measured at 48 h.</p>
</sec>
<sec id="s2_11">
<title>Causal validation by suppression of monocyte inflammation and IL-6 neutralization</title>
<p>To establish causality, conditioned media were generated from THP-1 cells exposed to high-dose SiO<sub>2</sub> in the presence or absence of BAY 11-7082, as well as from cells treated with BAY 11&#x2013;7082 alone. Conditioned media were collected at 24 h and processed identically to those described above. IL-6 concentrations in conditioned media were quantified by ELISA to confirm effective suppression of inflammatory output following NF-&#x3ba;B inhibition.</p>
<p>CRC cells were then stimulated with conditioned media in the presence or absence of anti-IL-6 antibody or isotype control IgG, which were added at the onset of stimulation and maintained throughout incubation. CEA mRNA expression and protein secretion were analyzed at 12 h and 48 h, respectively.</p>
</sec>
<sec id="s2_12">
<title>Identification of core genes</title>
<p>Core genes associated with SiO<sub>2</sub> exposure were retrieved from the Comparative Toxicogenomics Database (CTD), while colorectal cancer (CRC)&#x2013;related core genes were obtained from the GeneCards database. The overlapping genes were defined as potential molecular mediators linking environmental exposure to tumor pathogenesis.</p>
</sec>
<sec id="s2_13">
<title>Transcriptomic validation using GEO and TCGA datasets</title>
<p>Transcriptomic profiles and matched clinical annotations for ovarian cancer were obtained from The TCGA and GEO. Only samples with complete follow-up information were included in the analysis. Genes with a prioritization score greater than four from the preceding integrative analysis were selected for clinical correlation assessment. Survival endpoints included overall survival (CRC) in both TCGA and GEO. For each candidate gene, patients were stratified into high- and low-expression groups based on the median expression value within each cohort. Univariate survival analysis was performed using the Kaplan&#x2013;Meier method with the log-rank test, while multivariable Cox proportional hazards regression models were applied to estimate hazard ratios (HRs) and 95% confidence intervals (CIs), adjusting for relevant clinical covariates. Genes demonstrating significant survival associations were subjected to functional enrichment analysis.</p>
</sec>
<sec id="s2_14">
<title>Single-cell RNA sequencing analysis</title>
<p>The preprocessing and analysis of the single-cell RNA sequencing dataset GSE161277 were supported by the KeyanZhiJia Single-Cell Analysis Platform.</p>
</sec>
<sec id="s2_15">
<title>Statistical analysis</title>
<p>Data are presented as mean &#xb1; standard deviation (SD). Statistical analyses were performed using GraphPad Prism 9.0. One-way analysis of variance (ANOVA) followed by Dunnett&#x2019;s or Tukey&#x2019;s <italic>post hoc</italic> tests was applied as appropriate. Normality and homogeneity of variance were assessed using the Shapiro&#x2013;Wilk and Levene tests, respectively, and data were log-transformed when necessary. A two-sided P &lt; 0.05 was considered statistically significant.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Performance comparison of machine learning models</title>
<p>To systematically evaluate the robustness and applicability of different machine learning paradigms in predicting carcinoembryonic antigen (CEA) positivity, we constructed and compared 14 representative algorithms across major method families. These include tree based ensemble models (random forest, gradient enhancement, adaptive enhancement, LightGBM, and CatBoost), regression based methods (logistic regression, LASSO, and partial least squares), kernel and distance based methods (support vector machines and k-nearest neighbors), probability models (naive Bayes and discriminant analysis), and neural networks (multilayer perceptron). The dataset is randomly divided into training (70%) and testing (30%) subsets, and hyperparameters are optimized using five fold cross validation. The model performance was evaluated in multiple dimensions, including discriminative ability, predictive consistency, and potential clinical utility.</p>
<p>Clear method stratification has emerged in data segmentation and evaluation metrics. Set based models consistently outperform regression, kernel, and distance based methods in both training and testing sets. During the training phase, LightGBM and CatBoost achieved near saturation discriminative performance with AUC values close to 1.00, followed by adaptive enhancement, gradient enhancement, and random forest. In contrast, logistic regression, k-nearest neighbor, and naive Bayes showed significantly weaker discriminative power, highlighting the limited expressive ability of simpler models in capturing complex exposure biomarker relationships (<xref ref-type="fig" rid="f1"><bold>Figures&#xa0;1A, B</bold></xref>). It is worth noting that the performance differences in the test set have become more pronounced. CatBoost maintains excellent sensitivity, specificity, F1 score, and overall accuracy, with minimal degradation relative to training performance, indicating its strong generalization ability and stable classification behavior (<xref ref-type="fig" rid="f1"><bold>Figures&#xa0;1C, D</bold></xref>). These findings indicate that ensemble learning frameworks not only perform well in model fitting, but also have structural robustness in out of sample prediction.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Performance comparison of machine learning models for predicting CEA positivity. <bold>(A)</bold> Forest plot of AUC scores (with 95% confidence intervals) for each model in the training set. <bold>(B)</bold> Forest plot of AUC scores (with 95% confidence intervals) for each model in the testing set. <bold>(C)</bold> Performance metrics of all models in the training set, including sensitivity, specificity, accuracy, positive predictive value (PPV), negative predictive value (NPV), F1 score, and Youden&#x2019;s index. <bold>(D)</bold> Performance metrics of all models in the testing set, including sensitivity, specificity, accuracy, positive predictive value (PPV), negative predictive value (NPV), F1 score, and Youden&#x2019;s index.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1775236-g001.tif">
<alt-text content-type="machine-generated">Side-by-side panels show model evaluation results. Panels A and B display forest plots with color-coded dots for AUC scores and 95% confidence intervals for various machine learning models on a trainset, with LightGBM and RandomForest achieving highest AUC. Panels C and D list corresponding models with metrics: sensitivity, specificity, accuracy, positive and negative predictive values, F1, and Youden's index.</alt-text>
</graphic></fig>
<p>The analysis of receiver operating characteristics further confirms these trends (<xref ref-type="fig" rid="f2"><bold>Figures&#xa0;2A, B</bold></xref>). In the training set, CatBoost and LightGBM have consistently dominated the ROC space, while in the test set, CatBoost exhibits the smallest curve collapse, highlighting its resilience to sample perturbations (<xref ref-type="fig" rid="f2"><bold>Figures&#xa0;2A, B</bold></xref>). However, relying solely on discriminative performance cannot fully capture the reliability of the model. To address this issue, DCA was used to evaluate potential clinical relevance (<xref ref-type="fig" rid="f2"><bold>Figures&#xa0;2C, D</bold></xref>). Within a wide range of threshold probabilities, CatBoost achieved the highest net benefit in both training and testing queues, outperforming alternative algorithms and default strategies (&#x201c;treat all&#x201d; and &#x201c;do not treat&#x201d;) (<xref ref-type="fig" rid="f2"><bold>Figures&#xa0;2C, D</bold></xref>). This indicates that CatBoost provides excellent decision level value for identifying high-risk individuals with CEA positivity, supporting its translational relevance to occupational risk stratification (<xref ref-type="fig" rid="f3"><bold>Figures&#xa0;3A, B</bold></xref>). The stability of the model was further verified through residual structure analysis. The reverse cumulative residual distribution indicates that CatBoost consistently exhibits a steep left shift curve in both the training and testing sets, reflecting a significant reduction in the proportion of large prediction errors. Correspondingly, the residual boxplot RMSE of CatBoost, while logistic regression, naive Bayes, and partial least squares models show significant long tail error distributions (<xref ref-type="fig" rid="f3"><bold>Figures&#xa0;3C, D</bold></xref>). Overall, these analyses indicate that the model&#x2019;s advantage depends not only on average performance metrics, but also on controlled and reproducible erroneous behavior.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Model discrimination and clinical utility across training and testing datasets. <bold>(A)</bold> ROC curves of all models in the training set. <bold>(B)</bold> ROC curves of all models in the testing set. <bold>(C)</bold> Decision curve analysis (DCA) for each model in the training set. <bold>(D)</bold> Decision curve analysis (DCA) for each model in the testing set.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1775236-g002.tif">
<alt-text content-type="machine-generated">Four-panel figure showing machine learning model performance. Panel A presents ROC curves for several models on the training set with AUCs ranging from 0.783 to 0.997. Panel B shows ROC curves for the same models on another training set, with AUCs ranging from 0.530 to 0.969. Panels C and D display decision curve analyses for training and validation sets, respectively, comparing net benefit across different models and risk thresholds. Each model is color-coded with a legend.</alt-text>
</graphic></fig>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Residual distribution analysis across training and testing sets. <bold>(A)</bold> Reverse cumulative distribution of absolute residuals for each model in the training set. <bold>(B)</bold> Reverse cumulative distribution of absolute residuals for each model in the testing set. <bold>(C)</bold> Boxplot of residuals in the training set. Red dots indicate root mean square of residuals for each model. <bold>(D)</bold> Boxplot of residuals in the testing set. Red dots indicate root mean square of residuals for each model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1775236-g003.tif">
<alt-text content-type="machine-generated">Four-panel figure comparing machine learning models by residuals. Panels A and B show reverse cumulative distributions of absolute residuals for training and test sets, respectively, with model lines color-coded. Panels C and D present boxplots of residuals for training and test data, with red dots indicating root mean square errors for each model.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_2">
<title>Model interpretation using SHAP values</title>
<p>Among the 14 machine learning algorithms evaluated, CatBoost demonstrated the best overall performance on the test set in terms of AUC, sensitivity, and specificity. In addition to its strong predictive ability, CatBoost is particularly well-suited for handling complex nonlinear relationships and categorical variables without extensive preprocessing. Its high stability and compatibility with SHAP values for feature attribution made it a practical and interpretable choice for this real-world dataset. The feature attribution using the SHAP framework indicates that CEA positivity is mainly driven by hematological and inflammation related variables, with MLR being the most influential predictor (<xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4A, B</bold></xref>). This discovery emphasizes that systemic immune imbalance is the core determinant of CEA abnormal expression. Among all occupational and environmental exposures, the SHAP contribution of silica dust is the highest, significantly higher than that of nitrogen dioxide, coal dust, and carbon monoxide. SHAP distribution and dependency analysis further indicate that the association between silica exposure and CEA positivity is clearly nonlinear, characterized by threshold like effects and significant inter individual heterogeneity at higher exposure levels (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4C</bold></xref>). These patterns indicate that silicon dust may act as a risk amplifier rather than producing uniform linear effects.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>SHAP-based interpretation of model predictions. <bold>(A)</bold> Feature importance ranked by mean absolute SHAP values. <bold>(B)</bold> SHAP beeswarm plot showing the distribution and impact direction of SHAP values across all samples. Each point represents a single observation; color indicates the corresponding feature value. <bold>(C)</bold> SHAP dependence plots of the top 15 most important features. Each subplot shows the non-linear relationship between the feature value and its SHAP contribution to the model output. Color gradients indicate possible interactions with secondary features.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1775236-g004.tif">
<alt-text content-type="machine-generated">Composite data visualization for model interpretability comprises three sections: (A) bar plot ranking top fifteen features by mean absolute SHAP value, (B) bee swarm plot of SHAP value distributions for each feature, and (C) fifteen SHAP dependence scatterplots illustrating nonlinear relationships between feature values and SHAP values, each with a color bar representing additional variable context.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_3">
<title>Mediation analysis of inflammatory markers</title>
<p>To elucidate the potential biological pathways behind this structural association, mediation analysis was conducted to evaluate the role of inflammatory markers in linking silica exposure to CEA elevation (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref>). Multiple biomarkers including MLR, neutrophil percentage, lymphocyte percentage, NLR, and SII showed significant indirect effects, indicating that the relationship between silica and CEA is partially mediated through the inflammatory pathway. It is worth noting that MLR accounts for the largest proportion in mediating effects, supporting a model in which monocyte dominated inflammatory activation represents a key mechanistic link between occupational silica exposure and elevated CEA levels.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Mediation analysis of inflammatory indices linking silica dust exposure and CEA elevation.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1775236-g005.tif">
<alt-text content-type="machine-generated">Six diagram panels display mediation models illustrating the relationship between silica dust exposure and CEA via different mediators: MLR, monocyte percentage, lymphocyte percentage, NLR, SII, and neutrophil percentage. Each diagram shows arrows from silica dust to the mediator and from both silica dust and mediator to CEA, annotated with indirect (ACME) and direct (ADE) effect values, with total effect noted as zero point two seven two nine.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_4">
<title><italic>In vitro</italic> validation of silica-induced cytokine responses</title>
<p>As shown in <xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6A, B</bold></xref>, SiO<sub>2</sub> exposure strongly activates THP-1 monocytes in a dose-dependent manner. The mRNA levels of IL-6, IL-1 &#x3b2;, and TNF - &#x3b1; gradually increased from the low-dose and medium dose groups to the high-dose group, and multiple pairwise comparisons reached statistical significance (asterisk annotation). Importantly, the addition of inhibitors under high-dose conditions significantly weakened the induction of transcription of all three cytokines, restoring expression to the low-dose range. These findings indicate that SiO <sub>2</sub> - induced monocyte activation is inhibitor sensitive and regulated, rather than reflecting non-specific transcriptional fluctuations. In contrast, direct exposure of CRC cells to SiO <sub>2</sub> only resulted in minor changes in CEA expression (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6C</bold></xref>). In Caco-2 and HT29 cells, CEA mRNA levels remained close to baseline at low, medium, and high SiO2 levels, and the secreted CEA protein only showed slight upward drift, without a clear dose-response relationship or consistent statistical significance. This pattern supports the explanation that CEA is not strongly regulated by SiO <sub>2</sub> under these conditions, through direct tumor cell autonomous mechanisms.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p><italic>In vitro</italic> evaluation of monocyte-derived cytokine signaling on CEA expression in colorectal cancer cells. <bold>(A)</bold> Schematic diagram of the experimental workflow. THP-1 monocytes were exposed to amorphous silica (SiO<sub>2</sub>) and treated with NF-&#x3ba;B inhibitor (BAY 11-7082) or IL-6 neutralizing antibody. Conditioned media (CM) were collected and applied to colorectal cancer cell lines (HT29 and Caco-2) to evaluate CEA mRNA and protein expression. <bold>(B)</bold> RT-qPCR quantification of IL-6, IL-1&#x3b2;, and TNF-&#x3b1; mRNA expression in THP-1 cells following low/high-dose SiO<sub>2</sub> stimulation with or without BAY 11&#x2013;7082 treatment. <bold>(C)</bold> CEA mRNA and protein levels in HT29 and Caco-2 cells directly treated with SiO<sub>2</sub> particles (without conditioned media exposure). <bold>(D)</bold> CEA mRNA and protein expression in HT29 and Caco-2 cells treated with conditioned media derived from silica-stimulated THP-1 cells, with or without IL-6 neutralization or NF-&#x3ba;B inhibition. <bold>(E)</bold> CEA mRNA and protein levels in colorectal cancer cells treated with CM under varying conditions: anti-IL-6 antibody, NF-&#x3ba;B inhibitor (BAY 11-7082), or both. Statistical comparisons are shown between multiple experimental groups. Significance levels: P&#x2009;&lt;&#x2009;0.05 (*), P&#x2009;&lt;&#x2009;0.01 (**), P&#x2009;&lt;&#x2009;0.001 (***), P&#x2009;&lt;&#x2009;0.0001 (****).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1775236-g006.tif">
<alt-text content-type="machine-generated">Scientific figure with five panels. Panel A shows a schematic diagram illustrating a proposed experimental setup and signaling pathway involving SiO2 exposure, NF-&#x3ba;B inhibition, cytokine release (IL-6), and downstream effects on CEA secretion in cell lines. Panels B to E contain grouped bar graphs quantifying gene and protein expression levels (IL-6, IL-1&#x3b2;, TNF-&#x3b1;, CEA) in HT29 and Caco-2 cells under various treatments, with statistical significance marked by asterisks. Each graph has labeled axes and clear legends for experimental conditions.</alt-text>
</graphic></fig>
<p>We examined how SiO<sub>2</sub> exposure affects NF-&#x3ba;B p65 activation by conducting Western blot analysis on cells treated with different SiO<sub>2</sub> concentrations, with and without an NF-&#x3ba;B inhibitor. <xref ref-type="supplementary-material" rid="SF1"><bold>Supplementary Figure&#xa0;1</bold></xref> shows that NF-&#x3ba;B protein levels were baseline in the control group. SiO<sub>2</sub> treatment led to a concentration-dependent increase in NF-&#x3ba;B expression, with the highest levels in the SiO<sub>2</sub>-High group, followed by the SiO<sub>2</sub>-Mild and SiO<sub>2</sub>-Low groups, all significantly higher than the control (P &lt; 0.0001). The NF-&#x3ba;B p65 inhibitor significantly reduced NF-&#x3ba;B p65 upregulation in the SiO<sub>2</sub>-High+Inhibitor group (P &lt; 0.01), while the inhibitor alone did not affect basal NF-&#x3ba;B p65 levels. The results suggest that exposure to SiO<sub>2</sub> triggers the NF-&#x3ba;B pathway based on concentration, and this activation can be significantly reduced by using an NF-&#x3ba;B inhibitor.</p>
<p>It is noteworthy that CM derived from SiO <sub>2</sub> - stimulated THP-1 cells induced significant and graded CEA induction in CRC cells (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6D</bold></xref>). In Caco-2 and HT29, CEA mRNA gradually increases with the CM produced by low, medium, and high doses of SiO2. The parallel increase of CEA protein secreted by treated monocytes reaches its maximum level under high CM conditions. The consistent stepwise pattern observed at the transcript and protein levels, as well as dense significant annotations, indicate that the soluble factors released by activated monocytes are sufficient to drive strong CEA responses in CRC cells, and the intensity of this response is proportional to the strength of upstream monocyte activation.</p>
<p>Finally, the intervention experiment supported the causal interruption of the paracrine axis (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6E</bold></xref>). High CM produced the strongest increase in CEA mRNA and protein in two CRC cell lines, while the isotype IgG control group remained comparable to the high CM group, indicating that antibody addition alone cannot explain the observed effects. In contrast, CM (high+NFkBi CM) produced under NF - &#x3ba; B inhibition significantly reduced the increase in CEA driven by high CM, and the neutralization of IL-6 during CRC stimulation also weakened the expression of CEA at the mRNA and protein levels. It is worth noting that in the context of CM control, anti-IL-6 therapy is still close to baseline, supporting pathway specificity and opposing the main direct inhibitory effect of antibody therapy under non inflammatory conditions.</p>
<p>Overall, this set of numbers supports a coherent mechanistic model, in which SiO<sub>2</sub> dose-dependent activates THP-1 inflammatory signaling, direct SiO<sub>2</sub> exposure has little effect on CRC CEA, and monocyte derived conditioned medium can effectively induce CEA in CRC cells in a dose-dependent manner. Partial reversal of NF - &#x3ba; B inhibition (upstream, monocyte side) and IL-6 neutralization (downstream) suggests that this inflammatory paracrine pathway is partially but not exclusively necessary, consistent with the multifactorial monocyte secretion group driving CRC CEA upregulation.</p>
</sec>
<sec id="s3_5">
<title>Identification of overlapping genes and prognostic modeling</title>
<p>SiO<sub>2</sub>-associated genes were retrieved from the Comparative Toxicogenomics Database (CTD), while CRC&#x2013;related genes were obtained from the GeneCards database. An intersection analysis identified a total of 42 overlapping genes that were simultaneously associated with SiO<sub>2</sub> exposure and CRC (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7A</bold></xref>), suggesting that these genes may serve as potential molecular bridges linking environmental exposure to tumorigenesis. To further characterize the functional relationships among the overlapping genes, a protein&#x2013;protein interaction (PPI) network was constructed (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7B</bold></xref>). Network analysis revealed a highly interconnected interaction pattern among these genes, indicating their involvement in shared biological processes. Based on network topological features, a set of key hub genes was identified, including AKT1, TNF, TGFB1, IL1B, MMP9, MMP2, FN1, ICAM1, PECAM1, and CDH5. These genes exhibited high connectivity within the network and are likely to play central roles in regulating inflammatory responses, extracellular matrix remodeling, and endothelial function.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Identification of shared core genes between SiO<sub>2</sub> exposure and colorectal cancer and their prognostic significance. <bold>(A)</bold> Venn diagram showing the overlap between SiO<sub>2</sub>-associated genes derived from the CTD database and CRC-related genes obtained from GeneCards. A total of 42 overlapping genes were identified. <bold>(B)</bold> Protein&#x2013;protein interaction (PPI) network constructed using the overlapping genes. Key hub genes with high connectivity are highlighted. <bold>(C)</bold> Multivariable Cox regression analysis and concordance index (C-index) evaluating the prognostic performance of the core gene signature in the TCGA-CRC and GSE39582 cohorts across multiple survival endpoints. <bold>(D)</bold> Prognostic evaluation of the gene signature in the TCGA-CRC cohort. Kaplan&#x2013;Meier survival curves comparing high- and low-risk groups, time-dependent ROC curves for 1-, 3-, and 5-year overall survival, and decision curve analysis (DCA) illustrating the clinical net benefit of the model. **, **** P&lt; 0.01, P&lt;0.0001.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1775236-g007.tif">
<alt-text content-type="machine-generated">Panel A shows a Venn diagram comparing gene sets from CRC and silicon, indicating 9930 unique to CRC, 2 unique to silicon, and 42 overlapping genes. Panel B displays a network diagram of protein-protein interactions, highlighting central nodes such as CDH5, FN1, TNF, MMP9, AKT1, and others. Panel C presents Cox regression plots and concordance indexes for TCGA_CRC and GSE39582 datasets, with hazard ratios for various survival outcomes. Panel D illustrates four graphs for TCGA_CRC: a Kaplan-Meier survival curve, a calibration plot, a sensitivity-specificity ROC curve with area under the curve values, and a net benefit decision curve.</alt-text>
</graphic></fig>
<p>A risk score model was constructed based on the identified core genes and evaluated in the TCGA-CRC and GSE39582 cohorts to assess its prognostic significance. Multivariable Cox regression analysis demonstrated that the gene signature was significantly associated with overall survival (OS) (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7C</bold></xref>) and consistently exhibited robust prognostic performance across both independent cohorts. The concordance index (C-index) further confirmed the predictive accuracy of the model. Kaplan&#x2013;Meier survival analysis in the TCGA-CRC cohort showed that patients in the high-risk group had significantly poorer overall survival compared with those in the low-risk group (log-rank P &lt; 0.0001) (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7D</bold></xref>). Time-dependent receiver operating characteristic (ROC) curves indicated strong discriminatory power for 1-, 3-, and 5-year survival prediction. In addition, decision curve analysis (DCA) demonstrated that the risk model provided a stable net clinical benefit across a wide range of threshold probabilities, highlighting its potential clinical utility.</p>
</sec>
<sec id="s3_6">
<title>Single-cell transcriptomic insights into tumor microenvironment remodeling</title>
<p>To provide cell-level evidence supporting the role of SiO<sub>2</sub> in shaping tumor microenvironment susceptibility, we analyzed single-cell RNA sequencing data from the GSE161277 dataset. After stringent quality control, the cells retained for downstream analysis exhibited comparable distributions of detected genes (nFeature_RNA), total UMI counts (nCount_RNA), and mitochondrial gene proportions (percent.mt) across samples (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8A</bold></xref>), indicating high data quality and minimal technical bias. Following normalization and dimensionality reduction, highly variable genes were identified to capture dominant biological heterogeneity (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8B</bold></xref>). Unsupervised clustering combined with Uniform Manifold Approximation and Projection (UMAP) visualization revealed well-separated cellular populations (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8C</bold></xref>). Based on canonical marker genes, these clusters were annotated as major immune and stromal cell types, including T cells, B cells, monocytes, macrophages, neutrophils, fibroblasts, endothelial cells, and epithelial cells, reflecting the complex cellular architecture of the colorectal tumor microenvironment. To directly interrogate inflammation-related transcriptional alterations associated with occupational exposure&#x2013;related immune imbalance, we examined the expression patterns of key genes involved in immune activation, cytokine signaling, and cell&#x2013;cell interactions. Comparative analysis between control and CRC samples demonstrated marked upregulation of ICAM1, TGFB1, and IL1B in CRC-derived cells (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8D</bold></xref>). Feature plots revealed that these genes were enriched within specific immune and stromal compartments rather than being uniformly expressed, indicating localized microenvironmental activation rather than global transcriptional shifts. Violin plot analysis further confirmed significantly higher expression levels of these genes in CRC samples compared with controls.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Single-cell transcriptomic evidence linking immune dysregulation to tumor microenvironment remodeling in colorectal cancer. <bold>(A)</bold> Quality control metrics of single-cell RNA sequencing data from the GSE161277 dataset, showing the distributions of detected genes (nFeature_RNA), total UMI counts (nCount_RNA), and mitochondrial gene proportions (percent.mt) across samples. <bold>(B)</bold> Identification of highly variable genes following normalization and scaling, capturing dominant biological heterogeneity for downstream analysis. <bold>(C)</bold> Uniform Manifold Approximation and Projection (UMAP) visualization of single cells colored by annotated cell types based on canonical marker genes, including immune and stromal populations such as T cells, B cells, monocytes, macrophages, neutrophils, fibroblasts, endothelial cells, and epithelial cells. <bold>(D)</bold> Feature plots and violin plots showing the expression patterns of inflammation- and signaling-related genes (ICAM1, TGFB1, and IL1B) in control and CRC samples.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1775236-g008.tif">
<alt-text content-type="machine-generated">Panel A contains three violin plots representing nFeature_RNA, nCount_RNA, and percent.mt across sample identities. Panel B shows scatter plots of standardized variance versus average expression for genes, highlighting highly variable genes. Panel C presents a UMAP plot with distinct cell clusters annotated by color. Panel D displays UMAP expression plots and corresponding violin plots for ICAM1, TGFB1, and IL1B in control and CRC conditions.</alt-text>
</graphic></fig>
<p>Collectively, these single-cell results provide direct cellular evidence that colorectal cancer is characterized by coordinated immune and stromal transcriptional reprogramming, consistent with a state of sustained inflammatory activation. The enrichment of adhesion molecules and cytokine-related genes supports a model in which systemic immune dysregulation&#x2014;potentially triggered by chronic occupational exposure&#x2014;contributes to tumor microenvironment remodeling, thereby creating a permissive context for tumor-associated biomarker elevation and disease progression.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>Our research findings collectively depict a mechanism and computational framework linking occupational silica exposure to elevated levels of carcinoembryonic antigen (CEA) through inflammation mediated pathways. By combining real-world occupational health monitoring data with machine learning and <italic>in vitro</italic> validation, we provide multidimensional evidence to support CEA as a reactive biomarker that reflects environmental exposure and promotes tumor microenvironment remodeling.</p>
<p>From a computational perspective, the outstanding performance of ensemble learning models highlights the importance of capturing nonlinear, multidimensional interactions between occupational exposure, hematological parameters, and systemic inflammation indices. The interpretability of SHAP based models further reveals inflammation related features, especially MLR, which is a key mediator linking specific occupational toxins with elevated CEA. These findings extend previous reports that inflammatory features may occur prior to obvious malignant tumors, emphasizing the potential of artificial intelligence driven frameworks in exposure risk stratification (<xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B23">23</xref>). At the biological level, our <italic>in vitro</italic> experiments confirmed that amorphous silica particles induce strong monocyte activation characterized by NF - &#x3ba; B-dependent IL-6 secretion. The conditioned medium derived from activated monocytes significantly increased CEA expression in colorectal cancer cells, partially reversed after drug inhibition or cytokine neutralization. These results suggest that elevated CEA levels in exposed workers may reflect chronic immune disorders, rather than just cellular autonomous genotoxic effects (<xref ref-type="bibr" rid="B24">24</xref>). This mechanism may be particularly relevant to tissues with active epithelial renewal, such as the lungs, colon, or bladder (<xref ref-type="bibr" rid="B25">25</xref>). Finally, given that CEA testing is widely accessible, inexpensive, and already incorporated into routine health screening protocols, the ability to predict CEA elevation using machine learning offers a scalable and practical tool for occupational cancer risk stratification, enabling proactive surveillance and early intervention in exposed populations.</p>
<p>Mechanistically, the pathway linking silica exposure to CEA upregulation involves a multi-step cascade centered around monocyte activation and paracrine signaling. After inhalation, amorphous silica particles accumulate in the alveolar region, where they are engulfed by resident or recruited monocytes/macrophages. This activates innate immune signaling pathways, especially the NF-&#x3ba;B axis, leading to upregulation and secretion of pro-inflammatory cytokines, including IL-6, TN -&#x3b1;, and IL-1&#x3b2; (<xref ref-type="bibr" rid="B26">26</xref>). SO, in our SHAP analysis, monocyte-to-lymphocyte ratio (MLR) and neutrophil count emerged as the most important predictors of CEA positivity. Biologically, these features reflect systemic immune dysregulation consistent with chronic silica exposure. Elevated MLR suggests a shift toward a myeloid-dominant immune profile, which has been associated with macrophage-driven inflammation, cytokine release (e.g., IL-6), and tumor-promoting paracrine signaling. Increased neutrophil counts may reflect acute-phase responses and have been implicated in tumor progression through reactive oxygen species generation, immune suppression, and neutrophil extracellular trap (NET) formation. These patterns align with recent studies showing that silica inhalation promotes myeloid expansion, NF-&#x3ba;B activation, and inflammatory remodeling of the tumor microenvironment (<xref ref-type="bibr" rid="B26">26</xref>). Therefore, the top SHAP features not only carry predictive power, but also biological relevance in the context of exposure-related carcinogenesis.</p>
<p>IL-6 is a pleiotropic cytokine that plays a dual role in inflammation and cancer biology. In our study, IL-6 served as a key soluble mediator linking monocyte activation with tumor cell responses. When CRC cells were exposed to conditioned medium containing IL-6 (possibly other co releasing factors), a significant increase in CEA mRNA expression and protein secretion was observed. The neutralizing effect of IL-6 weakened this effect, but it was not completely eliminated, indicating that although IL-6 is necessary, there may be other mediators at work (<xref ref-type="bibr" rid="B24">24</xref>). Importantly, the response of CRC cells to monocyte derived signals is not only a passive response, but also involves reprogramming of the transcriptional network that controls the expression of tumor biomarkers. It is known that CEA (CEACAM5) is upregulated in the context of inflammatory cytokine exposure, and its promoter region contains binding sites that respond to downstream effector STAT3 of IL-6 signaling (<xref ref-type="bibr" rid="B27">27</xref>). Therefore, sustained exposure to IL-6 may activate the JAK/STAT3 pathway, leading epithelial cells to develop a pro tumor phenotype, enhancing immune evasion, cell adhesion, and potentially increasing metastatic potential. In addition, incomplete reversal of CEA induction by NF - &#x3ba; B blockade in monocytes or IL-6 neutralization in tumor cells indicates redundancy and complexity in the inflammatory secretion group. Other mediators, such as IL-8, GM-CSF, or ROS, may synergistically interact with IL-6 or act in parallel pathways to shape TME. This multifactorial inflammatory environment may become a potential risk amplifier, especially in chronic or cumulative exposure situations (<xref ref-type="bibr" rid="B28">28</xref>). In addition to IL-6, we also observed marked mRNA upregulation of IL-1&#x3b2; and TNF-&#x3b1; upon silica stimulation; however, their protein levels were not assessed in the current study. This represents a limitation of our cytokine profiling, and we acknowledge that these additional secreted factors may contribute to downstream effects. Further protein-level validation is warranted to fully characterize the inflammatory secretome of exposed monocytes.</p>
<p>These findings reinforce the emerging understanding that occupational silica exposure not only triggers local inflammation but also reprograms immune cell function, contributing to early TME susceptibility. Recent studies have shown that amorphous and crystalline forms of silica activate macrophages through NF-&#x3ba;B and NLRP3 pathways, leading to sustained secretion of IL-6 and other proinflammatory cytokines (<xref ref-type="bibr" rid="B29">29</xref>&#x2013;<xref ref-type="bibr" rid="B32">32</xref>). Our <italic>in vitro</italic> results further support this model, demonstrating that THP-1&#x2013;derived conditioned media can upregulate CEA in CRC cells via an IL-6&#x2013;dependent mechanism. In parallel, our scRNA-seq analysis revealed increased expression of inflammation- and adhesion-related genes in tumor-associated macrophages, consistent with prior reports in colorectal cancer cohorts (<xref ref-type="bibr" rid="B33">33</xref>). These integrated findings suggest that immune dysregulation may represent a key intermediate link between occupational exposure and early cancer risk, particularly in high-risk working populations.</p>
<p>Our research has several implications. Firstly, incorporating CEA into occupational monitoring programs can promote early identification of high-risk populations. Secondly, using interpretable models can transparently explain the exposure biomarker relationship, strengthen regulatory accountability, and enable personalized risk assessment. Thirdly, identifying inflammation as a key mediator paves the way for intervention strategies targeting the immune microenvironment, including anti-inflammatory or cytokine regulation methods. However, there are several limitations worth considering. The exposure data is based on binary classification obtained from regulatory monitoring, rather than continuous individual dose measurements, which may underestimate the dose-response gradient. And, there were no potentially important confounding variables in this study, such as smoking status, BMI and chronic comorbidities (such as diabetes, cardiovascular disease). The occupational monitoring system used in this study did not regularly collect these data. Although our model includes a variety of hematological and demographic characteristics, unmeasured confounding factors cannot be completely excluded. Secondly, although the focus on silica provides mechanistic clarity, further research is needed to extend it to other carcinogens such as benzene and polycyclic aromatic hydrocarbons. Thirdly, although THP-1 cells are widely used to model macrophage activation in response to environmental stimuli, their leukemic origin may limit generalizability. Future studies incorporating RAW264.7 or PBMC-derived macrophages&#x2014;used in comparable models of particulate-induced immune activation (<xref ref-type="bibr" rid="B29">29</xref>, <xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B34">34</xref>) are warranted to validate the robustness and applicability of our findings. Finally, occupational exposure in this study was classified as a binary variable based on regulatory thresholds, which may not fully capture exposure intensity or duration. And while the model demonstrated good internal performance, external validation in independent populations is necessary to confirm generalizability and robustness. Given the heterogeneity of occupational environments and individual health status, future work should incorporate stratified or sensitivity analyses (e.g., by sex, age group, or job category) to further validate model robustness and generalizability.</p>
<p>In summary, this study supports a model that occupational silica exposure promotes CEA elevation through inflammation driven paracrine signaling. The integration of machine learning, molecular biology, and exposure science provides a powerful paradigm for revealing hidden connections between environmental carcinogens and early risk biomarkers. Future research should extend this method to additional exposures and explore the prognostic value of dynamic CEA monitoring in occupational exposure cohorts.</p>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p></sec>
<sec id="s6" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by the Ethics Committee of North China Institute of Science and Technology (Approval No.: 2024280). The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p></sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>HG: Data curation, Methodology, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. ZZ: Writing &#x2013; review &amp; editing, Data curation. HZ: Validation, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. QL: Formal analysis, Writing &#x2013; review &amp; editing. JZ: Funding acquisition, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. LB: Conceptualization, Validation, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing.</p></sec>
<ack>
<title>Acknowledgments</title>
<p>We acknowledge the KeyanZhiJia single-cell analysis platform for providing technical support and analytical information for the single-cell RNA sequencing dataset GSE161277.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fimmu.2026.1775236/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fimmu.2026.1775236/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image1.pdf" id="SF1" mimetype="application/pdf"><label>Supplementary Figure&#xa0;1</label>
<caption>
<p>NF-&#x3ba;B activation verification.</p>
</caption></supplementary-material></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Marant Micallef</surname> <given-names>C</given-names></name>
<name><surname>Shield</surname> <given-names>KD</given-names></name>
<name><surname>Baldi</surname> <given-names>I</given-names></name>
<name><surname>Charbotel</surname> <given-names>B</given-names></name>
<name><surname>Fervers</surname> <given-names>B</given-names></name>
<name><surname>Gilg Soit Ilg</surname> <given-names>A</given-names></name>
<etal/>
</person-group>. 
<article-title>Occupational exposures and cancer: a review of agents and relative risk estimates</article-title>. <source>Occup Environ Med</source>. (<year>2018</year>) <volume>75</volume>:<page-range>604&#x2013;14</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/oemed-2017-104858</pub-id>, PMID: <pub-id pub-id-type="pmid">29735747</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<label>2</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wild</surname> <given-names>CP</given-names></name>
</person-group>. 
<article-title>The exposome: from concept to utility</article-title>. <source>Int J Epidemiol</source>. (<year>2012</year>) <volume>41</volume>:<fpage>24</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/ije/dyr236</pub-id>, PMID: <pub-id pub-id-type="pmid">22296988</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<label>3</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rushton</surname> <given-names>L</given-names></name>
<name><surname>Hutchings</surname> <given-names>SJ</given-names></name>
<name><surname>Fortunato</surname> <given-names>L</given-names></name>
<name><surname>Young</surname> <given-names>C</given-names></name>
<name><surname>Evans</surname> <given-names>GS</given-names></name>
<name><surname>Brown</surname> <given-names>T</given-names></name>
<etal/>
</person-group>. 
<article-title>Occupational cancer burden in Great Britain</article-title>. <source>Br J Cancer</source>. (<year>2012</year>) <volume>107</volume>:<page-range>S3&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/bjc.2012.112</pub-id>, PMID: <pub-id pub-id-type="pmid">22710676</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<label>4</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Pearce</surname> <given-names>N</given-names></name>
<name><surname>Blair</surname> <given-names>A</given-names></name>
<name><surname>Vineis</surname> <given-names>P</given-names></name>
<name><surname>Ahrens</surname> <given-names>W</given-names></name>
<name><surname>Andersen</surname> <given-names>A</given-names></name>
<name><surname>Anto</surname> <given-names>JM</given-names></name>
<etal/>
</person-group>. 
<article-title>IARC monographs: 40 years of evaluating carcinogenic hazards to humans</article-title>. <source>Environ Health Perspect</source>. (<year>2015</year>) <volume>123</volume>:<page-range>507&#x2013;14</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1289/ehp.1409149</pub-id>, PMID: <pub-id pub-id-type="pmid">25712798</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<label>5</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Loomis</surname> <given-names>D</given-names></name>
<name><surname>Guha</surname> <given-names>N</given-names></name>
<name><surname>Hall</surname> <given-names>AL</given-names></name>
<name><surname>Straif</surname> <given-names>K</given-names></name>
</person-group>. 
<article-title>Identifying occupational carcinogens: an update from the IARC Monographs</article-title>. <source>Occup Environ Med</source>. (<year>2018</year>) <volume>75</volume>:<fpage>593</fpage>&#x2013;<lpage>603</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/oemed-2017-104944</pub-id>, PMID: <pub-id pub-id-type="pmid">29769352</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<label>6</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Straif</surname> <given-names>K</given-names></name>
<name><surname>Benbrahim-Tallaa</surname> <given-names>L</given-names></name>
<name><surname>Baan</surname> <given-names>R</given-names></name>
<name><surname>Grosse</surname> <given-names>Y</given-names></name>
<name><surname>Secretan</surname> <given-names>B</given-names></name>
<name><surname>El Ghissassi</surname> <given-names>F</given-names></name>
<etal/>
</person-group>. 
<article-title>A review of human carcinogens--Part C: metals, arsenic, dusts, and fibres</article-title>. <source>Lancet Oncol</source>. (<year>2009</year>) <volume>10</volume>:<page-range>453&#x2013;4</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/s1470-2045(09)70134-2</pub-id>, PMID: <pub-id pub-id-type="pmid">19418618</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<label>7</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Clapp</surname> <given-names>RW</given-names></name>
<name><surname>Jacobs</surname> <given-names>MM</given-names></name>
<name><surname>Loechler</surname> <given-names>EL</given-names></name>
</person-group>. 
<article-title>Environmental and occupational causes of cancer: new evidence 2005-2007</article-title>. <source>Rev Environ Health</source>. (<year>2008</year>) <volume>23</volume>:<fpage>1</fpage>&#x2013;<lpage>37</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1515/reveh.2008.23.1.1</pub-id>, PMID: <pub-id pub-id-type="pmid">18557596</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<label>8</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Siemiatycki</surname> <given-names>J</given-names></name>
<name><surname>Richardson</surname> <given-names>L</given-names></name>
<name><surname>Straif</surname> <given-names>K</given-names></name>
<name><surname>Latreille</surname> <given-names>B</given-names></name>
<name><surname>Lakhani</surname> <given-names>R</given-names></name>
<name><surname>Campbell</surname> <given-names>S</given-names></name>
<etal/>
</person-group>. 
<article-title>Listing occupational carcinogens</article-title>. <source>Environ Health Perspect</source>. (<year>2004</year>) <volume>112</volume>:<page-range>1447&#x2013;59</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1289/ehp.7047</pub-id>, PMID: <pub-id pub-id-type="pmid">15531427</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<label>9</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Greten</surname> <given-names>FR</given-names></name>
<name><surname>Grivennikov</surname> <given-names>SI</given-names></name>
</person-group>. 
<article-title>Inflammation and Cancer: Triggers, Mechanisms, and Consequences</article-title>. <source>Immunity</source>. (<year>2019</year>) <volume>51</volume>:<fpage>27</fpage>&#x2013;<lpage>41</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.immuni.2019.06.025</pub-id>, PMID: <pub-id pub-id-type="pmid">31315034</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<label>10</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Landskron</surname> <given-names>G</given-names></name>
<name><surname>de la Fuente</surname> <given-names>M</given-names></name>
<name><surname>Thuwajit</surname> <given-names>P</given-names></name>
<name><surname>Thuwajit</surname> <given-names>C</given-names></name>
<name><surname>Hermoso</surname> <given-names>MA</given-names></name>
</person-group>. 
<article-title>Chronic inflammation and cytokines in the tumor microenvironment</article-title>. <source>J Immunol Res</source>. (<year>2014</year>) <volume>2014</volume>:<elocation-id>149185</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2014/149185</pub-id>, PMID: <pub-id pub-id-type="pmid">24901008</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<label>11</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kim</surname> <given-names>SJ</given-names></name>
<name><surname>Williams</surname> <given-names>D</given-names></name>
<name><surname>Cheresh</surname> <given-names>P</given-names></name>
<name><surname>Kamp</surname> <given-names>DW</given-names></name>
</person-group>. 
<article-title>Asbestos-Induced Gastrointestinal Cancer: An Update</article-title>. <source>J Gastrointest Dig Syst</source>. (<year>2013</year>) <volume>3</volume>:<elocation-id>135</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.4172/2161-069X.1000135</pub-id>, PMID: <pub-id pub-id-type="pmid">27158561</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<label>12</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wynn</surname> <given-names>TA</given-names></name>
<name><surname>Vannella</surname> <given-names>KM</given-names></name>
</person-group>. 
<article-title>Macrophages in Tissue Repair, Regeneration, and Fibrosis</article-title>. <source>Immunity</source>. (<year>2016</year>) <volume>44</volume>:<page-range>450&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.immuni.2016.02.015</pub-id>, PMID: <pub-id pub-id-type="pmid">26982353</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<label>13</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Leung</surname> <given-names>CC</given-names></name>
<name><surname>Yu</surname> <given-names>IT</given-names></name>
<name><surname>Chen</surname> <given-names>W</given-names></name>
</person-group>. 
<article-title>Silicosis</article-title>. <source>Lancet</source>. (<year>9830</year>) <volume>2012</volume>:<fpage>379</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0140-6736(12)60235-9</pub-id>, PMID: <pub-id pub-id-type="pmid">22534002</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<label>14</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lan</surname> <given-names>Q</given-names></name>
<name><surname>Zhang</surname> <given-names>L</given-names></name>
<name><surname>Li</surname> <given-names>G</given-names></name>
<name><surname>Vermeulen</surname> <given-names>R</given-names></name>
<name><surname>Weinberg</surname> <given-names>RS</given-names></name>
<name><surname>Dosemeci</surname> <given-names>M</given-names></name>
<etal/>
</person-group>. 
<article-title>Hematotoxicity in workers exposed to low levels of benzene</article-title>. <source>Science</source>. (<year>2004</year>) <volume>306</volume>:<page-range>1774&#x2013;6</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1102443</pub-id>, PMID: <pub-id pub-id-type="pmid">15576619</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<label>15</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gold</surname> <given-names>P</given-names></name>
<name><surname>Freedman</surname> <given-names>SO</given-names></name>
</person-group>. 
<article-title>Demonstration of tumor-specific antigens in human colonic carcinomata by immunological tolerance and absorption techniques</article-title>. <source>J Exp Med</source>. (<year>1965</year>) <volume>121</volume>:<page-range>439&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1084/jem.121.3.439</pub-id>, PMID: <pub-id pub-id-type="pmid">14270243</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<label>16</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Duffy</surname> <given-names>MJ</given-names></name>
</person-group>. 
<article-title>Carcinoembryonic antigen as a marker for colorectal cancer: is it clinically useful</article-title>? <source>Clin Chem</source>. (<year>2001</year>) <volume>47</volume>:<page-range>624&#x2013;30</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/clinchem/47.4.624</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<label>17</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>De Vries</surname> <given-names>BB</given-names></name>
<name><surname>White</surname> <given-names>SM</given-names></name>
<name><surname>Knight</surname> <given-names>SJ</given-names></name>
<name><surname>Regan</surname> <given-names>R</given-names></name>
<name><surname>Homfray</surname> <given-names>T</given-names></name>
<name><surname>Young</surname> <given-names>ID</given-names></name>
<etal/>
</person-group>. 
<article-title>Clinical studies on submicroscopic subtelomeric rearrangements: a checklist</article-title>. <source>J Med Genet</source>. (<year>2001</year>) <volume>38</volume>:<page-range>145&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/jmg.38.3.145</pub-id>, PMID: <pub-id pub-id-type="pmid">11238680</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<label>18</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Grivennikov</surname> <given-names>SI</given-names></name>
<name><surname>Greten</surname> <given-names>FR</given-names></name>
<name><surname>Karin</surname> <given-names>M</given-names></name>
</person-group>. 
<article-title>Immunity, inflammation, and cancer</article-title>. <source>Cell</source>. (<year>2010</year>) <volume>140</volume>:<page-range>883&#x2013;99</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cell.2010.01.025</pub-id>, PMID: <pub-id pub-id-type="pmid">20303878</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<label>19</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Faisal</surname> <given-names>F</given-names></name>
<name><surname>Danelakis</surname> <given-names>A</given-names></name>
<name><surname>Bj&#xf8;rk</surname> <given-names>MH</given-names></name>
<name><surname>Winsvold</surname> <given-names>B</given-names></name>
<name><surname>Matharu</surname> <given-names>M</given-names></name>
<name><surname>Nachev</surname> <given-names>P</given-names></name>
<etal/>
</person-group>. 
<article-title>Prediction of new-onset migraine using clinical-genotypic data from the HUNT Study: a machine learning analysis</article-title>. <source>J Headache Pain</source>. (<year>2025</year>) <volume>26</volume>:<fpage>70</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s10194-025-02014-2</pub-id>, PMID: <pub-id pub-id-type="pmid">40197205</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<label>20</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Luo</surname> <given-names>Q</given-names></name>
<name><surname>Hao</surname> <given-names>H</given-names></name>
<name><surname>Xiwen</surname> <given-names>L</given-names></name>
<name><surname>Qui</surname> <given-names>X</given-names></name>
<name><surname>Liu</surname> <given-names>D</given-names></name>
<name><surname>Liu</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>UBE2D1 as a key biomarker in systemic juvenile idiopathic arthritis: a new perspective on diagnosis and disease activity assessment</article-title>. <source>Arthritis Res Ther</source>. (<year>2025</year>) <volume>27</volume>:<fpage>140</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13075-025-03606-8</pub-id>, PMID: <pub-id pub-id-type="pmid">40635084</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<label>21</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Qi</surname> <given-names>X</given-names></name>
<name><surname>Wang</surname> <given-names>S</given-names></name>
<name><surname>Fang</surname> <given-names>C</given-names></name>
<name><surname>Jia</surname> <given-names>J</given-names></name>
<name><surname>Lin</surname> <given-names>L</given-names></name>
<name><surname>Yuan</surname> <given-names>T</given-names></name>
</person-group>. 
<article-title>Machine learning and SHAP value interpretation for predicting comorbidity of cardiovascular disease and cancer with dietary antioxidants</article-title>. <source>Redox Biol</source>. (<year>2025</year>) <volume>79</volume>:<elocation-id>103470</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.redox.2024.103470</pub-id>, PMID: <pub-id pub-id-type="pmid">39700695</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<label>22</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mantovani</surname> <given-names>A</given-names></name>
<name><surname>Allavena</surname> <given-names>P</given-names></name>
<name><surname>Sica</surname> <given-names>A</given-names></name>
<name><surname>Balkwill</surname> <given-names>F</given-names></name>
</person-group>. 
<article-title>Cancer-related inflammation</article-title>. <source>Nature</source>. (<year>2008</year>) <volume>454</volume>:<page-range>436&#x2013;44</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature07205</pub-id>, PMID: <pub-id pub-id-type="pmid">18650914</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<label>23</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Topol</surname> <given-names>EJ</given-names></name>
</person-group>. 
<article-title>High-performance medicine: the convergence of human and artificial intelligence</article-title>. <source>Nat Med</source>. (<year>2019</year>) <volume>25</volume>:<fpage>44</fpage>&#x2013;<lpage>56</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41591-018-0300-7</pub-id>, PMID: <pub-id pub-id-type="pmid">30617339</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<label>24</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Holmer</surname> <given-names>R</given-names></name>
<name><surname>W&#xe4;tzig</surname> <given-names>GH</given-names></name>
<name><surname>Tiwari</surname> <given-names>S</given-names></name>
<name><surname>Rose-John</surname> <given-names>S</given-names></name>
<name><surname>Kalthoff</surname> <given-names>H</given-names></name>
</person-group>. 
<article-title>Interleukin-6 trans-signaling increases the expression of carcinoembryonic antigen-related cell adhesion molecules 5 and 6 in colorectal cancer cells</article-title>. <source>BMC Cancer</source>. (<year>2015</year>) <volume>15</volume>:<fpage>975</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12885-015-1950-1</pub-id>, PMID: <pub-id pub-id-type="pmid">26673628</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<label>25</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Blanpain</surname> <given-names>C</given-names></name>
<name><surname>Fuchs</surname> <given-names>E</given-names></name>
</person-group>. 
<article-title>Epidermal stem cells of the skin</article-title>. <source>Annu Rev Cell Dev Biol</source>. (<year>2006</year>) <volume>22</volume>:<page-range>339&#x2013;73</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev.cellbio.22.010305.104357</pub-id>, PMID: <pub-id pub-id-type="pmid">16824012</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<label>26</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hamilton</surname> <given-names>RF</given-names> <suffix>Jr</suffix></name>
<name><surname>Thakur</surname> <given-names>SA</given-names></name>
<name><surname>Holian</surname> <given-names>A</given-names></name>
</person-group>. 
<article-title>Silica binding and toxicity in alveolar macrophages</article-title>. <source>Free Radic Biol Med</source>. (<year>2008</year>) <volume>44</volume>:<page-range>1246&#x2013;58</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.freeradbiomed.2007.12.027</pub-id>, PMID: <pub-id pub-id-type="pmid">18226603</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<label>27</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lin</surname> <given-names>Y</given-names></name>
<name><surname>He</surname> <given-names>Z</given-names></name>
<name><surname>Ye</surname> <given-names>J</given-names></name>
<name><surname>Liu</surname> <given-names>Z</given-names></name>
<name><surname>She</surname> <given-names>X</given-names></name>
<name><surname>Gao</surname> <given-names>X</given-names></name>
<etal/>
</person-group>. 
<article-title>Progress in Understanding the IL-6/STAT3 Pathway in Colorectal Cancer</article-title>. <source>Onco Targets Ther</source>. (<year>2020</year>) <volume>13</volume>:<page-range>13023&#x2013;32</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2147/OTT.S278013</pub-id>, PMID: <pub-id pub-id-type="pmid">33376351</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<label>28</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hanahan</surname> <given-names>D</given-names></name>
<name><surname>Weinberg</surname> <given-names>RA</given-names></name>
</person-group>. 
<article-title>Hallmarks of cancer: the next generation</article-title>. <source>Cell</source>. (<year>2011</year>) <volume>144</volume>:<page-range>646&#x2013;74</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cell.2011.02.013</pub-id>, PMID: <pub-id pub-id-type="pmid">21376230</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<label>29</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yu</surname> <given-names>R</given-names></name>
<name><surname>Zhang</surname> <given-names>C</given-names></name>
<name><surname>Yuan</surname> <given-names>M</given-names></name>
<name><surname>Ye</surname> <given-names>S</given-names></name>
<name><surname>Hu</surname> <given-names>T</given-names></name>
<name><surname>Chen</surname> <given-names>S</given-names></name>
<etal/>
</person-group>. 
<article-title>Exercise-induced Metabolite N-lactoyl-phenylalanine Ameliorates Colitis by Inhibiting M1 Macrophage Polarization via the Suppression of the NF-&#x3ba;B Signaling Pathway</article-title>. <source>Cell Mol Gastroenterol Hepatol</source>. (<year>2025</year>) <volume>19</volume>:<elocation-id>101558</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jcmgh.2025.101558</pub-id>, PMID: <pub-id pub-id-type="pmid">40562095</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<label>30</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yuan</surname> <given-names>M</given-names></name>
<name><surname>Chen</surname> <given-names>S</given-names></name>
<name><surname>Lin</surname> <given-names>Z</given-names></name>
<name><surname>Yu</surname> <given-names>R</given-names></name>
<name><surname>Chao</surname> <given-names>K</given-names></name>
<name><surname>Ye</surname> <given-names>S</given-names></name>
<etal/>
</person-group>. 
<article-title>ACSS2-Mediated Histone H4 Lysine 12 Crotonylation (H4K12cr) Alleviates Colitis via Enhancing Transcription of CLDN7</article-title>. <source>Adv Sci (Weinh)</source>. (<year>2025</year>) <volume>12</volume>:<fpage>e00461</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/advs.202500461</pub-id>, PMID: <pub-id pub-id-type="pmid">40650658</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<label>31</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>C</given-names></name>
<name><surname>Yu</surname> <given-names>R</given-names></name>
<name><surname>Li</surname> <given-names>S</given-names></name>
<name><surname>Yuan</surname> <given-names>M</given-names></name>
<name><surname>Hu</surname> <given-names>T</given-names></name>
<name><surname>Liu</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>KRAS mutation increases histone H3 lysine 9 lactylation (H3K9la) to promote colorectal cancer progression by facilitating cholesterol transporter GRAMD1A expression</article-title>. <source>Cell Death Differ</source>. (<year>2025</year>) <volume>32</volume>:<page-range>2225&#x2013;38</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41418-025-01533-4</pub-id>, PMID: <pub-id pub-id-type="pmid">40707783</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<label>32</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ke</surname> <given-names>H</given-names></name>
<name><surname>Li</surname> <given-names>Z</given-names></name>
<name><surname>Li</surname> <given-names>P</given-names></name>
<name><surname>Ye</surname> <given-names>S</given-names></name>
<name><surname>Huang</surname> <given-names>J</given-names></name>
<name><surname>Hu</surname> <given-names>T</given-names></name>
<etal/>
</person-group>. 
<article-title>Dynamic heterogeneity of colorectal cancer during progression revealed clinical risk-associated cell types and regulations in single-cell resolution and spatial context</article-title>. <source>Gastroenterol Rep (Oxf)</source>. (<year>2023</year>) <volume>11</volume>:<elocation-id>goad034</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gastro/goad034</pub-id>, PMID: <pub-id pub-id-type="pmid">37360193</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<label>33</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>J</given-names></name>
<name><surname>Su</surname> <given-names>Y</given-names></name>
<name><surname>Zhang</surname> <given-names>C</given-names></name>
<name><surname>Dong</surname> <given-names>H</given-names></name>
<name><surname>Yu</surname> <given-names>R</given-names></name>
<name><surname>Yang</surname> <given-names>X</given-names></name>
<etal/>
</person-group>. 
<article-title>NCOA3 impairs the efficacy of anti-PD-L1 therapy via HSP90&#x3b1;/EZH2/CXCL9 axis in colon cancer</article-title>. <source>Int Immunopharmacol</source>. (<year>2025</year>) <volume>155</volume>:<elocation-id>114579</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.intimp.2025.114579</pub-id>, PMID: <pub-id pub-id-type="pmid">40215778</pub-id>
</mixed-citation>
</ref>
<ref id="B34">
<label>34</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Erickson</surname> <given-names>GM</given-names></name>
<name><surname>Finkler</surname> <given-names>SA</given-names></name>
</person-group>. 
<article-title>Determinants of market share for a hospital&#x2019;s services</article-title>. <source>Med Care</source>. (<year>1985</year>) <volume>23</volume>:<page-range>1003&#x2013;18</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/00005650-198508000-00008</pub-id>, PMID: <pub-id pub-id-type="pmid">4021577</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1555542">Shengshan Xu</ext-link>, Jiangmen Central Hospital, China</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1708205">Haiyang Yu</ext-link>, Guizhou University of Traditional Chinese Medicine, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3239118">Chi Zhang</ext-link>, University of Texas MD Anderson Cancer Center, United States</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3340461">Yangang Wang</ext-link>, Beijing University of Chinese Medicine Third Affiliated Hospital, China</p></fn>
</fn-group>
</back>
</article>