<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Environ. Sci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Environmental Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Environ. Sci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-665X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1729913</article-id>
<article-id pub-id-type="doi">10.3389/fenvs.2026.1729913</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Predicting environmental pollutant concentrations via cell image-derived damage features using a hybrid model</article-title>
<alt-title alt-title-type="left-running-head">Zhao et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fenvs.2026.1729913">10.3389/fenvs.2026.1729913</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Zhao</surname>
<given-names>Linying</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3250967"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal Analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Anqi</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Yanyan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Jiang</surname>
<given-names>Beier</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal Analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Changyu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing - review and editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Xu</surname>
<given-names>Xiaolong</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing - review and editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Jia</surname>
<given-names>Jianbo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1929199"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing - review and editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal Analysis</role>
</contrib>
</contrib-group>
<aff id="aff1">
<label>1</label>
<institution>Jiangmen Key Laboratory of Synthetic Chemistry and Cleaner Production, School of Environmental and Chemical Engineering; Carbon Neutrality Innovation Center, Wuyi University</institution>, <city>Jiangmen</city>, <country country="CN">China</country>
</aff>
<aff id="aff2">
<label>2</label>
<institution>Guangdong Provincial Laboratory of Chemistry and Fine Chemical Industry Jieyang Center</institution>, <city>Jieyang</city>, <country country="CN">China</country>
</aff>
<aff id="aff3">
<label>3</label>
<institution>School of Emergency Technology and Management; Wuyi University</institution>, <city>Jiangmen</city>, <country country="CN">China</country>
</aff>
<author-notes>
<corresp id="c001">
<label>&#x2a;</label>Correspondence: Jianbo Jia, <email xlink:href="mailto:jbjiagu@163.com">jbjiagu@163.com</email>; Xiaolong Xu, <email xlink:href="mailto:xuxl@wyu.edu.cn">xuxl@wyu.edu.cn</email>
</corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-16">
<day>16</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>14</volume>
<elocation-id>1729913</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>10</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>15</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>29</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Zhao, Li, Zhang, Jiang, Liu, Xu and Jia.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Zhao, Li, Zhang, Jiang, Liu, Xu and Jia</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-16">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Effective detection of environmental pollution relies on reliable methods for determining pollutant concentrations, with cellular damage reflecting pollutant toxicity as a vital detection tool. This study presents a novel quantitative method for predicting environmental pollutant concentrations using cell images and a hybrid model.</p>
</sec>
<sec>
<title>Methods</title>
<p>The approach processes conventional optical microscope images by extracting grayscale statistical features and constructing a hybrid predictive framework that integrates stepwise regression for feature selection and multilayer perceptron for nonlinear modeling, enabling accurate mapping from image-based damage features to pollutant concentrations.</p>
</sec>
<sec>
<title>Results</title>
<p>Experiments show that the model performs consistently well across five cell types: HeLa, A549, HUVEC, PC12, and HaCaT. For example, it achieves an R<sup>2</sup> of 0.9911 on the HeLa test set, demonstrating strong generalization ability and robustness.</p>
</sec>
<sec>
<title>Discussion</title>
<p>The method does not require expensive equipment or complex sample preparation, offering an innovative, rapid, and low&#x2010;cost solution for monitoring environmental pollutant concentrations.</p>
</sec>
</abstract>
<kwd-group>
<kwd>cell image</kwd>
<kwd>environmental toxicology</kwd>
<kwd>grayscale statistical features</kwd>
<kwd>hybrid model</kwd>
<kwd>pollutant concentration prediction</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. We acknowledge financial support from the National Natural Science Foundation of China (Grant Nos. 22536007 and 22274117), Education Department of Guangdong Province (Grant No. 2022ZDJS027).</funding-statement>
</funding-group>
<counts>
<fig-count count="8"/>
<table-count count="5"/>
<equation-count count="0"/>
<ref-count count="39"/>
<page-count count="13"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Toxicology, Pollution and the Environment</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<label>1</label>
<title>Introduction</title>
<p>Cell damage is a direct reflection of the effects of environmental pollutants on living organisms (<xref ref-type="bibr" rid="B25">Sheller-Miller et al., 2020</xref>; <xref ref-type="bibr" rid="B37">Yang et al., 2024</xref>), and is gradually becoming an effective way to detect pollutant concentrations. Pollutants enter organisms through water, atmosphere or soil, and then cause physiological damage to cells (<xref ref-type="bibr" rid="B37">Yang et al., 2024</xref>; <xref ref-type="bibr" rid="B28">Suzuki et al., 2020</xref>; <xref ref-type="bibr" rid="B22">Pereira et al., 2021</xref>), and the extent of this damage is closely related to the pollutant concentration. The interference of environmental pollutants on cell functions is usually shown to be concentration dependent; that is, the greater the concentration of pollutants, the more significant the damage or functional interference to cells (<xref ref-type="bibr" rid="B6">Chukhlovin et al., 2001</xref>; <xref ref-type="bibr" rid="B35">Xin et al., 2015</xref>). Therefore, the degree of cellular damage can be used as a sensitive response to changes in pollutant concentrations, providing a scientific basis for the quantitative detection of pollutants. This method not only has important application value in the concentration detection of environmental pollutants, but also can provide new technical means for environmental toxicology research.</p>
<p>In the fields of environmental toxicology, drug discovery and disease diagnosis, cellular damage usually reflects the effects of external environment or drug treatment on the physiological functions of cells, and common methods of assessing cellular damage mainly include cellular activity assay, determination of cellular oxidative stress markers, and observation of cellular morphology. Cell viability detection methods (<xref ref-type="bibr" rid="B11">Kamiloglu et al., 2020</xref>) can be roughly divided into: the dye exclusion methods, the colorimetric analysis, fluorescent dye methods, the bioluminescence assays (such as Real-time viability assay (<xref ref-type="bibr" rid="B9">Hiers et al., 2024</xref>)) and the flow cytometry assays. Measurement of cellular oxidative stress markers is an important tool for assessing the extent of oxidative damage to cells, such as ROS levels by fluorescent probe assay. In principle, cells are stimulated with morphological changes (e.g., smaller cell size, rounded cells, reduced cell apposition, etc.,) (<xref ref-type="bibr" rid="B12">Kerr et al., 1972</xref>), which can be used as an important means to analyze cell damage. Traditional cell damage assessment methods usually rely on physicochemical indicators for qualitative or semi-quantitative analysis, which is a complex and time-consuming process and relies on specific equipment. In contrast, cell images provide rich structural and optical information, and analyzing the multidimensional features of the images through machine learning is expected to provide a more accurate and convenient way for contaminant toxicity assessment.</p>
<p>However, morphological analysis typically relies on complex image segmentation and parameter calculations, making it susceptible to interference from imaging conditions, cell density, and segmentation errors, affecting feature consistency and reproducibility (<xref ref-type="bibr" rid="B4">Chen et al., 2012</xref>). In contrast, grayscale distribution features directly reflect changes in optical density within cellular regions and are more sensitive to alterations in intracellular composition, density, and translucency caused by damage. This feature is computationally simple, highly stable, and less dependent on segmentation accuracy, making it more suitable as a robust indicator for high-throughput, automated analysis. Therefore, this study chooses grayscale distribution as the basic feature to establish a reliable and reproducible quantitative relationship between cell damage and contaminant concentration.</p>
<p>Previously, we developed a method based on grayscale frequency analysis to quantify the degree of cellular damage using image brightness, which achieved good results (<xref ref-type="bibr" rid="B16">Li et al., 2025</xref>). However, this method, which relies only on grayscale frequency analysis by calculating the ratio of the number of maximum pixel points in abnormal regions to the total number of maximum pixel points within normal and abnormal regions, may not adequately capture the complex information in cell images. We propose the use of hybrid models to capture complex information in cell images. Based on our experimental research observations, we found that the gray-scale distribution data of cell images can be used as an effective indicator of cell damage for quantitative analysis of environmental pollutant concentrations. However, direct processing of all gray-scale distribution data may lead to redundant information and increased computational cost, so feature selection methods are needed to extract the most representative information to improve model efficiency and performance. Feature selection methods have helped us simplify the data, but in order to mine the information in the data more comprehensively, we introduce a hybrid model based on feature selection. Hybrid modeling significantly improves model performance by integrating the strengths of multiple methods and compensating for the weaknesses of a single method. Many hybrid methods have been reported and shown excellent results in several application areas. For example, Improved Principal Component Analysis-Convolutional Neural Network-Long and Short-Term Memory Network (improved PCA-CNN-LSTM) (<xref ref-type="bibr" rid="B39">Zhu et al., 2023</xref>), Principal Component Analysis- Back Propagation-Artificial Neural Network (PCA-BP-ANN) (<xref ref-type="bibr" rid="B23">Sadrara and Khorrami, 2023</xref>), Principal Component Analysis-Ridge Regression (PCA-Ridge Regression) (<xref ref-type="bibr" rid="B30">Wang W. Y. et al., 2021</xref>), and so on.</p>
<p>In summary, cellular images provide an intuitive means for assessing pollutant toxicity, yet constructing a high-precision, low-cost quantitative prediction system still faces dual challenges. First, the grayscale frequency analysis method we previously proposed has significant limitations (<xref ref-type="bibr" rid="B16">Li et al., 2025</xref>). It relies solely on a single statistical measure, failing to fully leverage the rich grayscale distribution information within cellular images, resulting in insufficient prediction accuracy and robustness. More critically, mainstream detection technologies for environmental pollutant concentrations, such as electrochemical sensors, infrared spectroscopy, and mass spectrometry, While highly accurate, generally require expensive, specialized instruments and involve complex sample pretreatment (<xref ref-type="bibr" rid="B15">Kumunda et al., 2021</xref>; <xref ref-type="bibr" rid="B19">Meher and Zarouri, 2025</xref>). This makes achieving low-cost, high-throughput rapid screening difficult. Addressing these dual bottlenecks of &#x201c;insufficient feature utilization&#x201d; and &#x201c;excessive equipment dependency,&#x201d; this study aims to explore a novel &#x201c;one-stop&#x201d; prediction paradigm: starting directly from cell images obtained via conventional optical microscopy, extracting their full-band grayscale statistical features, and constructing intelligent prediction models to ultimately achieve precise quantitative determination of pollutant concentrations.</p>
<p>To this end, we propose the stepwise regression&#x2013;multilayer perceptron (SR-MLP) hybrid model and compare it with two linear hybrid variants: stepwise regression&#x2013;linear regression (SR-LR) and stepwise regression&#x2013;ridge regression (SR-RR). The dataset is divided into training and testing sets in an 8:2 ratio for all three models. SR-LR combines stepwise regression with linear regression, offering simplicity but a tendency to overfit. SR-RR integrates stepwise regression (SR) with ridge regression (RR), which mitigates multicollinearity through L2 regularization, yet remains limited to linear mappings. In contrast, SR-MLP retains SR for feature selection and further employs a multilayer perceptron with L2 regularization to model nonlinear interactions, effectively capturing complex relationships between features and pollutant concentrations. Experimental results demonstrate that while SR-LR and SR-RR perform adequately under linear assumptions, SR-MLP achieves superior fitting and generalization in scenarios involving nonlinear dependencies. Moreover, SR-MLP consistently surpasses baseline models without feature selection (linear regression (LR), RR, and multilayer perceptron (MLP)) across all evaluation metrics, confirming its enhanced accuracy and robustness. Thus, SR-MLP provides a more accurate and flexible approach for quantifying environmental pollutants and elucidating their dose-dependent impact on cellular damage.</p>
<p>The proposed SR-MLP hybrid framework in this study innovates by establishing a new paradigm for quantitative mapping between &#x201c;image features and pollutant concentrations&#x201d; that does not rely on complex model architectures or high computational resources. Current mainstream approaches in bioimage analysis typically rely on deep learning models such as convolutional neural networks (CNNs) or Transformers to extract multi-level, structured visual features (<xref ref-type="bibr" rid="B26">Shobayo and Saatchi, 2025</xref>). While these methods possess strong feature representation capabilities, they often suffer from limitations including complex model structures, high training costs, strong dependence on large-scale labeled data, and relatively weak interpretability (<xref ref-type="bibr" rid="B3">Atabansi et al., 2023</xref>). In contrast, this study demonstrates for the first time that one-dimensional grayscale statistical features extracted solely from cell images can establish a highly accurate quantitative relationship with pollutant concentrations through feature selection (SR) and nonlinear modeling (MLP). This approach significantly reduces model complexity and computational overhead while maintaining predictive performance. It enhances transparency in feature selection and interpretability of results, offering a lighter, more deployable solution for rapid environmental pollutant detection. Therefore, the core contributions of this study can be summarized as follows:<list list-type="order">
<list-item>
<p>Proposing the SR-MLP hybrid model to achieve high-precision pollutant concentration prediction across cell types.</p>
</list-item>
<list-item>
<p>Validating the &#x201c;one-stop&#x201d; quantitative prediction paradigm based on image damage features for its cross-cell universality and robustness.</p>
</list-item>
<list-item>
<p>Establishing a new low-cost, non-invasive, and easily deployable imaging-based detection scheme for environmental pollutants.</p>
</list-item>
</list>
</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Experiments and data</title>
<sec id="s2-1">
<label>2.1</label>
<title>Data acquisition and image processing</title>
<p>First, well-conditioned HeLa cells were spread in six-well plates and cultured in adherence at an inoculum density of 1 &#xd7; 10<sup>6</sup> cells/mL per well for 24&#xa0;h. Then, cells were stimulated with Diniconazole (DIN) at concentrations of 0, 2.5, 5, 10, and 20&#xa0;&#x3bc;mol/L for 24&#xa0;h. The culture environment was maintained at 37&#xa0;&#xb0;C and 5% CO<sub>2</sub>. After stimulation, bright-field imaging was performed using a 10&#xd7; objective of an optical microscope (OLYMPUS CKX53), and conditions such as exposure time and light intensity were kept consistent to ensure uniform imaging conditions for all sample images. One hundred images were acquired for each concentration, and the resolution of the images was 3072 &#xd7; 2048 pixels, totaling 500 samples. For HUVEC, and HaCaT cells, stimulation was performed using DIN at concentrations of 0, 2.5, 5, 10, and 20&#xa0;&#x3bc;mol/L, and a total of 150 samples were collected. For A549 cells, stimulation was performed using DIN at concentrations of 0, 12.5, 25, and 50&#xa0;&#x3bc;mol/L, and a total of 120 samples were collected. For PC12 cells, stimulation was performed using DIN at concentrations of 0, 5, 10, 20 and 40&#xa0;&#x3bc;mol/L, and a total of 150 samples were collected. It should be noted that this study adopted a phased image acquisition strategy. Initially, HeLa cells were used as the model system for method development. To ensure statistical robustness and provide a solid data foundation for feature analysis, 100 images were collected at each concentration. After successful method validation, to assess its cross-cell line generalization ability and feasibility in scenarios with limited resources, 30 images were collected per concentration in the subsequent experiments with A549, HUVEC, PC12, and HaCaT cells.</p>
<p>In order to further analyze the grayscale characteristics of the cellular regions, we performed batch automatic segmentation of the cellular images by calling Cellpose&#x2019;s API and exported the corresponding masks (<xref ref-type="bibr" rid="B27">Stringer et al., 2021</xref>). Cell segmentation was performed using the Cellpose pre-trained model (cyto3). The parameters were set as follows: automatic diameter estimation, grayscale image channels, a flow threshold of 0.4, and a minimum cell size of 15 pixels. Tiled processing and network averaging were enabled to balance the processing of large images with segmentation accuracy. All segmentation tasks were accelerated using GPU processing. To visually demonstrate the image segmentation results, we overlaid the mask generated by Cellpose onto the original image during the image processing stage in <xref ref-type="fig" rid="F1">Figure 1</xref>. This clearly shows the extracted cell regions (as illustrated by the grayscale example in the image processing module), thereby providing an intuitive basis for quality verification in subsequent grayscale feature extraction. Then, we batch-calculated the grayscale values of cell regions and their corresponding pixel numbers based on mask, and adjusted the data with normalization based on the average occupancy of all samples to ensure comparability among different images. Ultimately, we constructed five datasets containing the cell grayscale distribution and DIN concentration for subsequent analysis and modeling.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Framework diagram for methodological design and modeling.</p>
</caption>
<graphic xlink:href="fenvs-14-1729913-g001.tif">
<alt-text content-type="machine-generated">Flowchart illustrates a machine learning pipeline for image-based data from five datasets&#x2014;HeLa, A549, Huvec, PC12, HaCaT&#x2014;covering image processing, model development using SR-LR, SR-RR, and SR-MLP, model evaluation with R squared, RMSE, and MAE, followed by selection of a multilayer perceptron network architecture with regression, and output shown as a predicted versus actual value plot.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s2-2">
<label>2.2</label>
<title>Data preprocessing</title>
<p>We performed a visual analysis of the samples at each concentration, using the sample stimulated with 10&#xa0;&#x3bc;mol/L DIN in HeLa cells as an example. <xref ref-type="fig" rid="F2">Figure 2</xref> shows the grayscale distribution of 100 representative samples, where a small number of outliers were observed. To address this, we applied the interquartile range (IQR) method to remove outliers (<xref ref-type="bibr" rid="B29">Swami et al., 2023</xref>). When the scaling factor k &#x3d; 3, it effectively eliminated apparent outlier curves while retaining most of the samples, thereby enhancing data reliability and preventing outliers from negatively affecting the model. Observing the gray scale distribution curve after removing the outliers in <xref ref-type="fig" rid="F3">Figure 3</xref>, we found that the data still has a certain degree of dispersion. Therefore, we standardized the data to make the data obey the standard normal distribution, which in turn improves the training effect of the model (<xref ref-type="bibr" rid="B20">Muhammad and Faraj, 2014</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Raw grayscale distribution of HeLa cells stimulated by 10&#xa0;&#x3bc;mol/L DIN.</p>
</caption>
<graphic xlink:href="fenvs-14-1729913-g002.tif">
<alt-text content-type="machine-generated">Line graph showing multiple color-coded curves representing pixel count versus gray levels ranging from zero to two hundred fifty-five. All curves peak sharply near a gray level of one hundred, then gradually decrease, with a small spike near two hundred fifty.</alt-text>
</graphic>
</fig>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Grayscale distribution of HeLa cells stimulated by 10&#xa0;&#x3bc;mol/L DIN after processing with the IQR method.</p>
</caption>
<graphic xlink:href="fenvs-14-1729913-g003.tif">
<alt-text content-type="machine-generated">Line graph showing pixel count versus gray levels (zero to two hundred fifty-five) with multiple colored curves. All curves peak sharply near gray level one hundred and have a secondary small peak near two hundred fifty.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec sec-type="methods" id="s3">
<label>3</label>
<title>Methods</title>
<p>We observed an increase in cell dehiscence and a tendency towards a rounded morphology with increasing DIN concentration, which may be attributed to DIN-induced apoptosis, leading to coalescence of nuclei and cytoplasm, gradual contraction of the cells and loss of adhesion, and the eventual formation of membrane-encapsulated apoptotic vesicles, which resulted in a rounded morphology of the cells (<xref ref-type="bibr" rid="B12">Kerr et al., 1972</xref>). Intuitively, the surrounding brightness of round cells is high, and the grayscale values of damaged cells are mainly concentrated in the 200-255 interval (e.g., <xref ref-type="fig" rid="F4">Figure 4</xref>), and the number of pixels in this interval tends to increase with increasing DIN concentration (e.g., <xref ref-type="fig" rid="F5">Figure 5</xref>). We inferred that there is a certain quantitative relationship between the gray scale distribution of cell images and pollutant concentration. To further explore this relationship, we chose three hybrid modeling approaches: SR-LR, SR-RR, and SR-MLP. The feature selection methods, modeling approaches, optimization strategies, and model evaluation metrics of these three models are briefly described below. The specific modeling framework of the methodology is shown in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Grayscale distribution of normal cells and abnormal cells.</p>
</caption>
<graphic xlink:href="fenvs-14-1729913-g004.tif">
<alt-text content-type="machine-generated">Line graph compares pixel count versus gray level values from zero to two hundred fifty-five for normal cells (solid orange), abnormal cells (dashed green), and all cells (dotted red), showing peaks near gray level one hundred for all and normal cells, and a lower, broader peak for abnormal cells.</alt-text>
</graphic>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Pixel distribution of abnormal cells in high grayscale range (200-255) at different DIN concentrations.</p>
</caption>
<graphic xlink:href="fenvs-14-1729913-g005.tif">
<alt-text content-type="machine-generated">Line graph showing pixel count versus gray levels from 200 to 255 for five concentrations: 20.0, 10.0, 5.0, 2.5, and 0.0 micromoles per liter. Higher concentrations show sharper peaks at gray level 245.</alt-text>
</graphic>
</fig>
<sec id="s3-1">
<label>3.1</label>
<title>SR</title>
<p>SR is a feature selection method based on statistical significance (P-value). It iteratively filters out the most relevant features to the target variable, thus reducing redundant features and improving the efficiency and predictive power of the model (<xref ref-type="bibr" rid="B38">Zhou and Jiang, 2016</xref>).</p>
</sec>
<sec id="s3-2">
<label>3.2</label>
<title>SR-LR and SR-RR</title>
<p>The SR-LR model is a combination of SR and LR, which is a simple and interpretable method of linear modeling through screened features (<xref ref-type="bibr" rid="B10">James et al., 2023</xref>). The SR-RR model introduces L2 regularization on this basis, i.e., it is a combination of SR and RR. RR reduces multicollinearity through L2 regularization, limits model weights, and reduces the risk of overfitting, thus improving the stability and predictive ability of the model (<xref ref-type="bibr" rid="B31">Wang X. et al., 2021</xref>). The advantage of RR is that it can better handle the situation of correlation between features and control the model complexity while maintaining the linear modeling framework.</p>
</sec>
<sec id="s3-3">
<label>3.3</label>
<title>SR-MLP</title>
<p>In the SR-MLP model, we employ the MLP for nonlinear modeling. The MLP is a feedforward neural network consisting of multiple hidden layers, which captures complex nonlinear relationships in data through weighted summation and activation functions (<xref ref-type="bibr" rid="B18">Liu et al., 2022</xref>). The structure of the MLP&#x2014;such as the number of hidden layers, the number of neurons, and the activation functions&#x2014;can be flexibly adjusted according to the specific task requirements. In this study, we constructed an MLP network with three hidden layers, containing 72, 48, and 24 neurons, respectively. The hidden layers use the Rectified Linear Unit (ReLU) activation function to enhance the modeling capability for complex nonlinear relationships (<xref ref-type="bibr" rid="B2">Alkhouly et al., 2021</xref>; <xref ref-type="bibr" rid="B8">Fu et al., 2020</xref>), while the output layer employs a linear transformation (Linear) to directly output continuous predictions for the regression task (<xref ref-type="bibr" rid="B13">K&#x131;l&#x131;&#xe7;arslan et al., 2021</xref>).</p>
<p>To prevent overfitting and enhance the model&#x2019;s generalization capability, we employed the following regularization strategies during training: First, L2 regularization was introduced by adding a weight penalty term to the loss function, thereby constraining the magnitude of weights and suppressing overfitting (<xref ref-type="bibr" rid="B34">Xie et al., 2022</xref>). Second, the Dropout method was applied to randomly drop a portion of hidden layer neurons during training, reducing model complexity and further improving its generalization ability (<xref ref-type="bibr" rid="B24">Salehin and Kang, 2023</xref>). We monitored the trends of training loss and validation loss to guide hyperparameter optimization. Model convergence was considered satisfactory when both losses decreased smoothly, remained closely aligned, and eventually stabilized. A scenario where training loss continued to decline while validation loss plateaued or increased prematurely indicated potential overfitting, whereas persistently high losses with slow reduction suggested underfitting (<xref ref-type="bibr" rid="B32">Wang et al., 2022</xref>). Accordingly, we systematically adjusted hyperparameters including the number of training epochs, batch size, regularization strength, learning rate, and Dropout rate to achieve optimal convergence performance.</p>
</sec>
<sec id="s3-4">
<label>3.4</label>
<title>Evaluation metrics</title>
<p>To fully evaluate the performance of the hybrid model, we use the following commonly used metrics:<list list-type="order">
<list-item>
<p>Coefficient of determination (R<sup>2</sup>): a measure of the goodness of fit of the model, the closer the value is to 1 the better the model fits the data and the better the prediction (<xref ref-type="bibr" rid="B5">Chicco et al., 2021</xref>).</p>
</list-item>
<list-item>
<p>Root Mean Square Error (RMSE): a measure of the difference between the predicted value and the true value, emphasizing the effect of larger errors. Smaller values indicate higher model prediction accuracy (<xref ref-type="bibr" rid="B5">Chicco et al., 2021</xref>).</p>
</list-item>
<list-item>
<p>Mean Absolute Error (MAE): Calculates the average of the absolute error between the predicted value and the true value, reflecting the overall error level of the model. The smaller the value indicates the higher the prediction accuracy of the model (<xref ref-type="bibr" rid="B5">chicco et al., 2021</xref>).</p>
</list-item>
</list>
</p>
</sec>
</sec>
<sec sec-type="results|discussion" id="s4">
<label>4</label>
<title>Results and discussion</title>
<sec id="s4-1">
<label>4.1</label>
<title>Analysis of models performance</title>
<p>We evaluated the performance of the three hybrid models (SR-LR, SR-RR, and SR-MLP) and the baseline models (LR, RR, and MLP) using R<sup>2</sup>, RMSE, and MAE metrics, as summarized in <xref ref-type="table" rid="T1">Table 1</xref>. The results indicate that all hybrid models incorporating SR outperformed their non-SR counterparts across most datasets, underscoring the efficacy of SR in feature selection for enhancing model performance. And among these three hybrid models, the R<sup>2</sup> values of SR-MLP on all cellular datasets were significantly better than those of SR-LR and SR-RR and higher than 0.9, indicating a better fitting ability. In the case of the HeLa cell dataset, for example, the R<sup>2</sup> of SR-MLP was as high as 0.9919, while SR-LR and SR-RR were 0.9707 and 0.9708, respectively. Moreover, the RMSE and MAE of SR-MLP are lower than those of SR-LR and SR-RR on all datasets, which indicates that its prediction error is smaller and its stability is higher. In contrast, the R<sup>2</sup> of SR-LR and SR-RR was higher than 0.9 on the HeLa, PC12 and HaCaT cell datasets, but lower than 0.9 on the A549 and HUVEC cell datasets, which indicated a poorer fit and limited generalization ability.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>List of statistical parameters.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Dataset</th>
<th align="center">Method</th>
<th align="center">R<sup>2</sup>
</th>
<th align="center">RMSE</th>
<th align="center">MAE</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="6" align="center">HeLa</td>
<td align="center">LR</td>
<td align="center">0.8306</td>
<td align="center">2.7705</td>
<td align="center">1.5626</td>
</tr>
<tr>
<td align="center">RR</td>
<td align="center">0.9386</td>
<td align="center">1.6684</td>
<td align="center">1.0388</td>
</tr>
<tr>
<td align="center">MLP</td>
<td align="center">0.9770</td>
<td align="center">1.1481</td>
<td align="center">0.7993</td>
</tr>
<tr>
<td align="center">SR-LR</td>
<td align="center">0.9707</td>
<td align="center">1.1518</td>
<td align="center">0.8827</td>
</tr>
<tr>
<td align="center">SR-RR</td>
<td align="center">0.9708</td>
<td align="center">1.1504</td>
<td align="center">0.8837</td>
</tr>
<tr>
<td align="center">
<bold>SR-MLP</bold>
</td>
<td align="center">
<bold>0.9911</bold>
</td>
<td align="center">
<bold>0.6364</bold>
</td>
<td align="center">
<bold>0.3730</bold>
</td>
</tr>
<tr>
<td rowspan="6" align="center">A549</td>
<td align="center">LR</td>
<td align="center">0.8453</td>
<td align="center">6.5973</td>
<td align="center">5.6149</td>
</tr>
<tr>
<td align="center">RR</td>
<td align="center">0.8457</td>
<td align="center">6.5899</td>
<td align="center">5.6121</td>
</tr>
<tr>
<td align="center">MLP</td>
<td align="center">0.8786</td>
<td align="center">5.3887</td>
<td align="center">4.5710</td>
</tr>
<tr>
<td align="center">SR-LR</td>
<td align="center">0.8809</td>
<td align="center">5.7900</td>
<td align="center">4.5223</td>
</tr>
<tr>
<td align="center">SR-RR</td>
<td align="center">0.8805</td>
<td align="center">5.8001</td>
<td align="center">4.5419</td>
</tr>
<tr>
<td align="center">
<bold>SR-MLP</bold>
</td>
<td align="center">
<bold>0.9716</bold>
</td>
<td align="center">
<bold>2.8269</bold>
</td>
<td align="center">
<bold>1.5795</bold>
</td>
</tr>
<tr>
<td rowspan="6" align="center">HUVEC</td>
<td align="center">LR</td>
<td align="center">0.7287</td>
<td align="center">3.9980</td>
<td align="center">3.1179</td>
</tr>
<tr>
<td align="center">RR</td>
<td align="center">0.7382</td>
<td align="center">3.9277</td>
<td align="center">3.0682</td>
</tr>
<tr>
<td align="center">MLP</td>
<td align="center">0.8398</td>
<td align="center">2.7994</td>
<td align="center">2.2135</td>
</tr>
<tr>
<td align="center">SR-LR</td>
<td align="center">0.8533</td>
<td align="center">2.9403</td>
<td align="center">2.3650</td>
</tr>
<tr>
<td align="center">SR-RR</td>
<td align="center">0.8507</td>
<td align="center">2.9659</td>
<td align="center">2.3633</td>
</tr>
<tr>
<td align="center">
<bold>SR-MLP</bold>
</td>
<td align="center">
<bold>0.9753</bold>
</td>
<td align="center">
<bold>1.2055</bold>
</td>
<td align="center">
<bold>0.8668</bold>
</td>
</tr>
<tr>
<td rowspan="6" align="center">PC12</td>
<td align="center">LR</td>
<td align="center">0.9340</td>
<td align="center">3.8624</td>
<td align="center">2.8333</td>
</tr>
<tr>
<td align="center">RR</td>
<td align="center">0.9340</td>
<td align="center">3.8628</td>
<td align="center">2.8382</td>
</tr>
<tr>
<td align="center">MLP</td>
<td align="center">0.8942</td>
<td align="center">3.9298</td>
<td align="center">3.3227</td>
</tr>
<tr>
<td align="center">SR-LR</td>
<td align="center">0.9375</td>
<td align="center">3.7580</td>
<td align="center">3.2913</td>
</tr>
<tr>
<td align="center">SR-RR</td>
<td align="center">0.9384</td>
<td align="center">3.7308</td>
<td align="center">3.2686</td>
</tr>
<tr>
<td align="center">
<bold>SR-MLP</bold>
</td>
<td align="center">
<bold>0.9821</bold>
</td>
<td align="center">
<bold>2.0093</bold>
</td>
<td align="center">
<bold>1.3450</bold>
</td>
</tr>
<tr>
<td rowspan="6" align="center">HaCaT</td>
<td align="center">LR</td>
<td align="center">0.9018</td>
<td align="center">2.3391</td>
<td align="center">1.7062</td>
</tr>
<tr>
<td align="center">RR</td>
<td align="center">0.9024</td>
<td align="center">2.3316</td>
<td align="center">1.7084</td>
</tr>
<tr>
<td align="center">MLP</td>
<td align="center">0.8633</td>
<td align="center">2.6931</td>
<td align="center">2.1108</td>
</tr>
<tr>
<td align="center">SR-LR</td>
<td align="center">0.9174</td>
<td align="center">2.1452</td>
<td align="center">1.5500</td>
</tr>
<tr>
<td align="center">SR-RR</td>
<td align="center">0.9140</td>
<td align="center">2.1898</td>
<td align="center">1.5842</td>
</tr>
<tr>
<td align="center">
<bold>SR-MLP</bold>
</td>
<td align="center">
<bold>0.9222</bold>
</td>
<td align="center">
<bold>2.0822</bold>
</td>
<td align="center">
<bold>1.2773</bold>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Datasets: HeLa, A549, Huvec, PC12, and HaCaT represent the five different cell types used in the study. Model development: SR-LR, SR-RR, and SR-MLP stand for the hybrid models &#x201C;stepwise regression&#x2013;linear regression,&#x201D; &#x201C;stepwise regression&#x2013;ridge regression,&#x201D; and &#x201C;stepwise regression&#x2013;multilayer perceptron,&#x201D; respectively. Model evaluation: R<sup>2</sup>, RMSE, and MAE denote the coefficient of determination, root mean square error, and mean absolute error, respectively, which are used to quantify model performance.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>To further assess the predictive power of SR-MLP, we compared the predicted and true values of SR-RR (e.g., <xref ref-type="table" rid="T2">Table 2</xref>) with those of SR-MLP (e.g., <xref ref-type="table" rid="T3">Table 3</xref>) models. Taking the HeLa cell dataset as an example, the predicted values of SR-MLP and SR-RR were 19.44&#xa0;&#x3bc;mol/L and 19.07&#xa0;&#x3bc;mol/L, respectively, at a high concentration of 20&#xa0;&#x3bc;mol/L, whereas the predicted values of SR-MLP and SR-RR were 2.65&#xa0;&#x3bc;mol/L and 3.54&#xa0;&#x3bc;mol/L, respectively, at a low concentration of 2.5&#xa0;&#x3bc;mol/L. It can be seen that the predicted values of SR-MLP are closer to the true values, and the errors are smaller, indicating that the model has the ability to predict the true values at different concentrations. MLP&#x2019;s prediction value is closer to the real value with smaller error, indicating that the model has strong prediction accuracy under different concentration conditions.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Comparison of predicted and true values of the SR-RR model.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="10" align="center">SR-RR</th>
</tr>
<tr>
<th colspan="5" align="center">Predicted (&#x3bc;mol/L)</th>
<th colspan="5" align="center">Actual (&#x3bc;mol/L)</th>
</tr>
<tr>
<th align="center">HeLa</th>
<th align="center">A549</th>
<th align="center">HUVEC</th>
<th align="center">PC12</th>
<th align="center">HaCaT</th>
<th align="center">HeLa</th>
<th align="center">A549</th>
<th align="center">HUVEC</th>
<th align="center">PC12</th>
<th align="center">HaCaT</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">0.24</td>
<td align="center">2.65</td>
<td align="center">3.11</td>
<td align="center">5.71</td>
<td align="center">0.23</td>
<td align="center">0.00</td>
<td align="center">0.00</td>
<td align="center">0.00</td>
<td align="center">0.00</td>
<td align="center">0.00</td>
</tr>
<tr>
<td align="center">3.54</td>
<td align="center">13.60</td>
<td align="center">2.34</td>
<td align="center">4.28</td>
<td align="center">3.54</td>
<td align="center">2.50</td>
<td align="center">12.50</td>
<td align="center">2.50</td>
<td align="center">5.00</td>
<td align="center">2.50</td>
</tr>
<tr>
<td align="center">5.57</td>
<td align="center">30.99</td>
<td align="center">6.97</td>
<td align="center">13.57</td>
<td align="center">0.20</td>
<td align="center">5.00</td>
<td align="center">25.00</td>
<td align="center">5.00</td>
<td align="center">10.00</td>
<td align="center">5.00</td>
</tr>
<tr>
<td align="center">10.33</td>
<td align="center">47.94</td>
<td align="center">8.40</td>
<td align="center">14.84</td>
<td align="center">9.24</td>
<td align="center">10.00</td>
<td align="center">50.00</td>
<td align="center">10.00</td>
<td align="center">20.00</td>
<td align="center">10.00</td>
</tr>
<tr>
<td align="center">19.07</td>
<td align="left">&#x200b;</td>
<td align="center">23.65</td>
<td align="center">40.54</td>
<td align="center">17.82</td>
<td align="center">20.00</td>
<td align="left">&#x200b;</td>
<td align="center">20.00</td>
<td align="center">40.00</td>
<td align="center">20.00</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Comparison of predicted and true values of the SR-MLP model.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="10" align="center">SR-MLP</th>
</tr>
<tr>
<th colspan="5" align="center">Predicted (&#x3bc;mol/L)</th>
<th colspan="5" align="center">Actual (&#x3bc;mol/L)</th>
</tr>
<tr>
<th align="center">HeLa</th>
<th align="center">A549</th>
<th align="center">HUVEC</th>
<th align="center">PC12</th>
<th align="center">HaCaT</th>
<th align="center">HeLa</th>
<th align="center">A549</th>
<th align="center">HUVEC</th>
<th align="center">PC12</th>
<th align="center">HaCaT</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">0.11</td>
<td align="center">0.37</td>
<td align="center">0.20</td>
<td align="center">0.26</td>
<td align="center">0.73</td>
<td align="center">0.00</td>
<td align="center">0.00</td>
<td align="center">0.00</td>
<td align="center">0.00</td>
<td align="center">0.00</td>
</tr>
<tr>
<td align="center">2.65</td>
<td align="center">12.93</td>
<td align="center">3.35</td>
<td align="center">5.29</td>
<td align="center">2.44</td>
<td align="center">2.50</td>
<td align="center">12.50</td>
<td align="center">2.50</td>
<td align="center">5.00</td>
<td align="center">2.50</td>
</tr>
<tr>
<td align="center">4.94</td>
<td align="center">27.29</td>
<td align="center">5.05</td>
<td align="center">10.80</td>
<td align="center">2.92</td>
<td align="center">5.00</td>
<td align="center">25.00</td>
<td align="center">5.00</td>
<td align="center">10.00</td>
<td align="center">5.00</td>
</tr>
<tr>
<td align="center">9.92</td>
<td align="center">49.85</td>
<td align="center">8.98</td>
<td align="center">18.95</td>
<td align="center">10.96</td>
<td align="center">10.00</td>
<td align="center">50.00</td>
<td align="center">10.00</td>
<td align="center">20.00</td>
<td align="center">10.00</td>
</tr>
<tr>
<td align="center">19.44</td>
<td align="left">&#x200b;</td>
<td align="center">19.75</td>
<td align="center">42.48</td>
<td align="center">20.11</td>
<td align="center">20.00</td>
<td align="left">&#x200b;</td>
<td align="center">20.00</td>
<td align="center">40.00</td>
<td align="center">20.00</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s4-2">
<label>4.2</label>
<title>Analysis of feature generalisation of cross-cell</title>
<p>In order to reduce data dimensionality and enhance model stability, we employed the SR method to screen gray-scale features based on statistical significance. During the screening process, differentiated p-value inclusion thresholds (ranging from &#x3c;0.001 to &#x3c;0.05) were set according to the data characteristics of different cell datasets and the need to control model complexity. Specifically, for the HeLa dataset, which exhibited clearer feature-concentration relationships and higher data quality, a stricter threshold (p &#x3c; 0.001) was applied to construct a highly concise initial feature set. For the other datasets, relatively lenient thresholds (p &#x3c; 0.05 or p &#x3c; 0.01) were adopted to retain more potentially relevant feature information for the subsequent MLP to perform nonlinear learning. The setting of all thresholds followed the statistical principle of controlling Type I errors while also considering the connection with the subsequent nonlinear modeling stage (<xref ref-type="bibr" rid="B1">Aguinis et al., 2021</xref>).</p>
<p>Despite the differences, the screening results also indicate some similarities among key features across different cell datasets, as shown in <xref ref-type="table" rid="T4">Table 4</xref>. For instance, feature 244 was selected in the HeLa, A549, and HUVEC cell datasets, while key feature 204 for PC12 cells and key feature 248 for HaCaT cells, along with feature 244, all fell within the gray-scale range of 200&#x2013;255. This suggests that these features may possess strong generalizability across different cell types and can stably reflect the effects of pollutants on cells. The gray-scale range of 200&#x2013;255 typically corresponds to abnormal cells, and features within this range exhibit more significant variations. Moreover, the features screened in this range demonstrated better p-values, further validating the importance of these features in the cellular damage response. Therefore, during the feature selection process, we focused on the key features of cell damage and controlled the number of features within 20 to optimize the computational efficiency and generalization capability of the model.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Features of five cell types screened by SR method.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Dataset</th>
<th align="left">P-value</th>
<th align="left">Filtered features (grayscale values)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">HeLa</td>
<td align="center">&#x3c;0.001</td>
<td align="center">27, 49, 77, 81, 115, 133, 136, 183, 231, 238, 242, 244, 245, 250</td>
</tr>
<tr>
<td align="center">A549</td>
<td align="center">&#x3c;0.05</td>
<td align="center">32, 37, 39, 40, 54, 97, 215, 218, 221, 244</td>
</tr>
<tr>
<td align="center">HUVEC</td>
<td align="center">&#x3c;0.05</td>
<td align="center">16, 18, 20, 41, 47, 48, 52, 54, 117, 159, 180, 186, 191, 198, 220, 223, 244, 247</td>
</tr>
<tr>
<td align="center">PC12</td>
<td align="center">&#x3c;0.01</td>
<td align="center">16, 18, 20, 54, 55, 76, 83, 90, 118, 193, 194, 197, 200, 204</td>
</tr>
<tr>
<td align="center">HaCaT</td>
<td align="center">&#x3c;0.005</td>
<td align="center">12, 37, 52, 56, 64, 66, 67, 77, 122, 124, 127, 159, 172, 192, 248</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s4-3">
<label>4.3</label>
<title>SHAP-based analysis of the importance of high-grayscale features</title>
<p>To elucidate the contribution of key features in the SR-MLP model to pollutant concentration prediction, we applied the SHapley Additive exPlanations (SHAP) method. Derived from game-theoretic Shapley values, SHAP provides a consistent and interpretable quantification of feature contributions. Using SHAP&#x2019;s Explainer, we computed SHAP values for key features on the test set and visualized the results with beeswarm plots. In these plots, the X-axis represents SHAP values (indicating directional contribution), the Y-axis lists features in descending order of mean absolute SHAP value (importance), and point color reflects the original feature magnitude (red for high, blue for low), thus enabling an intuitive assessment of how feature values relate to their predictive influence (<xref ref-type="bibr" rid="B7">Ekanayake et al., 2022</xref>).</p>
<p>Analysis results are highly consistent with the key features selected based on statistical significance, strongly confirming the experimental finding that &#x201c;features in the high grayscale range (200&#x2013;255) are the core drivers for predicting pollutant concentration.&#x201d; The SHAP importance ranking reveals that across all cell types, features located within this high-brightness interval dominate (The SHAP beeswarm plot for HeLa cells is shown in <xref ref-type="fig" rid="F6">Figure 6</xref>, while the corresponding results for the remaining cell types (A549, HUVEC, PC12, HaCaT) are provided in the Supporting Information as <xref ref-type="sec" rid="s12">Supplementary Figures S1&#x2013;S4</xref>). Specifically, in HeLa cells, the top three features by importance are 242, 245, and 244; in A549 cells, they are 244, 221, and 218; in Huvec cells, they are 244, 198, and 48; in PC12 cells, they are 204, 76, and 200; and in HaCaT cells, they are 192, 37, and 172. It is particularly noteworthy that feature 244 ranks highly in HeLa, A549, and HUVEC cells, indicating its stable predictive ability across different cell types. The results for HaCaT cells show certain particularities: the top-ranked feature in SHAP importance is 192, which, although close to, does not fully fall within the 200&#x2013;255 high-brightness range. This may suggest that under DIN stimulation, HaCaT cells exhibit differences in brightness response thresholds or grayscale distribution patterns related to morphological damage compared to other cell lines&#x2014;for example, a smaller increase in brightness during apoptosis or interference from optical properties of other subcellular structures. This phenomenon warrants further investigation in future studies, considering cell type specificity.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>SHAP beeswarm plot for the HeLa cell.</p>
</caption>
<graphic xlink:href="fenvs-14-1729913-g006.tif">
<alt-text content-type="machine-generated">Scatter plot shows SHAP values for various features, where each dot&#x27;s position along the x-axis reflects feature influence and color indicates high (red) or low (blue) feature value.</alt-text>
</graphic>
</fig>
<p>In <xref ref-type="fig" rid="F6">Figure 6</xref>, key high-grayscale features (such as 242, 245, and 244) exhibit a distribution where blue points are concentrated on the left side of the X-axis, indicating that their lower feature values are associated with negative SHAP values. This suggests that the model has learned not a simple linear positive correlation but a more complex nonlinear response relationship: it is likely that only when these feature values exceed a certain threshold do they contribute positively and clearly to the prediction of high concentrations. This precise capture of nonlinear dependencies and feature interactions is precisely the intrinsic key to the SR-MLP model&#x2019;s ability to achieve high-precision predictions.</p>
<p>Overall, although individual features exhibit complex nonlinear influences in their SHAP values, from the perspective of overall feature importance ranking and dominant patterns, these observations align highly with morphological findings: after DIN stimulation, cells contract, become rounded, and gradually detach, leading to a significant increase in brightness in the cell regions, with grayscale values concentrated in the 200&#x2013;255 range (as shown in <xref ref-type="fig" rid="F4">Figure 4</xref>). Therefore, SHAP analysis confirms, at the level of model decision-making mechanisms, that the model ultimately relies on and integrates the information carried by these high-grayscale features, thereby successfully mapping the biological causal relationship between &#x201c;the degree of cellular damage (manifested as an increase in high-brightness pixels) and the rise in pollutant concentration.&#x201d;</p>
</sec>
<sec id="s4-4">
<label>4.4</label>
<title>Analysis of model training and convergence</title>
<p>By monitoring the trends of training loss and validation loss, we systematically optimized the hyperparameters of the SR-MLP model. The optimized hyperparameter configurations are presented in <xref ref-type="table" rid="T5">Table 5</xref>. As shown in <xref ref-type="fig" rid="F7">Figure 7</xref>, after tuning, both the training loss and validation loss exhibited a smooth downward trend and eventually stabilized, maintaining a small gap between them without evident divergence or premature convergence. These results indicate that the model did not suffer from overfitting or underfitting during training, demonstrating good convergence behavior and generalization ability (<xref ref-type="bibr" rid="B32">Wang et al., 2022</xref>). This validates the effectiveness of the adopted regularization strategies and hyperparameter configurations.</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Hyperparameter list with Mult. (multiplicity coefficient in IQR), Reg. (L2 regularization coefficient), Dropout 1 (first layer Dropout Ratio), Dropout 2 (second layer Dropout Ratio), Dropout 3 (third layer Dropout Ratio), LR (Learning Rate), Epochs (Training rounds) and Batch Size.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Dataset</th>
<th align="center">Method</th>
<th align="center">Mult</th>
<th align="center">Reg</th>
<th align="center">Dropout_1</th>
<th align="center">Dropout_2</th>
<th align="center">Dropout_3</th>
<th align="center">LR</th>
<th align="center">Epochs</th>
<th align="center">Batch size</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="2" align="center">HeLa</td>
<td align="center">SR-RR</td>
<td align="center">3</td>
<td align="center">0.01</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="center">SR-MLP</td>
<td align="center">3</td>
<td align="center">0.01</td>
<td align="center">0.1</td>
<td align="center">0.1</td>
<td align="center">0.1</td>
<td align="center">0.01</td>
<td align="center">200</td>
<td align="center">32</td>
</tr>
<tr>
<td rowspan="2" align="center">A549</td>
<td align="center">SR-RR</td>
<td align="center">2</td>
<td align="center">0.01</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="center">SR-MLP</td>
<td align="center">2</td>
<td align="center">0.01</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0.01</td>
<td align="center">150</td>
<td align="center">64</td>
</tr>
<tr>
<td rowspan="2" align="center">HUVEC</td>
<td align="center">SR-RR</td>
<td align="center">3</td>
<td align="center">0.01</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="center">SR-MLP</td>
<td align="center">3</td>
<td align="center">0.01</td>
<td align="center">0.1</td>
<td align="center">0.1</td>
<td align="center">0.1</td>
<td align="center">0.01</td>
<td align="center">200</td>
<td align="center">32</td>
</tr>
<tr>
<td rowspan="2" align="center">PC12</td>
<td align="center">SR-RR</td>
<td align="center">2</td>
<td align="center">0.01</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="center">SR-MLP</td>
<td align="center">2</td>
<td align="center">0.01</td>
<td align="center">0.1</td>
<td align="center">0.1</td>
<td align="center">0</td>
<td align="center">0.01</td>
<td align="center">400</td>
<td align="center">64</td>
</tr>
<tr>
<td rowspan="2" align="center">HaCaT</td>
<td align="center">SR-RR</td>
<td align="center">3</td>
<td align="center">0.01</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="center">SR-MLP</td>
<td align="center">3</td>
<td align="center">0.01</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0</td>
<td align="center">0.01</td>
<td align="center">300</td>
<td align="center">64</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Loss profiles of SR-MLP model for five cell types (<bold>(a&#x2013;e)</bold> are HeLa, A549, PC12, HUVEC, and HaCaT cells in that order).</p>
</caption>
<graphic xlink:href="fenvs-14-1729913-g007.tif">
<alt-text content-type="machine-generated">Grouped figure containing five line graphs labeled a through e, each showing training and test loss versus epochs. All graphs exhibit sharp loss decreases during initial epochs followed by stabilization, with both train and test lines closely aligned. Legends distinguish blue for train loss and orange for test loss. Axes labels are consistent, with loss on the y-axis and epochs on the x-axis, highlighting model training progress across different scenarios.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s4-5">
<label>4.5</label>
<title>Analysis of the superiority of nonlinear modeling methods</title>
<p>Based on the comparison of model performance, we conducted an in-depth analysis of the fundamental reasons behind the superior performance of the SR-MLP model. Analysis reveals that the core reason for the superior predictive performance of SR-MLP over SR-LR and SR-RR is its ability to model nonlinear relationships. The SR-LR and SR-RR model are based on linear regression, which assumes a simple linear relationship between the input features and pollutant concentrations, whereas SR-MLP is able to capture more complex patterns through a multilayered neural network and nonlinear activation functions. To validate the nonlinear relationship between the variables, we visualized the relationship between features and concentrations and used polynomial fit curves to observe data trends. Common manifestations of nonlinearity: the fitted curve is not a straight line, has inflection points, and exhibits significant curvature or fluctuation (e.g., U-shape (<xref ref-type="bibr" rid="B36">Yang et al., 2020</xref>), inverted U-shape (<xref ref-type="bibr" rid="B36">Yang et al., 2020</xref>; <xref ref-type="bibr" rid="B21">Northoff and Tumati, 2019</xref>), and S-shape (<xref ref-type="bibr" rid="B33">Xiao et al., 2009</xref>), etc.). By observing the variable fitting curves of HeLa cells as in <xref ref-type="fig" rid="F8">Figure 8</xref>, we found that the fitting curves of most of the features showed obvious nonlinearities, such as Feature 115 and Feature 133 showed U-shape variations. The results indicate that SR-MLP overcomes the limitations of the SR-LR and SR-RR linearity assumption by modeling nonlinear relationships, and is able to more accurately describe the complex mapping between the gray-scale features of cell damage and pollutant concentrations, improving the fitting ability and prediction accuracy of the model.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Scatterplot of variables and their fitted curves after stepwise regression for HeLa cells.</p>
</caption>
<graphic xlink:href="fenvs-14-1729913-g008.tif">
<alt-text content-type="machine-generated">Grid of fourteen scatter plots, each displaying the relationship between a specific feature and concentration. Blue dots indicate data points and a red line shows a fitted trend for each feature.</alt-text>
</graphic>
</fig>
<p>Having established the core advantage of the SR-MLP model in handling nonlinear relationships, we further applied it to quantitatively predict environmental pollutant concentrations based on cellular image features. This approach establishes a direct, data-driven correlation between cellular morphological damage severity and pollutant concentration, offering a novel research perspective for environmental toxicity assessment. The efficacy of the SR-MLP framework in environmental concentration prediction is corroborated by related studies. For instance, Liu et al. successfully calibrated air quality monitoring data using a similar hybrid model (<xref ref-type="bibr" rid="B17">Liu et al., 2021</xref>). By transferring and validating this effective modeling strategy at the cellular level, this study proposes a novel, efficient, and reliable computational method for predicting pollutant concentrations based on cellular damage features. This expands the application scope of the hybrid model to microscopic biological response analysis.</p>
</sec>
<sec id="s4-6">
<label>4.6</label>
<title>Analysis of method applicability</title>
<p>To validate the applicability of the method in different cell types, we applied the SR-MLP model to four other cell types (A549, HUVEC, PC12, HaCaT) and evaluated the performance of the model on different cell datasets. As can be seen from the data in <xref ref-type="table" rid="T4">Table 4</xref>, the SR-MLP model showed relatively small errors between the predicted and true values at each concentration level in the HeLa, A549, HUVEC, and PC12 cell datasets, whereas the predictions of certain concentrations in the HaCaT cell dataset were slightly biased, e.g., the predicted value of 2.92&#xa0;&#x3bc;mol/L at 5&#xa0;&#x3bc;mol/L true value, but the predictions of other concentrations were still accurate. This indicates that the model still has good adaptability and generalization ability across different cellular datasets. We found that despite the differences in biological properties and data distribution among cell types, the overall trends were highly similar, and the SR-MLP model was able to accurately predict contaminant concentrations and compare the degree of cellular damage in different cell models.</p>
</sec>
<sec id="s4-7">
<label>4.7</label>
<title>Methodological limitations and future directions</title>
<p>To ensure that changes in image grayscale features primarily reflect the toxic effects of pollutants, this study implemented systematic experimental design and data processing procedures to control for potential confounding factors. Specific measures included: during the cell culture phase, all cell lines were cultured simultaneously in a standard incubator under constant temperature and humidity, using the same batch of culture medium and serum, while controlling passage number and inoculation density to maintain approximate consistency; during the image acquisition phase, all samples were imaged using the same optical microscope and a 10&#xd7; objective, with fixed exposure time, light intensity, and white balance parameters, and each imaging session was preceded by background correction and uniform field calibration; during the image analysis phase, an automated segmentation pipeline based on a pre-trained model (Cellpose cyto3) was employed, with unified flow threshold and minimum cell size settings to eliminate morphological and grayscale biases due to segmentation variability; during data processing, rigorous outlier removal and data normalization procedures were applied.</p>
<p>Nevertheless, we recognize that certain potential confounding factors are difficult to fully eliminate, such as intrinsic cellular heterogeneity (e.g., cell cycle distribution, metabolic state fluctuations) (<xref ref-type="bibr" rid="B14">Kondo et al., 2021</xref>), spontaneous morphological changes unrelated to toxicity that may occur during apoptosis or stress, and potential edge illumination attenuation in microscopic imaging fields despite calibration. These unmeasured or incompletely controlled variables may lead the model to partially rely on non-toxicity-related imaging artifacts or biological noise. Therefore, the quantitative &#x201c;image-concentration&#x201d; relationship established in this study should be interpreted as a strong statistical association captured under highly controlled experimental conditions. While this association provides a robust computational foundation and scalable framework for image-based toxicity prediction, the underlying biological causal chain warrants further systematic validation in the future through approaches such as intervention experiments (e.g., co-imaging with oxidative stress probes), multimodal data integration (e.g., combining fluorescence labeling with transcriptomics), and causal inference modeling.</p>
</sec>
</sec>
<sec sec-type="conclusion" id="s5">
<label>5</label>
<title>Conclusion</title>
<p>This study successfully establishes a novel quantitative &#x201c;image-to-concentration&#x201d; prediction paradigm based on cellular grayscale statistical features and an SR-MLP hybrid model. The approach enables high-accuracy, low-cost quantification of environmental pollutants using only conventional optical microscopy images, while demonstrating the broad applicability of high-grayscale features as cross-cellular damage markers. In advancing environmental toxicology, this work contributes methodologically by introducing a data-driven framework that transforms subjective morphological observations into objective concentration predictions, thereby enhancing the standardization and throughput of toxicity assessment. Furthermore, through interpretable analysis, it reveals nonlinear relationships between high-grayscale features and pollutant concentrations, opening new pathways for linking morphological changes to toxic mechanisms such as apoptosis and oxidative stress. Future research should expand the range of pollutants and toxicity endpoints to build a comprehensive &#x201c;image-feature-mechanism&#x201d; database. Developing dynamic monitoring models based on live-cell imaging will advance the method from static detection to real-time tracking and early warning. Additionally, efforts should focus on clarifying the biological significance of image features and establishing cross-platform standardization protocols to promote wider adoption in environmental monitoring, toxicity screening, and risk assessment.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The dataset for this study and the analysis code supporting the findings are located in the following Google Drive folder: <ext-link ext-link-type="uri" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="https://drive.google.com/drive/folders/1H9F113bZ4DlOXx1_jkmN_BTLeoY1BktX?usp=sharing">https://drive.google.com/drive/folders/1H9F113bZ4DlOXx1_jkmN_BTLeoY1BktX?usp=sharing</ext-link>.</p>
</sec>
<sec sec-type="author-contributions" id="s7">
<title>Author contributions</title>
<p>LZ: Conceptualization, Formal Analysis, Data curation, Investigation, Writing &#x2013; original draft. AL: Investigation, Writing &#x2013; original draft, Methodology, Validation. YZ: Investigation, Data curation, Writing &#x2013; original draft. BJ: Data curation, Formal Analysis, Software, Writing &#x2013; original draft. CL: Funding acquisition, Project administration, Writing &#x2013; review and editing. XX: Funding acquisition, Project administration, Writing &#x2013; review and editing, Conceptualization, Supervision. JJ: Conceptualization, Funding acquisition, Writing &#x2013; review and editing, Formal Analysis.</p>
</sec>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s10">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="s12">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fenvs.2026.1729913/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fenvs.2026.1729913/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Supplementaryfile1.docx" id="SM1" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aguinis</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Vassar</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wayant</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>On reporting and interpreting statistical significance and p values in medical research</article-title>. <source>BMJ Evid-Based Med.</source> <volume>26</volume> (<issue>2</issue>), <fpage>39</fpage>&#x2013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.1136/bmjebm-2019-111264</pub-id>
<pub-id pub-id-type="pmid">31732498</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alkhouly</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Mohammed</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hefny</surname>
<given-names>H. A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Improving the performance of deep neural networks using two proposed activation functions</article-title>. <source>IEEE Access</source> <volume>9</volume>, <fpage>82249</fpage>&#x2013;<lpage>82271</lpage>. <pub-id pub-id-type="doi">10.1109/access.2021.3085855</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Atabansi</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Nie</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A survey of transformer applications for histopathological image analysis: new developments and future directions</article-title>. <source>Biomed. Eng. Online</source> <volume>22</volume> (<issue>1</issue>), <fpage>96</fpage>. <pub-id pub-id-type="doi">10.1186/s12938-023-01157-0</pub-id>
<pub-id pub-id-type="pmid">37749595</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Recent advances in morphological cell image analysis</article-title>. <source>Comput. Math. Methods Med.</source> <volume>2012</volume> (<issue>1</issue>), <fpage>101536</fpage>. <pub-id pub-id-type="doi">10.1155/2012/101536</pub-id>
<pub-id pub-id-type="pmid">22272215</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chicco</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Warrens</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Jurman</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>The coefficient of determination R-squared is more informative than SMAPE, MAE, MAPE, MSE and RMSE in regression analysis evaluation</article-title>. <source>PeerJ Comput. Sci.</source> <volume>7</volume>, <fpage>e623</fpage>. <pub-id pub-id-type="doi">10.7717/peerj-cs.623</pub-id>
<pub-id pub-id-type="pmid">34307865</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chukhlovin</surname>
<given-names>A. B.</given-names>
</name>
<name>
<surname>Tokalov</surname>
<given-names>S. V.</given-names>
</name>
<name>
<surname>Yagunov</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Westendorf</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Reincke</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Karbe</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>
<italic>In vitro</italic> suppression of thymocyte apoptosis by metal-rich complex environmental mixtures: potential role of zinc and cadmium excess</article-title>. <source>Sci. Total Environ.</source> <volume>281</volume> (<issue>1-3</issue>), <fpage>153</fpage>&#x2013;<lpage>163</lpage>. <pub-id pub-id-type="doi">10.1016/s0048-9697(01)00843-9</pub-id>
<pub-id pub-id-type="pmid">11778948</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ekanayake</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Meddage</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Rathnayake</surname>
<given-names>U.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A novel approach to explain the black-box nature of machine learning in compressive strength predictions of concrete using shapley additive explanations (SHAP)</article-title>. <source>Case Stud. Constr. Mat.</source> <volume>16</volume>, <fpage>e01059</fpage>. <pub-id pub-id-type="doi">10.1016/j.cscm.2022.e01059</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname>
<given-names>D. D.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Q. H.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Analysis of S-Ovalbumin content of different varieties of eggs during storage and its nondestructive testing model by visible-near infrared spectroscopy</article-title>. <source>Chin. J. Anal. Chem.</source> <volume>48</volume> (<issue>2</issue>), <fpage>289</fpage>&#x2013;<lpage>297</lpage>.</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hiers</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Khajotia</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Merritt</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Esteban Florez</surname>
<given-names>F. L.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Optimization of an ultra-bright real-time high-throughput renilla luciferase assay for antibacterial assessment of Streptococcus mutans biofilms</article-title>. <source>Dent. Mater</source> <volume>40</volume> (<issue>9</issue>), <fpage>1313</fpage>&#x2013;<lpage>1321</lpage>. <pub-id pub-id-type="doi">10.1016/j.dental.2024.06.012</pub-id>
<pub-id pub-id-type="pmid">38876827</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>James</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Witten</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2023</year>). <source>Linear regression [M]. An introduction to statistical learning: with applications in python</source>. <publisher-name>Springer</publisher-name>, <fpage>69</fpage>&#x2013;<lpage>134</lpage>.</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kamiloglu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sari</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Ozdal</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Capanoglu</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Guidelines for cell viability assays</article-title>. <source>Food Front.</source> <volume>1</volume> (<issue>3</issue>), <fpage>332</fpage>&#x2013;<lpage>349</lpage>. <pub-id pub-id-type="doi">10.1002/fft2.44</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kerr</surname>
<given-names>J. F.</given-names>
</name>
<name>
<surname>Wyllie</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Currie</surname>
<given-names>A. R.</given-names>
</name>
</person-group> (<year>1972</year>). <article-title>Apoptosis: a basic biological phenomenon with wide-ranging implications in tissue kinetics</article-title>. <source>Br. J. Cancer</source> <volume>26</volume> (<issue>4</issue>), <fpage>239</fpage>&#x2013;<lpage>257</lpage>. <pub-id pub-id-type="doi">10.1038/bjc.1972.33</pub-id>
<pub-id pub-id-type="pmid">4561027</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>K&#x131;l&#x131;&#xe7;arslan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Adem</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>&#xc7;elik</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>An overview of the activation functions used in deep learning algorithms</article-title>. <source>J. New Results Sci.</source> <volume>10</volume> (<issue>3</issue>), <fpage>75</fpage>&#x2013;<lpage>88</lpage>. <pub-id pub-id-type="doi">10.54187/jnrs.1011739</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kondo</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ratcliffe</surname>
<given-names>C. D.</given-names>
</name>
<name>
<surname>Hooper</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ellis</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>MacRae</surname>
<given-names>J. I.</given-names>
</name>
<name>
<surname>Hennequart</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Single-cell resolved imaging reveals intra-tumor heterogeneity in glycolysis, transitions between metabolic states, and their regulatory mechanisms</article-title>. <source>Cell Rep.</source> <volume>34</volume> (<issue>7</issue>), <fpage>108750</fpage>. <pub-id pub-id-type="doi">10.1016/j.celrep.2021.108750</pub-id>
<pub-id pub-id-type="pmid">33596424</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kumunda</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Adekunle</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Mamba</surname>
<given-names>B. B.</given-names>
</name>
<name>
<surname>Hlongwa</surname>
<given-names>N. W.</given-names>
</name>
<name>
<surname>Nkambule</surname>
<given-names>T. T. I.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Electrochemical detection of environmental pollutants based on graphene derivatives: a review</article-title>. <source>Front. Mater</source> <volume>7</volume>, <fpage>616787</fpage>. <pub-id pub-id-type="doi">10.3389/fmats.2020.616787</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jia</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Gray frequency-based methodology for assessing cell damage</article-title>. <source>ACS Omega</source> <volume>10</volume> (<issue>14</issue>), <fpage>14084</fpage>&#x2013;<lpage>14093</lpage>. <pub-id pub-id-type="doi">10.1021/acsomega.4c11226</pub-id>
<pub-id pub-id-type="pmid">40256511</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Q. B.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>Y. Q.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Application of combined model of stepwise regression analysis and artificial neural network in data calibration of miniature air quality detector</article-title>. <source>Sci. Rep.</source> <volume>11</volume> (<issue>1</issue>), <fpage>3247</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-021-82871-4</pub-id>
<pub-id pub-id-type="pmid">33547414</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A combined model for multivariate time series forecasting based on MLP-Feedforward attention-LSTM</article-title>. <source>IEEE Access</source> <volume>10</volume>, <fpage>88644</fpage>&#x2013;<lpage>88654</lpage>. <pub-id pub-id-type="doi">10.1109/access.2022.3192430</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Meher</surname>
<given-names>A. K.</given-names>
</name>
<name>
<surname>Zarouri</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Environmental applications of mass spectrometry for emerging contaminants</article-title>. <source>Molecules</source> <volume>30</volume> (<issue>2</issue>), <fpage>364</fpage>. <pub-id pub-id-type="doi">10.3390/molecules30020364</pub-id>
<pub-id pub-id-type="pmid">39860232</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muhammad</surname>
<given-names>A. L. I. P.</given-names>
</name>
<name>
<surname>Faraj</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Data normalization and standardization: a technical report</article-title>.</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Northoff</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Tumati</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Average is good, extremes are bad &#x2013; non-linear inverted U-shaped relationship between neural mechanisms and functionality of mental features</article-title>. <source>Neurosci. Biobehav Rev.</source> <volume>104</volume>, <fpage>11</fpage>&#x2013;<lpage>25</lpage>. <pub-id pub-id-type="doi">10.1016/j.neubiorev.2019.06.030</pub-id>
<pub-id pub-id-type="pmid">31251964</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pereira</surname>
<given-names>S. P.</given-names>
</name>
<name>
<surname>Santos</surname>
<given-names>S. M. A.</given-names>
</name>
<name>
<surname>Fernandes</surname>
<given-names>M. A. S.</given-names>
</name>
<name>
<surname>Deus</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Martins</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Pedroso de Lima</surname>
<given-names>M. C.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Improving pollutants environmental risk assessment using a multi model toxicity determination with <italic>in vitro,</italic>, bacterial, animal and plant model systems: the case of the herbicide alachlor</article-title>. <source>Environ. Pollut.</source> <volume>286</volume>, <fpage>117239</fpage>. <pub-id pub-id-type="doi">10.1016/j.envpol.2021.117239</pub-id>
<pub-id pub-id-type="pmid">33990048</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sadrara</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Khorrami</surname>
<given-names>M. K.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Principal component analysis-multivariate adaptive regression splines (PCA-MARS) and back propagation-artificial neural network (BP-ANN) methods for predicting the efficiency of oxidative desulfurization systems using ATR-FTIR spectroscopy</article-title>. <source>Spectrochim. Acta A</source>, <fpage>300</fpage>. <pub-id pub-id-type="doi">10.1016/j.saa.2023.122944</pub-id>
<pub-id pub-id-type="pmid">37269660</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salehin</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>D.-K.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A review on dropout regularization approaches for deep neural networks within the scholarly domain</article-title>. <source>Electronics</source> <volume>12</volume> (<issue>14</issue>), <fpage>3106</fpage>. <pub-id pub-id-type="doi">10.3390/electronics12143106</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sheller-Miller</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Radnaa</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Arita</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Getahun</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Jones</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Peltier</surname>
<given-names>M. R.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Environmental pollutant induced cellular injury is reflected in exosomes from placental explants</article-title>. <source>Placenta</source> <volume>89</volume>, <fpage>42</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1016/j.placenta.2019.10.008</pub-id>
<pub-id pub-id-type="pmid">31675489</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shobayo</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Saatchi</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Developments in deep learning artificial neural network techniques for medical image analysis and interpretation</article-title>. <source>Diagnostics</source> <volume>15</volume> (<issue>9</issue>), <fpage>1072</fpage>. <pub-id pub-id-type="doi">10.3390/diagnostics15091072</pub-id>
<pub-id pub-id-type="pmid">40361891</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stringer</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Michaelos</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pachitariu</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Cellpose: a generalist algorithm for cellular segmentation</article-title>. <source>Nat. Methods</source> <volume>18</volume> (<issue>1</issue>), <fpage>100</fpage>&#x2013;<lpage>106</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-020-01018-x</pub-id>
<pub-id pub-id-type="pmid">33318659</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Suzuki</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Hidaka</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Kumagai</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yamamoto</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Environmental pollutants and the immune response</article-title>. <source>Nat. Immunol.</source> <volume>21</volume> (<issue>12</issue>), <fpage>1486</fpage>&#x2013;<lpage>1495</lpage>. <pub-id pub-id-type="doi">10.1038/s41590-020-0802-6</pub-id>
<pub-id pub-id-type="pmid">33046888</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Swami</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Dave</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ranga</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>IQR-based approach for DDoS detection and mitigation in SDN</article-title>. <source>Def. Technol.</source> <volume>25</volume>, <fpage>76</fpage>&#x2013;<lpage>87</lpage>. <pub-id pub-id-type="doi">10.1016/j.dt.2022.10.006</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>W. Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X. F.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Prediction method of core dead stock column temperature based on PCA and ridge regression</article-title>. <source>ISIJ Int.</source> <volume>61</volume> (<issue>11</issue>), <fpage>2785</fpage>&#x2013;<lpage>2791</lpage>. <pub-id pub-id-type="doi">10.2355/isijinternational.isijint-2020-497</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>Y. Q.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>High precision error prediction algorithm based on ridge regression predictor for reversible data hiding</article-title>. <source>IEEE Signal Proc. Lett.</source> <volume>28</volume>, <fpage>1125</fpage>&#x2013;<lpage>1129</lpage>. <pub-id pub-id-type="doi">10.1109/lsp.2021.3080181</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A comprehensive survey of loss functions in machine learning</article-title>. <source>Ann. Data Sci.</source> <volume>9</volume> (<issue>2</issue>), <fpage>187</fpage>&#x2013;<lpage>212</lpage>. <pub-id pub-id-type="doi">10.1007/s40745-020-00253-5</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiao</surname>
<given-names>J.-Q.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>D.-X.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>F. L.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Inverted S-shaped model for nonlinear fatigue damage of rock</article-title>. <source>Int. J. Rock Mech. Min.</source> <volume>46</volume> (<issue>3</issue>), <fpage>643</fpage>&#x2013;<lpage>648</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijrmms.2008.11.002</pub-id>
</mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xie</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Moshayedi</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Noori Skandari</surname>
<given-names>M. H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A hybrid improved neural networks algorithm based on L2 and dropout regularization</article-title>. <source>Math. Probl. Eng.</source> <volume>2022</volume> (<issue>1</issue>), <fpage>8220453</fpage>. <pub-id pub-id-type="doi">10.1155/2022/8220453</pub-id>
</mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xin</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>The development of GADD45&#x3b1; luciferase reporter assays in human cells for assessing the genotoxicity of environmental pollutants</article-title>. <source>Toxicol. Mech. Methods</source> <volume>25</volume> (<issue>2</issue>), <fpage>136</fpage>&#x2013;<lpage>142</lpage>. <pub-id pub-id-type="doi">10.3109/15376516.2014.1003357</pub-id>
<pub-id pub-id-type="pmid">25560476</pub-id>
</mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Zha</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Exploring the nonlinear association between environmental regulation and carbon intensity in China: the mediating effect of green technology</article-title>. <source>Ecol. Indic.</source> <volume>114</volume>, <fpage>106309</fpage>. <pub-id pub-id-type="doi">10.1016/j.ecolind.2020.106309</pub-id>
</mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Ferroptosis induced by pollutants: an emerging mechanism in environmental toxicology</article-title>. <source>Environ. Sci. Technol.</source> <volume>58</volume> (<issue>5</issue>), <fpage>2166</fpage>&#x2013;<lpage>2184</lpage>. <pub-id pub-id-type="doi">10.1021/acs.est.3c06127</pub-id>
<pub-id pub-id-type="pmid">38275135</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Metamodel selection based on stepwise regression</article-title>. <source>Struct. Multidiscip. Optim.</source> <volume>54</volume> (<issue>3</issue>), <fpage>641</fpage>&#x2013;<lpage>657</lpage>. <pub-id pub-id-type="doi">10.1007/s00158-016-1442-1</pub-id>
</mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Guan</surname>
<given-names>X. R.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>sEMG-Based lower limb motion prediction using CNN-LSTM with improved PCA optimization algorithm</article-title>. <source>J. Bionic Eng.</source> <volume>20</volume> (<issue>2</issue>), <fpage>612</fpage>&#x2013;<lpage>627</lpage>. <pub-id pub-id-type="doi">10.1007/s42235-022-00280-3</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1864850/overview">Rui Zhang</ext-link>, University of Jinan, China</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1937420/overview">Hongmei Deng</ext-link>, Guangzhou University, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1695951/overview">Muhammad Zafar Irshad Khan</ext-link>, Zhejiang University, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3277635/overview">Vinod Chandra S. S.</ext-link>, University of Kerala, India</p>
</fn>
</fn-group>
</back>
</article>