<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2023.1101357</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Rapid discrimination of <italic>Shigella</italic> spp. and <italic>Escherichia coli via</italic> label-free surface enhanced Raman spectroscopy coupled with machine learning algorithms</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Wei</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<xref rid="fn0003" ref-type="author-notes"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2195925/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tang</surname>
<given-names>Jia-Wei</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<xref rid="fn0003" ref-type="author-notes"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2209949/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mou</surname>
<given-names>Jing-Yi</given-names>
</name>
<xref rid="aff3" ref-type="aff"><sup>3</sup></xref>
<xref rid="fn0003" ref-type="author-notes"><sup>&#x2020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lyu</surname>
<given-names>Jing-Wen</given-names>
</name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2178816/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Di</surname>
<given-names>Yu-Wei</given-names>
</name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liao</surname>
<given-names>Ya-Long</given-names>
</name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2179233/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Luo</surname>
<given-names>Yan-Fei</given-names>
</name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Zheng-Kang</given-names>
</name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<xref rid="c001" ref-type="corresp"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2050049/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wu</surname>
<given-names>Xiang</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<xref rid="c002" ref-type="corresp"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1579254/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wang</surname>
<given-names>Liang</given-names>
</name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<xref rid="c003" ref-type="corresp"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/456094/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>School of Medical Informatics and Engineering, Xuzhou Medical University</institution>, <addr-line>Xuzhou, Jiangsu</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Laboratory Medicine, Guangdong Provincial People&#x2019;s Hospital, Guangdong Academy of Medical Sciences, Southern Medical University</institution>, <addr-line>Guangzhou, Guangdong</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>The First School of Clinical Medicine, Xuzhou Medical University</institution>, <addr-line>Xuzhou, Jiangsu</addr-line>, <country>China</country></aff>
<author-notes>
<fn id="fn0001" fn-type="edited-by"><p>Edited by: Shyam Sundar Paul, ICAR, India</p></fn>
<fn id="fn0002" fn-type="edited-by"><p>Reviewed by: Min Yue, Zhejiang University, China; Pawan Kumar Kanaujia, Mahayogi Gorakhnath University, India</p></fn>
<corresp id="c001">&#x002A;Correspondence: Zheng-Kang Li, <email>lizhengkang@gdph.org.cn</email></corresp>
<corresp id="c002">Xiang Wu, <email>wuxiang@xzhmu.edu.cn</email></corresp>
<corresp id="c003">Liang Wang, <email>wangliang@gdph.org.cn</email>;</corresp>
<fn id="fn0003" fn-type="equal"><p><sup>&#x2020;</sup>These authors have contributed equally to this work</p></fn>
<fn id="fn0004" fn-type="other"><p>This article was submitted to Systems Microbiology, a section of the journal Frontiers in Microbiology</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>08</day>
<month>03</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1101357</elocation-id>
<history>
<date date-type="received">
<day>17</day>
<month>11</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>02</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2023 Liu, Tang, Mou, Lyu, Di, Liao, Luo, Li, Wu and Wang.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Liu, Tang, Mou, Lyu, Di, Liao, Luo, Li, Wu and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p><italic>Shigella</italic> and enterotoxigenic <italic>Escherichia coli</italic> (ETEC) are major bacterial pathogens of diarrheal disease that is the second leading cause of childhood mortality globally. Currently, it is well known that <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> are very closely related with many common characteristics. Evolutionarily speaking, <italic>Shigella</italic> spp., are positioned within the phylogenetic tree of <italic>E</italic>. <italic>coli</italic>. Therefore, discrimination of <italic>Shigella</italic> spp., from <italic>E</italic>. <italic>coli</italic> is very difficult. Many methods have been developed with the aim of differentiating the two species, which include but not limited to biochemical tests, nucleic acids amplification, and mass spectrometry, etc. However, these methods suffer from high false positive rates and complicated operation procedures, which requires the development of novel methods for accurate and rapid identification of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>. As a low-cost and non-invasive method, surface enhanced Raman spectroscopy (SERS) is currently under intensive study for its diagnostic potential in bacterial pathogens, which is worthy of further investigation for its application in bacterial discrimination. In this study, we focused on clinically isolated <italic>E</italic>. <italic>coli</italic> strains and <italic>Shigella</italic> species (spp.), that is, <italic>S</italic>. <italic>dysenteriae</italic>, <italic>S</italic>. <italic>boydii</italic>, <italic>S</italic>. <italic>flexneri</italic>, and <italic>S</italic>. <italic>sonnei</italic>, based on which SERS spectra were generated and characteristic peaks for <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> were identified, revealing unique molecular components in the two bacterial groups. Further comparative analysis of machine learning algorithms showed that, the Convolutional Neural Network (CNN) achieved the best performance and robustness in bacterial discrimination capacity when compared with Random Forest (RF) and Support Vector Machine (SVM) algorithms. Taken together, this study confirmed that SERS paired with machine learning could achieve high accuracy in discriminating <italic>Shigella</italic> spp., from <italic>E</italic>. <italic>coli</italic>, which facilitated its application potential for diarrheal prevention and control in clinical settings.
<fig position="float" id="g006">
<caption>
<p>Graphical abstract</p>
</caption>
<graphic xlink:href="fmicb-14-1101357-g006.tif"/>
</fig></p>
</abstract>
<kwd-group>
<kwd>diarrheal disease</kwd>
<kwd><italic>Shigella</italic> spp.</kwd>
<kwd><italic>Escherichia coli</italic></kwd>
<kwd>machine learning</kwd>
<kwd>deep learning</kwd>
<kwd>Raman effect</kwd>
<kwd>SERS spectra</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="42"/>
<page-count count="11"/>
<word-count count="8038"/>
</counts>
</article-meta>
</front>
<body>
<sec id="sec1">
<title>Novelty statement</title>
<p>In this study, we achieved the rapid and accurate predication of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> with high accuracy by using surface enhanced Raman spectroscopy paired with machine learning algorithms, among which convolutional neural network showed the best performance. In addition, DeconvNet method was used for generating 2-dimensional unique barcodes for <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>, which facilitated the rapid recognition of the two species.</p>
</sec>
<sec id="sec2">
<title>Highlights</title>
<p>
<list list-type="simple">
<list-item>
<p><italic>-Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> SERS spectra had unique characteristic peaks.</p>
</list-item>
<list-item>
<p><italic>-Shigella</italic> spp., could be discriminated from <italic>E</italic>. <italic>coli</italic> with high accuracy <italic>via</italic> SERS.</p>
</list-item>
<list-item>
<p>-Deconvolution generated unique SERS barcodes for <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>.</p>
</list-item>
</list>
</p>
</sec>
<sec id="sec3" sec-type="intro">
<label>1.</label>
<title>Introduction</title>
<p><italic>Shigella</italic> spp., is very closely related with <italic>Escherichia coli</italic> in terms of phenotypes and genotypes, both of which are Gram-negative bacteria and belong to the <italic>Enterobacterales</italic> phylum (<xref ref-type="bibr" rid="ref24">Pizzato et al., 2022</xref>). Previously, genetic studies based on multi-locus enzyme electrophoresis (MLEE) at population level identified that <italic>Shigella</italic> spp., fell within <italic>E</italic>. <italic>coli</italic> (<xref ref-type="bibr" rid="ref25">Pupo et al., 2000</xref>), while pH-indicator-based triple sugar ion (TSI) test showed poor sensitivity and specificity in terms of discriminating <italic>E</italic>. <italic>coli</italic> and <italic>Shigella</italic> spp., from other bacterial species (<xref ref-type="bibr" rid="ref26">Rautureau et al., 2019</xref>). Other methods commonly used in clinical laboratory such as 16S rRNA gene sequencing and matrix-assisted laser desorption/ionization-time of flight mass spectrometry (MALDI-TOF MS) cannot differentiate <italic>Shigella</italic> spp., from <italic>E</italic>. <italic>coli</italic> (<xref ref-type="bibr" rid="ref9">Devanga Ragupathi et al., 2018</xref>; <xref ref-type="bibr" rid="ref32">van den Beld et al., 2022</xref>). Therefore, it is very difficult and time-consuming to separate <italic>Shigella</italic> spp., from <italic>E</italic>. <italic>coli</italic> in clinical laboratories, though the two groups of bacteria show differences in epidemiology and clinical infections (<xref ref-type="bibr" rid="ref9">Devanga Ragupathi et al., 2018</xref>), and <italic>Shigella</italic> spp., have been confirmed to be not clones of <italic>E</italic>. <italic>coli</italic> but sister species in the genus <italic>Escherichia</italic> (<xref ref-type="bibr" rid="ref42">Zuo et al., 2013</xref>).</p>
<p>From clinical perspective, <italic>Shigella</italic> spp., are responsible for life-threatening dysentery (also known as shigellosis) and the infection leads to high childhood morbidity and mortality globally (<xref ref-type="bibr" rid="ref36">Wang et al., 2019</xref>; <xref ref-type="bibr" rid="ref41">Zhu et al., 2020</xref>), while <italic>E</italic>. <italic>coli</italic> are normally commensals found in human gut microbiota (<xref ref-type="bibr" rid="ref26">Rautureau et al., 2019</xref>). However, among the many <italic>E</italic>. <italic>coli</italic> sub-strains, enteroinvasive <italic>E</italic>. <italic>coli</italic> (EIEC) behaves similarly as <italic>Shigella</italic> spp., by causing invasion and inflammatory destruction of the human colonic epithelium, which also leads to the development of shigellosis (<xref ref-type="bibr" rid="ref4">Belotserkovsky and Sansonetti, 2018</xref>). In fact, both EIEC and <italic>Shigella</italic> spp., evolved from commensal <italic>E</italic>. <italic>coli</italic> through loss and/or gain of functional genes and virulence genes (<xref ref-type="bibr" rid="ref4">Belotserkovsky and Sansonetti, 2018</xref>). Therefore, it is important to rapidly and accurately discriminate <italic>E</italic>. <italic>coli</italic> from <italic>Shigella</italic> spp., in order to facilitate the clinical diagnosis, prevention and control of <italic>Shigell</italic>a spp., and <italic>E</italic>. <italic>coli</italic> infections.</p>
<p>Since both <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> are able to grow on distinctive selective media, traditional biochemical tests and serotyping experiments are regularly used for their discrimination in clinical labs (<xref ref-type="bibr" rid="ref24">Pizzato et al., 2022</xref>). However, these methods suffer from multi-step complexity and reliance on commercially-available kits, which makes the differentiation procedure time-consuming, sophisticated, and expensive, calling for the development of novel techniques and methods in the field (<xref ref-type="bibr" rid="ref24">Pizzato et al., 2022</xref>). Recently, as a rapidly developed emerging technique, surface enhanced Raman spectrometry (SERS) has been extensively explored for its potential and promising application in bacterial pathogen detection and antibiotic resistance profiling (<xref ref-type="bibr" rid="ref31">Tang et al., 2021</xref>; <xref ref-type="bibr" rid="ref33">Wang et al., 2021</xref>; <xref ref-type="bibr" rid="ref17">Liu et al., 2022</xref>; <xref ref-type="bibr" rid="ref30">Tang et al., 2022</xref>). There are currently multiple studies using SERS technique combined with machine learning models to detect different types of bacterial pathogens, which have been summarized in recent reviews and will not be described in details here (<xref ref-type="bibr" rid="ref18">Liu et al., 2017</xref>; <xref ref-type="bibr" rid="ref14">Lee et al., 2021</xref>; <xref ref-type="bibr" rid="ref33">Wang et al., 2021</xref>; <xref ref-type="bibr" rid="ref27">Rebrosova et al., 2022</xref>). Therefore, SERS technique holds promising future for rapid and non-invasive diagnostics of bacterial pathogens in clinical settings. In addition, <xref ref-type="bibr" rid="ref6">Chen et al. (2022)</xref> developed nanoporous Ag nanorods as SERS substrates to sensitively detect adenine, spike glycoprotein, and different types of bacteria, while <xref ref-type="bibr" rid="ref16">Liu et al. (2022)</xref> constructed novel Ag nanoparticles that are able to generate high antibacterial activities.</p>
<p>Although many studies have applied SERS technique in the rapid identification of bacterial pathogens, there are currently few studies focusing on using the combination of SERS technique and machine learning models to discriminate <italic>Shigella</italic> spp., from <italic>E</italic>. <italic>coli</italic>. In this study, we collected SERS spectra for <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli via</italic> handheld Raman spectrometer, which were then analyzed <italic>via</italic> machine learning algorithms. According to the results, <italic>Shigella</italic> spp., could be rapidly and accurately discriminated from <italic>E</italic>. <italic>coli</italic> through the combination of SERS technique and machine learning algorithms, which provides a promising future for the application of SERS technique in diarrheal prevention and control in clinical settings.</p>
</sec>
<sec id="sec4">
<label>2.</label>
<title>Methods and materials</title>
<sec id="sec5">
<label>2.1.</label>
<title>Collection of bacterial strains</title>
<p>Ten <italic>E</italic>. <italic>coli</italic> strains and eight <italic>Shigella</italic> strains were used in this experiment. Two of the laboratory strains <italic>E</italic>. <italic>coli</italic> BL21 (DE3) and BW25113 was purchased from Tiangen Biotech Co. Ltd (Beijing, China), the remaining eight <italic>E</italic>. <italic>coli</italic> strains and eight <italic>Shigella</italic> spp., strains (<italic>S</italic>. <italic>dysenteriae</italic>: 2 strains, <italic>S</italic>. <italic>boydii</italic>: 2 strains, <italic>S</italic>. <italic>flexneri</italic>: 2 strains, and <italic>S</italic>. <italic>sonnei</italic>: 2 strains) were directly isolated from clinical samples and confirmed <italic>via</italic> both biochemical tests and mass spectrometry in Xuzhou Infectious Diseases Hospital affiliated to Xuzhou Medical University. All the strains were stored in liquid Luria Broth (LB) culture with 25% glycerol stock at &#x2212;80&#x00B0;C. During the study, all the strains were recovered from the &#x2212;80&#x00B0;C freezer by streaking on LB agar plate and incubating at 37&#x00B0;C overnight before experimental analysis.</p>
</sec>
<sec id="sec6">
<label>2.2.</label>
<title>Preparation of silver nanoparticles as surface enhanced Raman spectroscopy substrate</title>
<p>The preparation procedures for silver nanoparticles (AgNPs) have been well documents in previous studies (<xref ref-type="bibr" rid="ref31">Tang et al., 2021</xref>; <xref ref-type="bibr" rid="ref17">Liu et al., 2022</xref>; <xref ref-type="bibr" rid="ref30">Tang et al., 2022</xref>; <xref ref-type="bibr" rid="ref34">Wang et al., 2022a,b</xref>). Therefore, we only briefly stated the preparation steps in terms of the key reactions. In particular, 33.72&#x2009;mg of silver nitrate (AgNO<sub>3</sub>) was added to a triangular flask with 200&#x2009;mL of deionized distilled water (ddH<sub>2</sub>O) with stirring and heating until boiling. 8&#x2009;mL of sodium citrate (Na<sub>3</sub>C<sub>6</sub>H<sub>5</sub>O<sub>7</sub>) was then added with stirring and heating at 650&#x2009;r/min for 40&#x2009;min. Stop heating and keep stirring until the solution cools down to room temperature, which was then filled up to 200&#x2009;mL with ddH<sub>2</sub>O. 1&#x2009;mL of the prepared solution was transferred to a clean Eppendorf (EP) tube for 7-min centrifugation at 7000&#x2009;r/min. Discard the supernatant and resuspend the pellet with 100&#x2009;&#x03BC;L of ddH<sub>2</sub>O, which was the AgNP substrate that were stored without light at room temperature for long-term use.</p>
</sec>
<sec id="sec7">
<label>2.3.</label>
<title>Surface-enhanced Raman spectroscopy</title>
<p>For each bacterial species (10 <italic>E</italic>. <italic>coli</italic> strains and eight <italic>Shigella</italic> spp., strains) used in this study, after recovering <italic>via</italic> cultivating on LB agar plate overnight, a single colony was selected and inoculated into 15&#x2009;&#x03BC;L phosphate buffer saline (PBS) and well mixed <italic>via</italic> vortexing, which was then well mixed with 15&#x2009;&#x03BC;L negatively-charged AgNPs substrate solution. The well-mixed suspension was dropped onto the surface of silicon wafer and to form a circular spot of suitable size, which was dried naturally before SERS spectroscopy. The hand-held Raman spectrometer Anton Paar&#x2122; Cora100 (Anton Paar Shanghai Trading Co., Ltd., China.) was used for sample analysis and Raman spectral detection by using the following settings of parameters: (1) excitation wavelength: 784.56&#x2009;nm; (2) excitation power: 25&#x2009;mW; (3) spectral resolution: 1&#x2009;nm; (4) spectral wave number resolution: 10&#x2009;cm<sup>&#x2212;1</sup>; (5) detection spectral range: 400&#x2013;2,300&#x2009;cm<sup>&#x2212;1</sup>. All the SERS spectra were calibrated using the Raman peak at 520&#x2009;cm<sup>&#x2212;1</sup> as the reference peak and the dark current was deducted during integration time. For each bacterial species, a total of 200 spectra were collected by randomly selecting detecting sites in each of the dried sample spots. Therefore, a total of 800 spectra for <italic>Shigella</italic> spp., and 800 SERS spectra of <italic>E</italic>. <italic>coli</italic> were used for further analysis in this study,</p>
</sec>
<sec id="sec8">
<label>2.4.</label>
<title>Average surface enhanced Raman spectroscopy spectra and characteristic peaks</title>
<sec id="sec9">
<label>2.4.1.</label>
<title>Calculational analysis of average surface enhanced Raman spectroscopy spectra</title>
<p>By calculating the average intensities under each Raman shift for all the SERS spectra that were generated from <italic>E</italic>. <italic>coli</italic> (<italic>N</italic>&#x2009;=&#x2009;800) and <italic>Shigella</italic> spp (<italic>N</italic>&#x2009;=&#x2009;800), respectively, average Raman spectra were then obtained. 20% of standard deviation (SD) was also calculated and visualized as shaded region around the average SERS spectra for <italic>E</italic>. <italic>coli</italic> and <italic>Shigella</italic> spp. Average Raman spectra with standard error bands were plotted using Origin software (OriginLab, United States). The width of the error bands showed the reproducibility of Raman spectra. The wider the error band, the worse the reproducibility.</p>
</sec>
<sec id="sec10">
<label>2.4.2.</label>
<title>Computational identification of characteristic peaks</title>
<p>Characteristic peaks for the SERS spectra of <italic>E</italic>. <italic>coli</italic> and <italic>Shigella</italic> spp., were conducted <italic>via</italic> the software LabSpec6 (HORIBA Scientific, Japan). In specificity, <italic>GaussLoren</italic> function was used for the analysis with parameters set to Level&#x2009;=&#x2009;13%, Size&#x2009;=&#x2009;20, and Iteration&#x2009;=&#x2009;5, while other parameters were in default. All the identified characteristic peaks were marked with black arrows and labelled with corresponding Raman shifts along the average SERS spectra. Biological meanings of all the characteristic peaks were sourced from literature.</p>
</sec>
</sec>
<sec id="sec11">
<label>2.5.</label>
<title>Surface enhanced Raman spectroscopy spectral deconvolution and barcoding</title>
<p>In order to explore the characteristic features of the average Raman spectra for <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>, we performed deconvolution operations on each average Raman spectrum. In specificity, baseline correction was first performed on the average spectrum with the parameter set to type&#x2009;=&#x2009;Polynom and degree&#x2009;=&#x2009;4, which aims to highlight the representative characteristic peaks so that finer differences can be found by means of deconvolution. The function <italic>fit peaks</italic> pro in Origin (version 2019b 32bit) was applied for peak fitting, which used <italic>Voigt</italic> function maximum value and half width to obtain the Doppler and Lorentz lines to solve the deconvolution sub-bands of spectra. Before fitting, appropriate values for the <italic>Gaussian width</italic> and <italic>Lorentzian width</italic> parameters were selected to avoid fitting failures. In addition, barcodes are an efficient mean for electronic record-keeping, which enables rapid identification <italic>via</italic> software (<xref ref-type="bibr" rid="ref21">Pezzotti et al., 2021</xref>). Therefore, in this study, in order to improve the accessibility of spectral data, we designed barcodes for the deconvoluted Raman spectra in terms of different variants and their subtypes. The barcodes were generated through assigning each band a line with width equal to 1/30 of the width of the sub-band and a distance from the successive line proportional to the band area, which provided necessary flexibility and rapidity for Raman spectroscopy methods.</p>
</sec>
<sec id="sec12">
<label>2.6.</label>
<title>Unsupervised clustering analysis of surface enhanced Raman spectroscopy spectra</title>
<p>In order to investigate the inherent differences among SERS spectra of <italic>E</italic>. <italic>coli</italic> and <italic>Shigella</italic> spp., T-Distributed Stochastic Neighbor Embedding (T-SNE) algorithm was used for dimensionality reduction and clustering visualization of bacterial spectral data. Set n_components&#x2009;=&#x2009;2 and learning_rate&#x2009;=&#x2009;10 for the TSNE function in the <italic>scikit-learn</italic> package (version 0.21.3) to analyze the spectral difference between <italic>Shigella spp</italic>., and <italic>E</italic>. <italic>coli</italic> spectra. For data visualization, we chose the first two feature dimensions after TSNE dimensionality reduction as the coordinate axises, and displayed the categories of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> in the form of scatter plots.</p>
</sec>
<sec id="sec13">
<label>2.7.</label>
<title>Supervised machine learning analysis</title>
<sec id="sec14">
<label>2.7.1.</label>
<title>Supervised clustering analysis of surface enhanced Raman spectroscopy spectra</title>
<p>Orthogonal partial least squares discriminant analysis (OPLS-DA) algorithm was used in this study to visually distinguish <italic>E</italic>. <italic>coli</italic> and <italic>Shigella</italic> spp., based on their SERS spectra. In specificity, all SERS data were imported into the software SIMCA (Umetrics, Sweden). Select OPLS-DA as the model type, and then click <italic>Autofit</italic> button to fit the model. The software automatically calculated R2X, R2Y and Q2 to measure model performance. Select the <italic>Scatter</italic> option under the <italic>Scores</italic> function to visualize the classification results of the model in the form of scatter plots. Different spectra data were represented by different colors, and dashed circles and labels were used to indicate the corresponding data categories.</p>
</sec>
<sec id="sec15">
<label>2.7.2.</label>
<title>Classical machine learning analysis of surface enhanced Raman spectroscopy spectra</title>
<p>To identify the spectral differences between <italic>E</italic>. <italic>coli</italic> and <italic>Shigella</italic> spp., we applied two classical machine learning (ML) algorithms, Random Forest (RF) and Support Vector Machine (SVM), and deep learning algorithms Convolutional Neural Network (CNN) for SERS spectral analysis. Before performing ML analysis, we used the <italic>train_test_split</italic> function to split all SERS spectral data into training, validation and test sets in a ratio of 6:2:2. The test set data was only used to test the prediction performance of the model on unfamiliar data sets. The two machine learning algorithms were implemented by calling the <italic>RandomForestClassifier</italic> and <italic>SVC</italic> function models in the <italic>scikit-learn</italic> package (version 0.21.3). During training the two machine learning models, we used the <italic>GridSearch</italic> function to train and tuning the model parameters in order to achieve the best fitting effect of ML modes (<xref rid="SM1" ref-type="supplementary-material">Supplementary Table S1</xref>).</p>
</sec>
<sec id="sec16">
<label>2.7.3.</label>
<title>Convolutional neural network analysis of surface enhanced Raman spectroscopy spectra</title>
<p>Due to the high dimension of SERS spectral data and the subtle spectral differences between bacterial species, ML algorithms frequently failed to predict spectra correctly. Since deep learning algorithms have feature extraction performance and does not require excessive parameter optimization and feature engineering, raw SERS spectral data could be directly imported into models to obtain better discrimination and prediction results. CNN mainly consists of convolutional Layer, MaxPooling Layer and Fully Connected Layer. The convolutional layers were used to learn the intrinsic feature representation of the spectral data, and a nonlinear activation function <italic>ReLU</italic> was applied to each convolutional layer to enable the network to detect nonlinear features. In this study, the size of the convolution kernel was set to 3&#x002A;1, and the size of the filters was set to 8, 8 and 16, respectively. The MaxPooling layer can compress the extracted feature information, so that the entire network can extract a wider range of feature information. In this study, a MaxPooling layer was connected after each two convolutional layers, and the pool_size was set to 3. After multiple convolutional and pooling layers, the global information was input into the Fully Connected layer for classification using the <italic>Softmax</italic> function.</p>
</sec>
</sec>
<sec id="sec17">
<label>2.8.</label>
<title>Comparative evaluation of machine learning algorithms</title>
<p>To evaluate the capacities of machine learning algorithms on the differentiation of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>, quantitative metrics were used to measure the performance of these algorithms. Accuracy (ACC), as the most basic evaluation index in spectral signal identification, is often used to describe the correct prediction of the overall result. In this study, to avoid the data imbalance issue caused by the random splitting of data, we used <italic>Precision</italic> (P) and <italic>Recall</italic> (R) to obtain objective model evaluations. <italic>Precision</italic> represents the probability of a sample that is actually positive among all samples that are predicted to be positive, while <italic>Recall</italic> represents the probability of a sample that is predicted to be positive among all samples that are actually positive. During the data analysis process, the <italic>average</italic> parameters of Precision and Recall were set to <italic>Micro</italic> and <italic>Macro</italic>, respectively. As <italic>Precision</italic> and <italic>Recall</italic> are mutually influencing indicators, <italic>F1-Score</italic> as the harmonic average of the two indicators, were introduced to provide a comprehensive evaluation, and the <italic>average</italic> parameter was weighted. In addition, in order to avoid the occurrence of overfitting of the model during training, we used the five-fold cross-validation method with cv.&#x2009;=&#x2009;5 in the <italic>cross_val_score</italic> function, which divided the training set data into 5 equal-sized subsets and tested the models consecutively. That is, during the training process, a set of data subsets were selected as the validation set, and the remaining 4 sets were used as the training set, and 5 models were trained to correspond to 5 accuracy rates, respectively, while the average accuracy rate was calculated as the final training effect. In addition, ROC curves and confusion matrix were also drawn to measure the performance of the models. In specificity, we evaluated machine learning models by using <italic>roc_curve</italic> to draw the ROC curve. In addition, the area under the curve (AUC) value calculated by the <italic>roc_auc_score</italic> function was also used as a metric to eliminate the imbalance of sample categories. In order to more intuitively observe the performance of the model on the test set data, we visualized the prediction results of the optimal model CNN <italic>via</italic> confusion matrix <italic>via confusi_matrix</italic> function in the form of a 2&#x002A;2 matrix.</p>
</sec>
<sec id="sec18">
<label>2.9.</label>
<title>Interpretive analysis of surface enhanced Raman spectroscopy spectra</title>
<p>It was worth noting that, in this study, we also used the Grad-CAM algorithm to explain how the deep learning model extracted the SERS spectral features and the decision-making process of the convolutional layer on the SERS spectral signal. In the specific calculation process, the <italic>tf</italic>.<italic>GradientTape</italic> method was conducted to calculate the gradient vector of the last convolutional layer, and the channel mean was calculated using the <italic>tf</italic>.<italic>reduce_mean</italic> method. The Grad-CAM of the target bacterial species was generated according to the gradient vector and the channel mean. In addition to obtaining the weight distribution of the model for the spectral data, we also investigated how the model classified the spectral data of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coil</italic>. Therefore, we input the abstract features extracted from the last layer of the convolution layer (num_layer&#x2009;=&#x2009;5) into TSNE for classification, which further proved the feasibility of the CNN model. During the classification, the TSNE parameters were set to n_components&#x2009;=&#x2009;2, init&#x2009;=&#x2009;&#x2018;pca&#x2019;, and random_state&#x2009;=&#x2009;0. A brief flow chat was given to show the logic of the SERS spectral collection and computational analysis behind the discrimination of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> (<xref rid="fig1" ref-type="fig">Figure 1</xref>).</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Schematic illustration of bacterial spectral collection and computational analysis of SERS spectra of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>.</p>
</caption>
<graphic xlink:href="fmicb-14-1101357-g001.tif"/>
</fig>
</sec>
</sec>
<sec id="sec19" sec-type="results">
<label>3.</label>
<title>Results</title>
<sec id="sec20">
<label>3.1.</label>
<title>Average and deconvoluted surface enhanced Raman spectroscopy spectra</title>
<p>Both bacterial morphological characteristics and physiological states have different molecular basis, while SERS spectra can reflect these molecular differences and are able to transform these chemical and structural information into SERS signal intensities at different Raman shifts (<xref ref-type="bibr" rid="ref20">Lu et al., 2020</xref>). As for bacterial cells belonging to the same species, they are similar to each other in terms of morphology and physiology, while those from different species are quite dissimilar (<xref ref-type="bibr" rid="ref20">Lu et al., 2020</xref>). Therefore, different bacterial species could be discriminated based on the analysis of their SERS spectra. In this study, we collected SERS spectra for <italic>Shigella</italic> spp., and <italic>Escherichia coli</italic>, respectively. Average Raman spectra with shaded standard error (SE) bands for the two species were calculated to quantitatively display the general trend of SERS spectral repeats and also reflect the data variance among the spectra (<xref ref-type="bibr" rid="ref17">Liu et al., 2022</xref>), according to which, SERS spectra were well repeated for <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>, and the reproducibility of SERS spectra varied in acceptable ranges (<xref rid="fig2" ref-type="fig">Figures 2A</xref>,<xref rid="fig2" ref-type="fig">B</xref>). In this study, deconvoluted SERS spectral band components that were directly linked to molecular structures and chemical components were also generated, which aimed to evaluate SERS spectral characteristics efficiently (<xref ref-type="bibr" rid="ref22">Pezzotti et al., 2022</xref>). Based on the deconvoluted SERS spectra, two-dimensional (2D) Raman barcoding bands were then generated for <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> at the upper right corners of <xref rid="fig2" ref-type="fig">Figures 2C</xref>,<xref rid="fig2" ref-type="fig">D</xref>. In particular, the deconvolution spectra consisted of a series of Vogit sub-bands, each representing a spectral characteristic peak. It could be seen that the method fts the important characteristic peaks of Raman spectra well and could eliminate the interference of other artifactual peaks. In addition, <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coil</italic> Raman barcodes also contained subtle details of the structure of internal metabolites, amplifying the differences among the two bacterial genera. Taken together, the Raman barcodes generated through deconvolution analysis greatly supported the electronic storage of SERS spectra, converted molecular characteristics into information, and improved the recognition of bacterial species.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Average and deconvoluted SERS spectra of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>. <bold>(A,B)</bold> Average SERS spectra of <italic>Escherichia coli</italic> (N&#x2009;=&#x2009;800) and <italic>Shigella</italic> spp (<italic>N</italic> =&#x2009;800). <bold>(C,D)</bold> Deconvoluted SERS spectra of <italic>Escherichia coli</italic> and <italic>Shigella</italic> spp., <italic>X</italic>-axis represents Raman shifts in the range of 530&#x2013;1800&#x2009;cm<sup>&#x2212;1</sup>, while <italic>Y</italic>-axis represents the relative Raman intensity. a.u. means artificial unit and has no real meaning. Two-dimensional barcodes at the upper-right corners were generated <italic>via</italic> deconvolution, which were unique for <italic>Escherichia coli</italic> and <italic>Shigella</italic> spp., respectively.</p>
</caption>
<graphic xlink:href="fmicb-14-1101357-g002.tif"/>
</fig>
</sec>
<sec id="sec21">
<label>3.2.</label>
<title>Characteristic peaks of surface enhanced Raman spectroscopy spectra</title>
<p>As previously mentioned, due to the compositional and physiological differences between bacterial species, SERS spectra contains unique characteristic peaks corresponding to different molecular structures and components (<xref ref-type="bibr" rid="ref31">Tang et al., 2021</xref>). In this study, under the signal measurement of SERS spectra at the wavelength of 785&#x2009;nm, characteristic peaks for <italic>E</italic>. <italic>coli</italic> and <italic>Shigella</italic> spp., were computationally identified, respectively. All the characteristic peaks were annotated with a black arrow in <xref rid="fig2" ref-type="fig">Figure 2</xref>, while band assignments of characteristic peaks corresponding to potential molecular structure and components were given in details in <xref rid="tab1" ref-type="table">Table 1</xref>. The unique characteristic peaks to both bacteria revealed apparent differences between <italic>E</italic>. <italic>coli</italic> and <italic>shigella</italic> spp. We can see that there are many different peaks between the two bacterial genera. In specificity, as for <italic>E</italic>. <italic>coli</italic>, the unique characteristic peaks identified in its average SERS spectrum include C=O, C-N and ring deformation at 794&#x2009;cm<sup>&#x2212;1</sup> (<xref ref-type="bibr" rid="ref12">Kubryk et al., 2016</xref>), Ribose vibration, one of the distinct RNA modes at 910&#x2009;cm<sup>&#x2212;1</sup> (<xref ref-type="bibr" rid="ref28">Szekeres and Kneipp, 2019</xref>), v(C-C) at 1034&#x2009;cm<sup>&#x2212;1</sup> (<xref ref-type="bibr" rid="ref2">Athamneh et al., 2014</xref>), Amine III of proteins at 1248&#x2009;cm<sup>&#x2212;1</sup> (<xref ref-type="bibr" rid="ref3">Bashir et al., 2021</xref>), (C-N) stretch at 1320&#x2009;cm<sup>&#x2212;1</sup> (<xref ref-type="bibr" rid="ref39">Zeiri et al., 2004</xref>), and Stretch C=C in the quinoid ring at 1414&#x2009;cm<sup>&#x2212;1</sup> (<xref ref-type="bibr" rid="ref13">Laska and Widlarz, 2005</xref>). On the other hand, for <italic>Shigella</italic> spp., their unique characteristic peaks include C-C chain stretch of cell wall lipids at 1096&#x2009;cm<sup>&#x2212;1</sup> (<xref ref-type="bibr" rid="ref40">Zheng et al., 2018</xref>), tryptophan at 1332&#x2009;cm<sup>&#x2212;1</sup> (<xref ref-type="bibr" rid="ref38">Xie et al., 2013</xref>), and Ring stretching (Adenine, guanine) at 1594&#x2009;cm<sup>&#x2212;1</sup> (<xref ref-type="bibr" rid="ref8">Demirel et al., 2009</xref>).</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Band assignments of characteristic peaks to potential metabolites in SERS spectra for <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top"><bold>Wavenumber (cm</bold><sup><bold>&#x2212;1</bold></sup><bold>)</bold></th>
<th align="left" valign="top"><bold>Band assignment</bold></th>
<th align="left" valign="top"><italic>Escherichia</italic><bold><italic>coli</italic></bold></th>
<th align="left" valign="top"><bold><italic>Shigella</italic> spp.</bold></th>
<th align="left" valign="top"><bold>References</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">656/658</td>
<td align="left" valign="top">COO-bending in tyrosine, guanine vibration</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref3">Bashir et al. (2021)</xref></td>
</tr>
<tr>
<td align="left" valign="top">730/732</td>
<td align="left" valign="top"><italic>v</italic>(glycosidic)</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref12">Kubryk et al. (2016)</xref></td>
</tr>
<tr>
<td align="left" valign="top">794</td>
<td align="left" valign="top">C=O, C-N and ring deformation</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref12">Kubryk et al. (2016)</xref></td>
</tr>
<tr>
<td align="left" valign="top">910</td>
<td align="left" valign="top">Ribose vibration, one of the distinct RNA modes</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref28">Szekeres and Kneipp (2019)</xref></td>
</tr>
<tr>
<td align="left" valign="top">956/960</td>
<td align="left" valign="top">&#x03B4;(C=C)</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref38">Xie et al. (2013)</xref></td>
</tr>
<tr>
<td align="left" valign="top">1,034</td>
<td align="left" valign="top"><italic>v</italic>(C-C)</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref2">Athamneh et al. (2014)</xref></td>
</tr>
<tr>
<td align="left" valign="top">1,096</td>
<td align="left" valign="top">C&#x2013;C chain stretch of cell wall lipids</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref40">Zheng et al. (2018)</xref></td>
</tr>
<tr>
<td align="left" valign="top">1,124</td>
<td align="left" valign="top">C-C stretching</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref19">Lu et al. (2011)</xref></td>
</tr>
<tr>
<td align="left" valign="top">1,248</td>
<td align="left" valign="top">Amide III (of collagen)</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref7">Cheng et al. (2005)</xref></td>
</tr>
<tr>
<td align="left" valign="top">1,320</td>
<td align="left" valign="top">(C&#x2013;N) stretch</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref39">Zeiri et al. (2004)</xref></td>
</tr>
<tr>
<td align="left" valign="top">1,332</td>
<td align="left" valign="top">Tryptophan</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref38">Xie et al. (2013)</xref></td>
</tr>
<tr>
<td align="left" valign="top">1,414</td>
<td align="left" valign="top">Stretch C=C in the quinoid ring</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref13">Laska and Widlarz (2005)</xref></td>
</tr>
<tr>
<td align="left" valign="top">1450/1452/1454</td>
<td align="left" valign="top">&#x03B4; (CH<sub>2</sub>) scissoring</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref38">Xie et al. (2013)</xref></td>
</tr>
<tr>
<td align="left" valign="top">1576/1584</td>
<td align="left" valign="top"><italic>v</italic>(C=C)</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref38">Xie et al. (2013)</xref></td>
</tr>
<tr>
<td align="left" valign="top">1,594</td>
<td align="left" valign="top">Ring stretching (Adenine, guanine)</td>
<td/>
<td/>
<td align="left" valign="top"><xref ref-type="bibr" rid="ref8">Demirel et al. (2009)</xref></td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec22">
<label>3.3.</label>
<title>Clustering analysis of <italic>Shigella</italic> spp., and <italic>Escherichia coli</italic> surface enhanced Raman spectroscopy spectra</title>
<p>Clustering analysis is able to find commonalities between data elements, therefore dividing SERS spectra into different parts (also known as clusters) so that spectra in the same part are similar to each other while spectra in different parts are dissimilar to each other, leading to the differentiation of bacterial species (<xref ref-type="bibr" rid="ref29">Talabis et al., 2015</xref>). In this study, we applied the two algorithms, TSNE and OPLS-DA, for the clustering analysis of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> SERS spectra. TSNE is considered as one of the best high-dimensionality data reduction method and clustering visualization tool, though it has obvious disadvantages of large memory consumption and long running time (<xref ref-type="bibr" rid="ref15">Linderman and Steinerberger, 2019</xref>; <xref ref-type="bibr" rid="ref23">Pezzotti et al., 2019</xref>). During the application of TSNE method in SERS spectra, the result showed that two bacterial genera could be well separated into two groups but the classification boundary is not clear due to the mixture of certain number of <italic>E</italic>. <italic>coli</italic> SERS spectra (<xref rid="fig3" ref-type="fig">Figure 3A</xref>). As for OPLS-DA, it is a multivariate statistical method for supervised data clustering, which provides insights into the divisions of data groups based on high-dimensional spectral measurements (<xref ref-type="bibr" rid="ref37">Worley and Powers, 2016</xref>). When using OPLS-DA method for analyzing the same SERS spectral dataset, it was found that <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> spectra were well clustered into two groups with smaller intra-genus variations and the boundary between the two genera was clear (<xref rid="fig3" ref-type="fig">Figure 3B</xref>). In addition, unlike TSNE, OPLS-DA gave a quantitative measurement of the clustering result, which showed that R2X (<italic>cum</italic>)&#x2009;=&#x2009;0.964, R2Y (<italic>cum</italic>)&#x2009;=&#x2009;0.806 and Q2 (<italic>cum</italic>)&#x2009;=&#x2009;0.799. The larger the three parameters are, the better the classification performance of the model is, and the difference between R2X and R2Y is generally no more than 0.3 (<xref ref-type="bibr" rid="ref1">Abdel-Ilah et al., 2017</xref>).</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Clustering analysis of SERS spectra of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> through T-SNE and OPLS-DA algorithms. <bold>(A)</bold> Scatterplot of SERS spectra <italic>via</italic> T-SNE algorithm. <bold>(B)</bold> Scatterplot of SERS spectra <italic>via</italic> OPLS-DA algorithm.</p>
</caption>
<graphic xlink:href="fmicb-14-1101357-g003.tif"/>
</fig>
</sec>
<sec id="sec23">
<label>3.4.</label>
<title>Prediction of <italic>Shigella</italic> spp., and <italic>Escherichia coli</italic> based on surface enhanced Raman spectroscopy spectra</title>
<p>Although clustering analysis could differentiate SERS spectra of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> into different groups, it is difficult to know the accuracy and robustness of the analysis. Therefore, supervised machine learning analysis was used for predicting the identity of a particular SERS spectra. In particular, supervised machine learning algorithms are able to learn the patterns in the input variable X and the construct mapping functions Y&#x2009;=&#x2009;f(X) in order to achieve the purpose of using unknown input data X to accurately predict its output Y (<xref ref-type="bibr" rid="ref31">Tang et al., 2021</xref>). In this study, we compared the predictive capacities of three representative machine learning algorithms, CNN, SVM, and RF. The results were shown in <xref rid="tab2" ref-type="table">Table 2</xref>, according to which, all the prediction parameters for the deep learning model CNN reached to values of 99.64%, indicating that CNN model worked the best in capturing the features of the SERS spectral signals and was able to predict <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> with no mistake. As for the two classic machine learning algorithms, it was found that both SVM and RF achieved very high accuracy and robustness, which was very close to the performance of CNN, confirming that SVM and RF were also suitable in predicting SERS spectra of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Comparison of the predictive abilities of three supervised machine learning algorithms in the analysis of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> SERS spectral data.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top"><bold>Algorithm</bold></th>
<th align="center" valign="top"><bold>ACC (%)</bold></th>
<th align="center" valign="top"><bold>Recall (%)</bold></th>
<th align="center" valign="top"><bold>Precision (%)</bold></th>
<th align="center" valign="top"><bold>F1 (%)</bold></th>
<th align="center" valign="top"><bold>5-Fold CV (%)</bold></th>
<th align="center" valign="top"><bold>AUC (%)</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top"><bold>CNN</bold></td>
<td align="center" valign="top">99.64</td>
<td align="center" valign="top">99.64</td>
<td align="center" valign="top">99.59</td>
<td align="center" valign="top">99.64</td>
<td align="center" valign="top">99.65</td>
<td align="center" valign="top">100</td>
</tr>
<tr>
<td align="left" valign="top"><bold>SVM</bold></td>
<td align="center" valign="top">98.95</td>
<td align="center" valign="top">99.31</td>
<td align="center" valign="top">99.31</td>
<td align="center" valign="top">99.31</td>
<td align="center" valign="top">99.21</td>
<td align="center" valign="top">98.97</td>
</tr>
<tr>
<td align="left" valign="top"><bold>RF</bold></td>
<td align="center" valign="top">96.49</td>
<td align="center" valign="top">96.49</td>
<td align="center" valign="top">96.11</td>
<td align="center" valign="top">96.48</td>
<td align="center" valign="top">97.10</td>
<td align="center" valign="top">95.69</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>ROC curve aims to compare the sensitivity and specificity across a range of values for the predictive ability of supervised machine learning methods, and AUC means overall accuracies in distinguishing data samples (<xref ref-type="bibr" rid="ref10">Florkowski, 2008</xref>). As for confusion matrix, it is a table that shows the classification results based on the true class and predicted class (<xref ref-type="bibr" rid="ref31">Tang et al., 2021</xref>). Therefore, in this study, we plotted both ROC curve and confusion matrix for the optimal prediction model CNN. As for the ROC curve, the x-axis represents the specificity (false positive rate, FPR) while the y-axis represents the sensitivity (true positive rate, TPR). According to <xref rid="fig4" ref-type="fig">Figure 4A</xref>, it could be seen that the AUC value was 1.00, which indicated that the CNN model had very high specificity and sensitivity. The confusion matrix showed the specific performance of the model on the test set data (<xref rid="fig4" ref-type="fig">Figure 4B</xref>), It could be seen that the prediction accuracy of CNN models was 100% for <italic>Shigella</italic> spp., and 99% for <italic>E</italic>. <italic>coli</italic>, while 1% of the <italic>E</italic>. <italic>coli</italic> spectra was misidentified as <italic>Shigella</italic> spp., indicating that these spectra could be accurately assigned to the correct species with very low error rate.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>ROC curve and confusion matrix for the deep learning CNN model when applied to the SERS spectra of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coil</italic>. <bold>(A)</bold> ROC curve. According to the comparison, CNN achieved the best performance with area under curve (AUC)&#x2009;=&#x2009;1.00 than all other algorithms. <bold>(B)</bold> Confusion matrix. Numbers in the confusion matrix stood for the percentage of correctly classified (diagonal) or mis-classified (off-diagonal) spectra, respectively.</p>
</caption>
<graphic xlink:href="fmicb-14-1101357-g004.tif"/>
</fig>
</sec>
<sec id="sec24">
<label>3.5.</label>
<title>Grad-CAM analysis of <italic>Shigella</italic> spp., and <italic>Escherichia coli</italic> surface enhanced Raman spectroscopy spectra</title>
<p>In order to observe the distributions of the CNN model in the SERS spectra of different bacterial genera, we used the Grad-CAM algorithm to analyze the full spectral data. It could be seen that the heatmap distribution of the raw spectra data was determined by the intensity of characteristic peaks, that is, high intensity region appeared in red and low intensity region appeared in white (<xref rid="fig5" ref-type="fig">Figure 5A</xref>). As for the spectral data output by the CNN model, they were not classified according to the characteristic peaks as previously inferred. Instead, according to the results, there were obvious differences in the weight distribution between the spectra of the two bacterial genera (<xref rid="fig5" ref-type="fig">Figure 5B</xref>). In order to better interpret the result, we arbitrarily divided the heatmap into three regions. In the first region of the spectra, the CNN model assigned more attention in the range of 756-754&#x2009;cm<sup>&#x2212;1</sup> in <italic>E</italic>. <italic>coil</italic>, while more attention was distributed in the range of 688-721&#x2009;cm<sup>&#x2212;1</sup> for the SERS spectra of <italic>Shigella</italic> spp. In the second region, where the spectral intensity was intermediate, the model did not pay much attention to <italic>E</italic>. <italic>coli</italic> in this area, while for <italic>Shigella</italic> spp., the attention of CNN model mainly focused on around the characteristic peak at 994&#x2013;1000&#x2009;cm<sup>&#x2212;1</sup>. In the third region of the spectra, the model focused on the Raman shifts at 1484&#x2013;1542&#x2009;cm<sup>&#x2212;1</sup> for <italic>E</italic>. <italic>coil</italic>, but for <italic>Shigella</italic>, the model assigned more weights on the end of the spectrum from 1764&#x2009;cm<sup>&#x2212;1</sup> to 1776&#x2009;cm<sup>&#x2212;1</sup>. To further demonstrate how the CNN model classified <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coil</italic>, we used TSNE to show the extraction results of spectral features by the model. It could be seen that the two bacterial groups were divided into two well-separated clusters, and according the label display, it can be judged that the model can distinguish the two bacteria well (<xref rid="fig5" ref-type="fig">Figure 5C</xref>). In sum, Grad-CAM analysis confirmed the reliability of the CNN model, indicating that it had the ability to accurately identify <italic>Shigella</italic> spp., from <italic>E</italic>. <italic>coil</italic>.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Schematic illustration of the computational mechanisms behind the CNN model classification of <italic>Shigella spp</italic>., and <italic>E</italic>. <italic>coil</italic> SERS spectra. <bold>(A)</bold> Heatmap of raw SERS spectra. <bold>(B)</bold> Model weight allocation in SERS spectra arbitrarily divided into three regions. <bold>(C)</bold> Classification of SERS spectra. For the heatmap, the darker the color, the more attention the CNN model pays. As for the clustering analysis, the two bacterial genera, <italic>Shigella</italic> spp., and <italic>Escherichia coli</italic>, were represented by different labels and colors.</p>
</caption>
<graphic xlink:href="fmicb-14-1101357-g005.tif"/>
</fig>
</sec>
</sec>
<sec id="sec25" sec-type="discussions">
<label>4.</label>
<title>Discussion</title>
<p>It is well known that, due to close similarities in both genotypes and phenotypes, it is technically difficult and time-consuming to differentiate <italic>Shigella</italic> spp., from <italic>E</italic>. <italic>coli</italic> (<xref ref-type="bibr" rid="ref26">Rautureau et al., 2019</xref>), which mainly involves biochemical characteristics and serotyping (<xref ref-type="bibr" rid="ref9">Devanga Ragupathi et al., 2018</xref>). Recently, <xref ref-type="bibr" rid="ref32">van den Beld et al. (2022)</xref> reported that MALDI-TOF MS using a customized database, biomarker assignment, or mathematical classifiers cannot differentiate <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>, either, which strengthened the difficulties of the issue. However, as a proof-of-concept, <xref ref-type="bibr" rid="ref24">Pizzato et al. (2022)</xref> used MALDI-TOF MS with negative ion mode to generate lipid profiles of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>, through which these species could be discriminated at accurate rates of around 0.9 when paired with in-house machine learning algorithm and top-ranked features. Recently, with the development of whole genome sequencing technology, the advanced method has also been used for the differentiation of <italic>E</italic>. <italic>coli</italic> and <italic>Shigella</italic> spp. According to a study by <xref ref-type="bibr" rid="ref5">Chattaway et al. (2017)</xref> <italic>Shigella</italic> was successfully identified from <italic>E</italic>. <italic>coli</italic> and accurately differentiated to the species level <italic>via</italic> kmer-based approach. A nuclear magnetic resonance (NMR) based method for the characterizing the metabolomic features of culture media for lactose negative <italic>E</italic>. <italic>coli</italic> and <italic>Shigella</italic> spp., has also been reported recently, according to the results, when coupled with multivariate classification model analysis, it was revealed that the two very closely related species could be separated <italic>via</italic> bacterial metabolic footprints (<xref ref-type="bibr" rid="ref26">Rautureau et al., 2019</xref>). However, considering the sophisticated procedures and high expenses of these novel methods, it is implausible to adopt the methodologies and apply them to routine laboratory tests.</p>
<p>As an easy-to-learn, low-cost, non-invasive and label-free method, Raman spectroscopy, especially the surface enhanced Raman spectroscopy due to the significantly enhanced Raman signals, has great application potential for rapid and accurate bacterial pathogen identification in clinical settings, though huge challenges exist and the method has been officially used in real-world situation yet (<xref ref-type="bibr" rid="ref33">Wang et al., 2021</xref>). Previously, the promising SERS technique has been widely used for both genus/species discrimination and antibiotic resistance profiling in clinically important bacterial pathogens with rapid speed and high accuracy (<xref ref-type="bibr" rid="ref11">Ho et al., 2019</xref>; <xref ref-type="bibr" rid="ref31">Tang et al., 2021</xref>; <xref ref-type="bibr" rid="ref17">Liu et al., 2022</xref>; <xref ref-type="bibr" rid="ref30">Tang et al., 2022</xref>; <xref ref-type="bibr" rid="ref34">Wang et al., 2022a</xref>,<xref ref-type="bibr" rid="ref35">b</xref>). However, there is currently no reported of using label-free SERS technique coupled with machine learning algorithms for the differentiation of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>, which is thoroughly investigated in this study from the comparison of characteristic peaks for unique molecular structure and components, to clustering analysis of distinct spectral groups, and then to species predictions based on supervised machine learning algorithms. According to the results, it was found that the deep learning algorithm CNN had the best performance and could achieve 99.64% accuracy for the discrimination of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>. The result is consistent with previous studies, in which CNN model has been found to be the best for analyzing and predicting bacterial species (<xref ref-type="bibr" rid="ref31">Tang et al., 2021</xref>; <xref ref-type="bibr" rid="ref17">Liu et al., 2022</xref>; <xref ref-type="bibr" rid="ref30">Tang et al., 2022</xref>; <xref ref-type="bibr" rid="ref34">Wang et al., 2022a,b</xref>), though other machine learning algorithms such as SVM and RF also achieved very high levels of accuracy for species identification. Therefore, through this study, it was suggested that the label-free SERS technique coupled with machine learning algorithms could be used for the rapid discrimination of <italic>Shigella</italic> spp., and <italic>Escherichia coli</italic>.</p>
</sec>
<sec id="sec26">
<label>5.</label>
<title>Conclusion and limitations</title>
<p>Rapid and accurate identification and discrimination of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> is essential in the prevention and control of diarrhea, especially for children under the age of 5 years old. However, current methods suffer from limitations in discriminating the two very closely related bacterial species and novel techniques are urgently needed in clinical laboratories. In this study, we explored the performance of the rapid and sensitive SERS technique and combined it with the advanced deep learning algorithm CNN in order to identify <italic>Shigella</italic> spp., from <italic>E</italic>. <italic>coli</italic> by using the handheld Raman spectrometer. According to the results, the portable spectrometer is sufficient in acquiring high-quality SERS spectra from <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> colonies in clinical lab, which confirms the applicability of the instrument as a POCT device. In addition, SERS spectral analysis revealed that intrinsic differences existed between <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> due to the presence of unique characteristic peaks, which was further confirmed through clustering analysis <italic>via</italic> both unsupervised and supervised machine learning models. As for species prediction, comparative machine learning analysis of SERS spectra showed that the deep learning algorithm CNN had the best performance. However, due to the comparatively small number of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> strains involved in this study, the capacity of the CNN model generalization might be restricted. In addition, since different bacterial culture media, cultivation conditions, and physiological states could also influence the SERS spectra, more <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic> strains cultivated under different conditions should be included for SERS spectral analysis in future investigations, which will greatly improve the robustness and generalization of the constructed machine learning models. Taken together, this study confirmed the application potential of SERS technique <italic>via</italic> handheld Raman spectrometer in the discrimination of <italic>Shigella</italic> spp., and <italic>E</italic>. <italic>coli</italic>, which may facilitate diagnosis, control and prevention of diarrhea in clinical laboratory in near future.</p>
</sec>
<sec id="sec27" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="sec28">
<title>Author contributions</title>
<p>LW, XW, and Z-KL conceived and designed the experiments. LW and XW provided platform and resources. LW contributed to project administration and student supervision. LW and WL contributed to the funding acquisitions. WL, J-WT, J-YM, J-WL, Y-WD, Y-LL, and Y-FL carried out the computational and experimental investigations. All the authors wrote and revised the manuscript, and contributed to the article and approved the submitted version.</p>
</sec>
<sec id="sec29" sec-type="funding-information">
<title>Funding</title>
<p>LW was supported by National Natural Science Foundation of China (Grant No. 31900022), Xuzhou Key R&#x0026;D Plan Social Development Project (Grant No. KC22300), and Jiang-Su Qing-Lan Project (2020).</p>
</sec>
<sec id="conf1" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="sec100" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<ack>
<p>We thank the reviewers for their thoughtful comments that greatly improve the quality of the manuscript.</p>
</ack>
<sec id="sec31" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fmicb.2023.1101357/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fmicb.2023.1101357/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.DOCX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Abdel-Ilah</surname> <given-names>L.</given-names></name> <name><surname>Veljovi&#x0107;</surname> <given-names>E.</given-names></name> <name><surname>Gurbeta</surname> <given-names>L.</given-names></name> <name><surname>Badnjevi&#x0107;</surname> <given-names>A.</given-names></name></person-group> (<year>2017</year>). <article-title>Applications of QSAR Study in Drug Design</article-title>. <source>Int. J. Eng. Res. Technol.</source>, <volume>6</volume>, <fpage>1</fpage>&#x2013;<lpage>6</lpage>.</citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Athamneh</surname> <given-names>A.</given-names></name> <name><surname>Alajlouni</surname> <given-names>R.</given-names></name> <name><surname>Wallace</surname> <given-names>R.</given-names></name> <name><surname>Seleem</surname> <given-names>M.</given-names></name> <name><surname>Senger</surname> <given-names>R.</given-names></name></person-group> (<year>2014</year>). <article-title>Phenotypic profiling of antibiotic response signatures in <italic>Escherichia coli</italic> using Raman spectroscopy</article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>58</volume>, <fpage>1302</fpage>&#x2013;<lpage>1314</lpage>. doi: <pub-id pub-id-type="doi">10.1128/AAC.02098-13</pub-id>, PMID: <pub-id pub-id-type="pmid">24295982</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bashir</surname> <given-names>S.</given-names></name> <name><surname>Nawaz</surname> <given-names>H.</given-names></name> <name><surname>Majeed</surname> <given-names>M. I.</given-names></name> <name><surname>Mohsin</surname> <given-names>M.</given-names></name> <name><surname>Nawaz</surname> <given-names>A.</given-names></name> <name><surname>Rashid</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Surface-enhanced Raman spectroscopy for the identification of tigecycline-resistant E. coli strains</article-title>. <source>Spectrochim. Acta A Mol. Biomol. Spectrosc.</source> <volume>258</volume>:<fpage>119831</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.saa.2021.119831</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Belotserkovsky</surname> <given-names>I.</given-names></name> <name><surname>Sansonetti</surname> <given-names>P. J.</given-names></name></person-group> (<year>2018</year>). &#x201C;<article-title><italic>Shigella</italic> and Enteroinvasive <italic>Escherichia coli</italic></article-title>&#x201D; in <source><italic>Escherichia coli</italic>, a versatile pathogen. Current Topics in Microbiology and Immunology</source>, <italic>Vol</italic> <volume>416</volume>. eds. <person-group person-group-type="editor"><name><surname>Singh</surname> <given-names>U.</given-names></name> <name><surname>Praharaj</surname> <given-names>C.</given-names></name> <name><surname>Singh</surname> <given-names>S.</given-names></name> <name><surname>Singh</surname> <given-names>N.</given-names></name></person-group> (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>1</fpage>&#x2013;<lpage>26</lpage>.</citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chattaway</surname> <given-names>M. A.</given-names></name> <name><surname>Schaefer</surname> <given-names>U.</given-names></name> <name><surname>Tewolde</surname> <given-names>R.</given-names></name> <name><surname>Dallman</surname> <given-names>T. J.</given-names></name> <name><surname>Jenkins</surname> <given-names>C.</given-names></name> <name><surname>Ledeboer</surname> <given-names>N. A.</given-names></name></person-group> (<year>2017</year>). <article-title>Identification of <italic>Escherichia coli</italic> and <italic>Shigella</italic> species from whole-genome sequences</article-title>. <source>J. Clin. Microbiol.</source> <volume>55</volume>, <fpage>616</fpage>&#x2013;<lpage>623</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JCM.01790-16</pub-id>, PMID: <pub-id pub-id-type="pmid">27974538</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>Q.</given-names></name> <name><surname>Zhao</surname> <given-names>L.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name> <name><surname>Ding</surname> <given-names>Q.</given-names></name> <name><surname>Jia</surname> <given-names>C.</given-names></name> <name><surname>Liao</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Nanoporous silver nanorods as surface-enhanced Raman scattering substrates</article-title>. <source>Biosens. Bioelectron.</source> <volume>202</volume>:<fpage>114004</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.bios.2022.114004</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cheng</surname> <given-names>W. T.</given-names></name> <name><surname>Liu</surname> <given-names>M. T.</given-names></name> <name><surname>Liu</surname> <given-names>H. N.</given-names></name> <name><surname>Lin</surname> <given-names>S. Y.</given-names></name></person-group> (<year>2005</year>). <article-title>Micro-Raman spectroscopy used to identify and grade human skin pilomatrixoma</article-title>. <source>Microsc. Res. Tech.</source> <volume>68</volume>, <fpage>75</fpage>&#x2013;<lpage>79</lpage>. doi: <pub-id pub-id-type="doi">10.1002/jemt.20229</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Demirel</surname> <given-names>M.</given-names></name> <name><surname>Kao</surname> <given-names>P.</given-names></name> <name><surname>Malvadkar</surname> <given-names>N.</given-names></name> <name><surname>Wang</surname> <given-names>H.</given-names></name> <name><surname>Gong</surname> <given-names>X.</given-names></name> <name><surname>Poss</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>Bio-organism sensing via surface enhanced Raman spectroscopy on controlled metal/polymer nanostructured substrates</article-title>. <source>Biointerphases</source> <volume>4</volume>, <fpage>35</fpage>&#x2013;<lpage>41</lpage>. doi: <pub-id pub-id-type="doi">10.1116/1.3147962</pub-id>, PMID: <pub-id pub-id-type="pmid">20408721</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Devanga Ragupathi</surname> <given-names>N. K.</given-names></name> <name><surname>Muthuirulandi Sethuvel</surname> <given-names>D. P.</given-names></name> <name><surname>Inbanathan</surname> <given-names>F. Y.</given-names></name> <name><surname>Veeraraghavan</surname> <given-names>B.</given-names></name></person-group> (<year>2018</year>). <article-title>Accurate differentiation of <italic>Escherichia coli</italic> and <italic>Shigella</italic> serogroups: challenges and strategies</article-title>. <source>New Microb. New Infect.</source> <volume>21</volume>, <fpage>58</fpage>&#x2013;<lpage>62</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.nmni.2017.09.003</pub-id>, PMID: <pub-id pub-id-type="pmid">29204286</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Florkowski</surname> <given-names>C. M.</given-names></name></person-group> (<year>2008</year>). <article-title>Sensitivity, specificity, receiver-operating characteristic (ROC) curves and likelihood ratios: communicating the performance of diagnostic tests</article-title>. <source>Clin. Biochem. Rev.</source> <volume>29</volume>, <fpage>S83</fpage>&#x2013;<lpage>S87</lpage>. PMID: <pub-id pub-id-type="pmid">18852864</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ho</surname> <given-names>C.-S.</given-names></name> <name><surname>Jean</surname> <given-names>N.</given-names></name> <name><surname>Hogan</surname> <given-names>C. A.</given-names></name> <name><surname>Blackmon</surname> <given-names>L.</given-names></name> <name><surname>Jeffrey</surname> <given-names>S. S.</given-names></name> <name><surname>Holodniy</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Rapid identification of pathogenic bacteria using Raman spectroscopy and deep learning. <italic>Nature</italic></article-title>. <source>Communications</source> <volume>10</volume>:<fpage>2898</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-019-12898-9</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kubryk</surname> <given-names>P.</given-names></name> <name><surname>Niessner</surname> <given-names>R.</given-names></name> <name><surname>Ivleva</surname> <given-names>N. P.</given-names></name></person-group> (<year>2016</year>). <article-title>The origin of the band at around 730 cm&#x2212; 1 in the SERS spectra of bacteria: a stable isotope approach</article-title>. <source>Analyst</source> <volume>141</volume>, <fpage>2874</fpage>&#x2013;<lpage>2878</lpage>. doi: <pub-id pub-id-type="doi">10.1039/C6AN00306K</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Laska</surname> <given-names>J.</given-names></name> <name><surname>Widlarz</surname> <given-names>J.</given-names></name></person-group> (<year>2005</year>). <article-title>Spectroscopic and structural characterization of low molecular weight fractions of polyaniline</article-title>. <source>Polymer</source> <volume>46</volume>, <fpage>1485</fpage>&#x2013;<lpage>1495</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.polymer.2004.12.008</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>K. S.</given-names></name> <name><surname>Landry</surname> <given-names>Z.</given-names></name> <name><surname>Pereira</surname> <given-names>F. C.</given-names></name> <name><surname>Wagner</surname> <given-names>M.</given-names></name> <name><surname>Berry</surname> <given-names>D.</given-names></name> <name><surname>Huang</surname> <given-names>W. E.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Raman microspectroscopy for microbiology</article-title>. <source>Nat. Rev. Methods Prim.</source> <volume>1</volume>:<fpage>75</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s43586-021-00075-6</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Linderman</surname> <given-names>G. C.</given-names></name> <name><surname>Steinerberger</surname> <given-names>S. J. S. J. O. M. O. D. S.</given-names></name></person-group> (<year>2019</year>). <article-title>Clustering with t-SNE</article-title>. <source>Provably</source> <volume>1</volume>, <fpage>313</fpage>&#x2013;<lpage>332</lpage>. doi: <pub-id pub-id-type="doi">10.1137/18M1216134</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Peng</surname> <given-names>N.</given-names></name> <name><surname>Yao</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Peng</surname> <given-names>X.</given-names></name> <name><surname>Zhao</surname> <given-names>L.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Breaking the nanoparticle&#x2019;s dispersible limit via rotatable surface ligands</article-title>. <source>Nat. Commun.</source> <volume>13</volume>:<fpage>3581</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-022-31275-7</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>W.</given-names></name> <name><surname>Tang</surname> <given-names>J.-W.</given-names></name> <name><surname>Lyu</surname> <given-names>J.-W.</given-names></name> <name><surname>Wang</surname> <given-names>J.-J.</given-names></name> <name><surname>Pan</surname> <given-names>Y.-C.</given-names></name> <name><surname>Shi</surname> <given-names>X.-Y.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Discrimination between Carbapenem-resistant and Carbapenem-sensitive <italic>Klebsiella pneumoniae</italic> strains through computational analysis of surface-enhanced Raman spectra: a pilot study</article-title>. <source>Microbiol. Spectr.</source> <volume>10</volume>:<fpage>e0240921</fpage>. doi: <pub-id pub-id-type="doi">10.1128/spectrum.02409-21</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Zhou</surname> <given-names>H.</given-names></name> <name><surname>Hu</surname> <given-names>Z.</given-names></name> <name><surname>Yu</surname> <given-names>G.</given-names></name> <name><surname>Yang</surname> <given-names>D.</given-names></name> <name><surname>Zhao</surname> <given-names>J.</given-names></name></person-group> (<year>2017</year>). <article-title>Label and label-free based surface-enhanced Raman scattering for pathogen bacteria detection: A review</article-title>. <source>Biosens. Bioelectron.</source> <volume>94</volume>, <fpage>131</fpage>&#x2013;<lpage>140</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.bios.2017.02.032</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lu</surname> <given-names>X.</given-names></name> <name><surname>Al-Qadiri</surname> <given-names>H. M.</given-names></name> <name><surname>Lin</surname> <given-names>M.</given-names></name> <name><surname>Rasco</surname> <given-names>B. A.</given-names></name></person-group> (<year>2011</year>). <article-title>Application of mid-infrared and Raman spectroscopy to the study of bacteria</article-title>. <source>Food Bioprocess Technol.</source> <volume>4</volume>, <fpage>919</fpage>&#x2013;<lpage>935</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11947-011-0516-8</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lu</surname> <given-names>W.</given-names></name> <name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Fu</surname> <given-names>Y. V. J. A. C.</given-names></name></person-group> (<year>2020</year>). <article-title>Combination of an artificial intelligence approach and laser tweezers Raman spectroscopy for microbial identification</article-title>. <source>Anal Chem.</source> <volume>92</volume>, <fpage>6288</fpage>&#x2013;<lpage>6296</lpage>. doi: <pub-id pub-id-type="doi">10.1021/acs.analchem.9b04946</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pezzotti</surname> <given-names>G.</given-names></name> <name><surname>Boschetto</surname> <given-names>F.</given-names></name> <name><surname>Ohgitani</surname> <given-names>E.</given-names></name> <name><surname>Fujita</surname> <given-names>Y.</given-names></name> <name><surname>Shin-Ya</surname> <given-names>M.</given-names></name> <name><surname>Adachi</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Raman molecular fingerprints of SARS-CoV-2 British variant and the concept of Raman barcode</article-title>. <source>Adv. Sci.</source> <volume>9</volume>:<fpage>e2103287</fpage>. doi: <pub-id pub-id-type="doi">10.1002/advs.202103287</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pezzotti</surname> <given-names>G.</given-names></name> <name><surname>Kobara</surname> <given-names>M.</given-names></name> <name><surname>Nakaya</surname> <given-names>T.</given-names></name> <name><surname>Imamura</surname> <given-names>H.</given-names></name> <name><surname>Fujii</surname> <given-names>T.</given-names></name> <name><surname>Miyamoto</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Raman metabolomics of <italic>Candida auris</italic> clades: profiling and barcode identification</article-title>. <source>Int. J. Mol. Sci.</source> <volume>23</volume>:<fpage>1736</fpage>. doi: <pub-id pub-id-type="doi">10.3390/ijms231911736</pub-id>, PMID: <pub-id pub-id-type="pmid">36233043</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pezzotti</surname> <given-names>N.</given-names></name> <name><surname>Thijssen</surname> <given-names>J.</given-names></name> <name><surname>Mordvintsev</surname> <given-names>A.</given-names></name> <name><surname>H&#x00F6;llt</surname> <given-names>T.</given-names></name> <name><surname>Van Lew</surname> <given-names>B.</given-names></name> <name><surname>Lelieveldt</surname> <given-names>B. P.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>GPGPU linear complexity t-SNE optimization</article-title>. <source>IEEE Trans. Vis. Comput. Graph.</source> <volume>26</volume>, <fpage>1172</fpage>&#x2013;<lpage>1181</lpage>. doi: <pub-id pub-id-type="doi">10.1109/TVCG.2019.2934307</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pizzato</surname> <given-names>J.</given-names></name> <name><surname>Tang</surname> <given-names>W.</given-names></name> <name><surname>Bernabeu</surname> <given-names>S.</given-names></name> <name><surname>Bonnin</surname> <given-names>R. A.</given-names></name> <name><surname>Bille</surname> <given-names>E.</given-names></name> <name><surname>Farfour</surname> <given-names>E.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Discrimination of <italic>Escherichia coli</italic>, <italic>Shigella flexneri</italic>, and <italic>Shigella sonnei</italic> using lipid profiling by MALDI-TOF mass spectrometry paired with machine learning</article-title>. <source>Microbiol. Open</source> <volume>11</volume>:<fpage>e1313</fpage>. doi: <pub-id pub-id-type="doi">10.1002/mbo3.1313</pub-id>, PMID: <pub-id pub-id-type="pmid">36004556</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pupo</surname> <given-names>G. M.</given-names></name> <name><surname>Lan</surname> <given-names>R.</given-names></name> <name><surname>Reeves</surname> <given-names>P. R.</given-names></name></person-group> (<year>2000</year>). <article-title>Multiple independent origins of <italic>Shigella</italic> clones of <italic>Escherichia coli</italic> and convergent evolution of many of their characteristics</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>97</volume>, <fpage>10567</fpage>&#x2013;<lpage>10572</lpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.180094797</pub-id>, PMID: <pub-id pub-id-type="pmid">10954745</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rautureau</surname> <given-names>G. J. P.</given-names></name> <name><surname>Palama</surname> <given-names>T. L.</given-names></name> <name><surname>Canard</surname> <given-names>I.</given-names></name> <name><surname>Mirande</surname> <given-names>C.</given-names></name> <name><surname>Chatellier</surname> <given-names>S.</given-names></name> <name><surname>Van Belkum</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Discrimination of <italic>Escherichia coli</italic> and <italic>Shigella</italic> spp., by nuclear magnetic resonance based Metabolomic characterization of culture media</article-title>. <source>ACS Infect. Dis.</source> <volume>5</volume>, <fpage>1879</fpage>&#x2013;<lpage>1886</lpage>. doi: <pub-id pub-id-type="doi">10.1021/acsinfecdis.9b00199</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rebrosova</surname> <given-names>K.</given-names></name> <name><surname>Samek</surname> <given-names>O.</given-names></name> <name><surname>Kizovsky</surname> <given-names>M.</given-names></name> <name><surname>Bernatova</surname> <given-names>S.</given-names></name> <name><surname>Hola</surname> <given-names>V.</given-names></name> <name><surname>Ruzicka</surname> <given-names>F.</given-names></name></person-group> (<year>2022</year>). <article-title>Raman spectroscopy&#x2014;A novel method for identification and characterization of microbes on a single-cell level in clinical settings</article-title>. <source>Front. Cell. Infect. Microbiol.</source> <volume>12</volume>:<fpage>6463</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fcimb.2022.866463</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Szekeres</surname> <given-names>G. P.</given-names></name> <name><surname>Kneipp</surname> <given-names>J.</given-names></name></person-group> (<year>2019</year>). <article-title>SERS probing of proteins in gold nanoparticle agglomerates</article-title>. <source>Front. Chem.</source> <volume>7</volume>:<fpage>30</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fchem.2019.00030</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Talabis</surname> <given-names>M. R. M.</given-names></name> <name><surname>Mcpherson</surname> <given-names>R.</given-names></name> <name><surname>Miyamoto</surname> <given-names>I.</given-names></name> <name><surname>Martin</surname> <given-names>J. L.</given-names></name> <name><surname>Kaye</surname> <given-names>D.</given-names></name></person-group> (eds) (<year>2015</year>). &#x201C;<article-title>Analytics defined</article-title>&#x201D; in <source>Information security analytics</source>, <publisher-name>Syngress</publisher-name>, <fpage>1</fpage>&#x2013;<lpage>12</lpage>.</citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname> <given-names>J. W.</given-names></name> <name><surname>Li</surname> <given-names>J. Q.</given-names></name> <name><surname>Yin</surname> <given-names>X. C.</given-names></name> <name><surname>Xu</surname> <given-names>W. W.</given-names></name> <name><surname>Pan</surname> <given-names>Y. C.</given-names></name> <name><surname>Liu</surname> <given-names>Q. H.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Rapid discrimination of clinically important pathogens through machine learning analysis of surface enhanced Raman spectra</article-title>. <source>Front. Microbiol.</source> <volume>13</volume>:<fpage>843417</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fmicb.2022.843417</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname> <given-names>J.-W.</given-names></name> <name><surname>Liu</surname> <given-names>Q.-H.</given-names></name> <name><surname>Yin</surname> <given-names>X.-C.</given-names></name> <name><surname>Pan</surname> <given-names>Y.-C.</given-names></name> <name><surname>Wen</surname> <given-names>P.-B.</given-names></name> <name><surname>Liu</surname> <given-names>X.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Comparative analysis of machine learning algorithms on surface enhanced Raman spectra of clinical staphylococcus species</article-title>. <source>Front. Microbiol.</source> <volume>12</volume>:<fpage>6921</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fmicb.2021.696921</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van Den Beld</surname> <given-names>M. J. C.</given-names></name> <name><surname>Rossen</surname> <given-names>J. W. A.</given-names></name> <name><surname>Evers</surname> <given-names>N.</given-names></name> <name><surname>Kooistra-Smid</surname> <given-names>M. A. M. D.</given-names></name> <name><surname>Reubsaet</surname> <given-names>F. A. G.</given-names></name></person-group> (<year>2022</year>). <article-title>MALDI-TOF MS using a custom-made database, biomarker assignment, or mathematical classifiers does not differentiate <italic>Shigella</italic> spp., and <italic>Escherichia coli</italic></article-title>. <source>Microorganisms</source> <volume>10</volume>:<fpage>435</fpage>. doi: <pub-id pub-id-type="doi">10.3390/microorganisms10020435</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Liu</surname> <given-names>W.</given-names></name> <name><surname>Tang</surname> <given-names>J.-W.</given-names></name> <name><surname>Wang</surname> <given-names>J.-J.</given-names></name> <name><surname>Liu</surname> <given-names>Q.-H.</given-names></name> <name><surname>Wen</surname> <given-names>P.-B.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Applications of Raman spectroscopy in bacterial infections: principles, advantages, and shortcomings</article-title>. <source>Front. Microbiol.</source> <volume>12</volume>:<fpage>3580</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fmicb.2021.683580</pub-id>, PMID: <pub-id pub-id-type="pmid">34349740</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Tang</surname> <given-names>J.-W.</given-names></name> <name><surname>Li</surname> <given-names>F.</given-names></name> <name><surname>Usman</surname> <given-names>M.</given-names></name> <name><surname>Wu</surname> <given-names>C.-Y.</given-names></name> <name><surname>Liu</surname> <given-names>Q.-H.</given-names></name> <etal/></person-group>. (<year>2022a</year>). <article-title>Identification of bacterial pathogens at genus and species levels through combination of Raman spectrometry and deep-learning algorithms</article-title>. <source>Microbiol. Spectr.</source> <volume>10</volume>:<fpage>e0258022</fpage>. doi: <pub-id pub-id-type="doi">10.1128/spectrum.02580-22</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Zhang</surname> <given-names>X.-D.</given-names></name> <name><surname>Tang</surname> <given-names>J.-W.</given-names></name> <name><surname>Ma</surname> <given-names>Z.-W.</given-names></name> <name><surname>Usman</surname> <given-names>M.</given-names></name> <name><surname>Liu</surname> <given-names>Q.-H.</given-names></name> <etal/></person-group>. (<year>2022b</year>). <article-title>Machine learning analysis of SERS fingerprinting for the rapid determination of mycobacterium tuberculosis infection and drug resistance</article-title>. <source>Comput. Struct. Biotechnol. J.</source> <volume>20</volume>, <fpage>5364</fpage>&#x2013;<lpage>5377</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.csbj.2022.09.031</pub-id>, PMID: <pub-id pub-id-type="pmid">36212533</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Zhu</surname> <given-names>Z.</given-names></name> <name><surname>Qian</surname> <given-names>H.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Ma</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Comparative genome analysis of 15 clinical <italic>Shigella flexneri</italic> strains regarding virulence and antibiotic resistance</article-title>. <source>AIMS Microbiol.</source> <volume>5</volume>, <fpage>205</fpage>&#x2013;<lpage>222</lpage>. doi: <pub-id pub-id-type="doi">10.3934/microbiol.2019.3.205</pub-id>, PMID: <pub-id pub-id-type="pmid">31663057</pub-id></citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Worley</surname> <given-names>B.</given-names></name> <name><surname>Powers</surname> <given-names>R.</given-names></name></person-group> (<year>2016</year>). <article-title>PCA as a practical indicator of OPLS-DA model reliability</article-title>. <source>Curr. Metabolomics</source> <volume>4</volume>, <fpage>97</fpage>&#x2013;<lpage>103</lpage>. doi: <pub-id pub-id-type="doi">10.2174/2213235X04666160613122429</pub-id>, PMID: <pub-id pub-id-type="pmid">27547730</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xie</surname> <given-names>Y.</given-names></name> <name><surname>Xu</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Shao</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Label-free detection of the foodborne pathogens of Enterobacteriaceae by surface-enhanced Raman spectroscopy</article-title>. <source>Anal. Methods</source> <volume>5</volume>, <fpage>946</fpage>&#x2013;<lpage>952</lpage>. doi: <pub-id pub-id-type="doi">10.1039/C2AY26107C</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zeiri</surname> <given-names>L.</given-names></name> <name><surname>Bronk</surname> <given-names>B.</given-names></name> <name><surname>Shabtai</surname> <given-names>Y.</given-names></name> <name><surname>Eichler</surname> <given-names>J.</given-names></name> <name><surname>Efrima</surname> <given-names>S.</given-names></name></person-group> (<year>2004</year>). <article-title>Surface-enhanced Raman spectroscopy as a tool for probing specific biochemical components in bacteria</article-title>. <source>Appl. Spectrosc.</source> <volume>58</volume>, <fpage>33</fpage>&#x2013;<lpage>40</lpage>. doi: <pub-id pub-id-type="doi">10.1366/000370204322729441</pub-id>, PMID: <pub-id pub-id-type="pmid">14727718</pub-id></citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname> <given-names>D.-W.</given-names></name> <name><surname>Liu</surname> <given-names>X.-Y.</given-names></name> <name><surname>Zhang</surname> <given-names>P.</given-names></name> <name><surname>Su</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>L.-M.</given-names></name> <name><surname>Wei</surname> <given-names>X.-D.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Rapid identification of mixed enteropathogenic bacteria by means of au nanoparticles@ bacteria using portable Raman spectrometer</article-title>. <source>J. Nanosci. Nanotechnol.</source> <volume>18</volume>, <fpage>6776</fpage>&#x2013;<lpage>6785</lpage>. doi: <pub-id pub-id-type="doi">10.1166/jnn.2018.15510</pub-id>, PMID: <pub-id pub-id-type="pmid">29954493</pub-id></citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhu</surname> <given-names>Z.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Qian</surname> <given-names>H.</given-names></name> <name><surname>Gu</surname> <given-names>F.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Comparative genome analysis of 12 <italic>Shigella sonnei</italic> strains: virulence, resistance, and their interactions</article-title>. <source>Int. Microbiol.</source> <volume>24</volume>, <fpage>83</fpage>&#x2013;<lpage>91</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10123-020-00145-x</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zuo</surname> <given-names>G.</given-names></name> <name><surname>Xu</surname> <given-names>Z.</given-names></name> <name><surname>Hao</surname> <given-names>B.</given-names></name></person-group> (<year>2013</year>). <article-title><italic>Shigella</italic> strains are not clones of <italic>Escherichia coli</italic> but sister species in the genus <italic>Escherichia</italic></article-title>. <source>Genomics Proteomics Bioinformatics</source> <volume>11</volume>, <fpage>61</fpage>&#x2013;<lpage>65</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.gpb.2012.11.002</pub-id>, PMID: <pub-id pub-id-type="pmid">23395177</pub-id></citation></ref>
</ref-list>
</back>
</article>