<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="review-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1483326</article-id>
<article-id pub-id-type="doi">10.3389/fmolb.2024.1483326</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Molecular Biosciences</subject>
<subj-group>
<subject>Review</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Application of machine learning for mass spectrometry-based multi-omics in thyroid diseases</article-title>
<alt-title alt-title-type="left-running-head">Che et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fmolb.2024.1483326">10.3389/fmolb.2024.1483326</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Che</surname>
<given-names>Yanan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2735206/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhao</surname>
<given-names>Meng</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2737556/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gao</surname>
<given-names>Yan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zhang</surname>
<given-names>Zhibin</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zhang</surname>
<given-names>Xiangyang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1912966/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>School of Pharmaceutical Science and Technology</institution>, <institution>Tianjin University</institution>, <addr-line>Tianjin</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of General Surgery</institution>, <institution>Tianjin First Central Hospital</institution>, <addr-line>Tianjin</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1685386/overview">Michele Costanzo</ext-link>, University of Naples Federico II, Italy</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1415363/overview">Giuseppina Fanelli</ext-link>, University of Tuscia, Italy</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2216073/overview">Renu Pandey</ext-link>, Indian Institute of Technology Bombay, India</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Zhibin Zhang, <email>zhibin-zhang@nankai.edu.cn</email>; Xiangyang Zhang, <email>xiangyang.zhang@tju.edu.cn</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>17</day>
<month>12</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>11</volume>
<elocation-id>1483326</elocation-id>
<history>
<date date-type="received">
<day>23</day>
<month>08</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>02</day>
<month>12</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Che, Zhao, Gao, Zhang and Zhang.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Che, Zhao, Gao, Zhang and Zhang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Thyroid diseases, including functional and neoplastic diseases, bring a huge burden to people&#x2019;s health. Therefore, a timely and accurate diagnosis is necessary. Mass spectrometry (MS) based multi-omics has become an effective strategy to reveal the complex biological mechanisms of thyroid diseases. The exponential growth of biomedical data has promoted the applications of machine learning (ML) techniques to address new challenges in biology and clinical research. In this review, we presented the detailed review of applications of ML for MS-based multi-omics in thyroid disease. It is primarily divided into two sections. In the first section, MS-based multi-omics, primarily proteomics and metabolomics, and their applications in clinical diseases are briefly discussed. In the second section, several commonly used unsupervised learning and supervised algorithms, such as principal component analysis, hierarchical clustering, random forest, and support vector machines are addressed, and the integration of ML techniques with MS-based multi-omics data and its application in thyroid disease diagnosis is explored.</p>
</abstract>
<kwd-group>
<kwd>mass spectrometry</kwd>
<kwd>proteomics</kwd>
<kwd>metabolomics</kwd>
<kwd>multi-omics</kwd>
<kwd>thyroid diseases</kwd>
<kwd>machine learning</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Metabolomics</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>The thyroid gland is a small, butterfly-shaped gland located at the base of the neck (<xref ref-type="bibr" rid="B157">Sofia et al., 2019</xref>; <xref ref-type="bibr" rid="B127">Mullur et al., 2014</xref>). It plays a crucial role in regulating various metabolic processes by secreting hormones (<xref ref-type="bibr" rid="B157">Sofia et al., 2019</xref>; <xref ref-type="bibr" rid="B127">Mullur et al., 2014</xref>). Thyroid disease refers to various diseases affecting the thyroid gland, categorized into functional and neoplastic diseases (<xref ref-type="bibr" rid="B169">Vanderpump, 2011</xref>; <xref ref-type="bibr" rid="B197">Zhang et al., 2022</xref>). Functional diseases are classified as hyperthyroidism or hypothyroidism, whereas neoplastic diseases are classified as benign or malignant (<xref ref-type="bibr" rid="B197">Zhang et al., 2022</xref>).</p>
<p>In the field of neoplastic diseases, tumors are classified as benign tumors, low-risk neoplasms, and malignant neoplasms according to prognostic risk categories (<xref ref-type="bibr" rid="B18">Basolo et al., 2023</xref>). Thyroid cancer refers to malignant tumors, originating from follicular or parafollicular thyroid cells, which can metastasize to other places in the body (<xref ref-type="bibr" rid="B134">Omur and Baran, 2014</xref>). Thyroid cancer is one of the most common endocrine neoplasia, and its incidence has been on the rise in the past 40 years, disproportionately affecting women (<xref ref-type="bibr" rid="B38">Chen et al., 2023a</xref>; <xref ref-type="bibr" rid="B60">Guarino et al., 2010</xref>).</p>
<p>According to &#x201c;The 5th edition of the World Health Organization (WHO) classification of endocrine tumors&#x201d; which was released in 2022, thyroid cancer exists in several forms (<xref ref-type="bibr" rid="B153">Schneider and Chen, 2013</xref>), including differentiated thyroid cancer (DTC), undifferentiated thyroid cancer, and medullary thyroid cancer (MTC). DTC, the most prevalent type of thyroid malignancy, primarily includes papillary thyroid carcinoma (PTC), follicular thyroid carcinoma (FTC), and oncocytic thyroid carcinoma, with PTC accounting for 85% &#x2013;90% of all DTC cases (<xref ref-type="bibr" rid="B134">Omur and Baran, 2014</xref>; <xref ref-type="bibr" rid="B32">Caria et al., 2019</xref>). Thyroid cancer presents a complex and clinically significant challenge. To explore the molecular mechanisms of thyroid cancer, researchers have increasingly turned to omics approaches.</p>
<p>Omics is a technique for the comprehensive evaluation of different classes of biomolecules, including genomics, transcriptomics, proteomics, metabolomics, and others (<xref ref-type="bibr" rid="B15">Babu and Snyder, 2023</xref>). Using only one type of data to understand the characteristics and complications of a disease is not enough. Recently, exhaustive exploration through multi-omics strategies has garnered increasing attention among analytical chemists (<xref ref-type="bibr" rid="B83">Kappler and Lehmann, 2019</xref>). Advances in various omics technologies, such as proteomics and metabolomics, coupled with enhanced computing capabilities, have paved the way for innovative integration of diverse omics data (<xref ref-type="bibr" rid="B15">Babu and Snyder, 2023</xref>). With the rapid development of high throughput sequencing and multi-omics, biomedical research has increasingly adopted a combination of multi-omics technologies. Multi-omics strategies aim to scrutinize the same samples using two or more omics methods, integrating diverse omics data to reveal coherent associations and attain a comprehensive, holistic understanding of biomedical processes (<xref ref-type="bibr" rid="B83">Kappler and Lehmann, 2019</xref>).</p>
<p>Mass spectrometry (MS) is crucial for studying multi-omics. It is a high-throughput analytical technology that can quantify countless molecules, from metabolites and lipids to peptides and proteins (<xref ref-type="bibr" rid="B199">Zhao et al., 2022a</xref>; <xref ref-type="bibr" rid="B100">Leung Kwan et al., 2021</xref>). This analytical technology aids in discovering biomarkers, understanding diseases at the molecular level, and provides a new perspective in the biological field (<xref ref-type="bibr" rid="B100">Leung Kwan et al., 2021</xref>). As an emerging approach of biomarker discovery, MS-based multi-omics plays a significant role in the early diagnosis and screening, classification, and prognosis of diseases. However, the large amounts of data generated by high-throughput technologies require specialized data analysis strategies (<xref ref-type="bibr" rid="B200">Zhao et al., 2022b</xref>).</p>
<p>Machine learning (ML) is a driving force behind data integration in systems biology (<xref ref-type="bibr" rid="B4">Alber et al., 2019</xref>). Through data-driven bioinformatics analysis of MS-based multi-omics data, ML serves as a powerful tool for revealing the intrinsic mechanisms of various biological events (<xref ref-type="bibr" rid="B100">Leung Kwan et al., 2021</xref>). The combination of MS-based multi-omics and advanced data integration approach holds promise for deeper investigation of complex biological processes.</p>
<p>In this review, we presented the detailed review of applications of ML for MS-based multi-omics in thyroid disease. In literature previously published, applications of ML in thyroid disease or applications of MS-based multi-omics in thyroid disease are reviewed, but no one has combined them into a comprehensive review. This review can provide new insights to the people who focuses on applications of combining ML with MS-based multi-omics in thyroid disease. It is primarily divided into two sections. The first section briefly introduces MS-based multi-omics, mainly proteomics and metabolomics, and their applications in clinical diseases. The second section addresses a comprehensive overview of ML models, and explores the integration of ML techniques into MS-based multi-omics data, and its application in thyroid disease diagnosis.</p>
</sec>
<sec id="s2">
<title>2 Mass spectrometry-based multi-omics in thyroid diseases</title>
<p>Data from various studies, including genomics, transcriptomics, proteomics, and metabolomics studies together are denoted as &#x201c;multi-omics&#x201d; data (<xref ref-type="fig" rid="F1">Figure 1</xref>). Individual datasets from these &#x201c;-omics&#x201d; studies can serve as valuable biomarkers for studying, exploring, and understanding the traits and complexities of biological organisms (<xref ref-type="bibr" rid="B113">Manochkumar et al., 2023</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Multi-omics analysis flow chart.</p>
</caption>
<graphic xlink:href="fmolb-11-1483326-g001.tif"/>
</fig>
<p>MS plays a crucial role in multi-omics research by detecting metabolites or proteins in samples (<xref ref-type="bibr" rid="B141">Qiu et al., 2023</xref>). The use of mass spectrometry technology for detecting metabolites or proteins in samples can identify thousands of proteins or metabolites across a substantial volume of samples (<xref ref-type="bibr" rid="B94">Kowalczyk et al., 2020</xref>). This high-throughput approach not only improves our ability to identify molecular signatures but also helps us gain a more comprehensive understanding of the intricate biological processes within organisms (<xref ref-type="bibr" rid="B100">Leung Kwan et al., 2021</xref>).</p>
<sec id="s2-1">
<title>2.1 Mass spectrometry-based proteomics</title>
<p>Oncogenesis is associated with changes in the levels of various proteins involved in cell proliferation, migration, and apoptosis (<xref ref-type="bibr" rid="B122">Migisha et al., 2020</xref>). Proteomics enables the maximum identification and quantification of all proteins in cells or tissues, establishes the connection between genes and their corresponding protein products, and provides information about proteins, including their subcellular localization, post-translational modifications, and interactions with other proteins, aiming to reveal the mechanisms behind their biological functions (<xref ref-type="bibr" rid="B113">Manochkumar et al., 2023</xref>; <xref ref-type="bibr" rid="B37">Chen et al., 2023b</xref>; <xref ref-type="bibr" rid="B82">Kang et al., 2022</xref>). The analysis of the proteome can provide valuable insights into the fundamental molecular mechanisms of diseases, responses to therapy, and the identification of diagnostic, predictive biomarkers and prognostic crucial for precision medicine (<xref ref-type="bibr" rid="B16">Ball et al., 2023</xref>).</p>
<p>Mass spectrometry (MS) is an analytical technique that measures the mass-to-charge ratio (m/z) of ionized molecules. The basic components of a mass spectrometer include the ion source, mass analyzer, and detector. Proteins or peptides are ionized in the ion source, separated based on their m/z in the mass analyzer, and detected to generate a mass spectrum. This mass spectrum provides detailed information about the molecular weight and structural characteristics of the analyte. Mass spectrometry-based proteomics mainly includes five processes (<xref ref-type="fig" rid="F2">Figure 2</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>The workflow of MS-based proteomics and metabolomics analysis.</p>
</caption>
<graphic xlink:href="fmolb-11-1483326-g002.tif"/>
</fig>
<sec id="s2-1-1">
<title>2.1.1 Sample preparation</title>
<p>The proteomics workflow begins with the preparation of biological samples. Proteins are extracted from the sample, often followed by enrichment or fractionation to reduce complexity. This step is critical for ensuring the accurate identification and quantification of proteins.</p>
<p>The proteins are then digested into smaller peptides, typically using an enzyme like trypsin. This peptide mixture is more amenable to analysis by MS.</p>
</sec>
<sec id="s2-1-2">
<title>2.1.2 Peptide ionization</title>
<p>Peptides are ionized in the ion source, which can be achieved through various techniques. The most common ionization methods in proteomics are Electrospray Ionization (ESI) and Matrix-Assisted Laser Desorption/Ionization (MALDI).</p>
<p>ESI is widely used for liquid chromatography-mass spectrometry (LC-MS) and generates ions by applying a high voltage to a liquid sample, producing charged droplets that release ions. MALDI involves embedding the sample in a matrix that absorbs laser energy, leading to the ionization of peptides.</p>
</sec>
<sec id="s2-1-3">
<title>2.1.3 Mass analysis</title>
<p>The ionized peptides are introduced into the mass analyzer, where they are separated based on their m/z ratio. There are several types of mass analyzers, including Quadrupole, Time-of-Flight (TOF), Orbitrap, and Ion Trap, each offering different advantages in terms of resolution, accuracy, and speed.</p>
<p>High-resolution mass analyzers, such as the Orbitrap and TOF, are particularly valuable in proteomics for their ability to distinguish between ions with very similar m/z ratios, enabling the identification of complex peptide mixtures.</p>
</sec>
<sec id="s2-1-4">
<title>2.1.4 Peptide fragmentation</title>
<p>To obtain sequence information, peptides are often subjected to fragmentation in the mass spectrometer. Tandem mass spectrometry (MS/MS) involves two stages of mass analysis: the first stage selects a precursor ion, which is then fragmented, and the second stage analyzes the resulting fragment ions.</p>
<p>The fragmentation patterns are characteristic of the peptide&#x2019;s amino acid sequence, allowing for the identification of the peptide and inference of the protein from which it originated (<xref ref-type="bibr" rid="B154">Searle et al., 2020</xref>).</p>
</sec>
<sec id="s2-1-5">
<title>2.1.5 Data analysis</title>
<p>The mass spectrometry data are processed using sophisticated bioinformatics tools. Software such as MaxQuant, Proteome Discoverer, DIA-NN, Peaks, Spectronaut and Mascot matches the obtained mass spectra to theoretical spectra derived from protein databases, enabling protein identification.</p>
<p>Quantitative proteomics can be achieved through various techniques, including label-free quantification, stable isotope labeling (e.g., SILAC, iTRAQ), and tandem mass tags (TMT). These approaches allow for the relative or absolute quantification of proteins across different samples.</p>
<p>The development of highly sensitive and high-throughput MS platforms over the past decade means that it is now possible to identify and quantify thousands of proteins from large numbers of biological samples. Rapid advancements in MS and data analysis strategies have significantly enhanced proteomics research worldwide (<xref ref-type="bibr" rid="B64">Halder et al., 2021</xref>). MS-based proteomics is increasingly recognized as a widely adopted technique for characterizing proteomes (<xref ref-type="bibr" rid="B122">Migisha et al., 2020</xref>). Proteomics research can be divided into untargeted proteomics and targeted proteomics. Untargeted proteomics is also called discovery proteomics, which detects differential proteins in different samples by detecting proteins as many as possible. The research objects of untargeted proteomics are uncertain, and are often all the protein or peptide components contained in the sample, which are relatively large in number. Targeted proteomics is the quantitative detection of target proteins. The research objects of targeted proteomics are specific and the number is relatively small. Compared with untargeted proteomics, it has greater sensitivity and accuracy and is often used for verification analysis of biomarkers. Data-dependent acquisition (DDA) and data-independent acquisition (DIA) are the two primary MS strategies for untargeted proteomics (<xref ref-type="bibr" rid="B140">Qian et al., 2023</xref>). DDA is a traditional MS-based proteomics analysis method. In DDA, in the second stage of tandem mass spectrometry, a small number of peptides are selected for fragmentation within a narrow range of mass-to-charge ratio (m/z) signal intensity (<xref ref-type="bibr" rid="B65">Hu et al., 2016</xref>). DIA is another MS-based proteomics analysis method. DIA divides the entire full scan range of the mass spectrometer into several windows and then fragments all peptide precursors within each window simultaneously to generate a comprehensive MS<sup>2</sup> spectrum (<xref ref-type="bibr" rid="B86">Kawashima et al., 2019</xref>; <xref ref-type="bibr" rid="B180">Wang et al., 2022a</xref>).</p>
</sec>
</sec>
<sec id="s2-2">
<title>2.2 Mass spectrometry-based metabolomics</title>
<p>Metabolomics is to detect and qualitatively and quantitatively analyze the dynamic changes of metabolites of organisms, tissues or cells before and after a specific stimulus or interference which was initially introduced in 1999 by Jeremy-Nicholson and is an emerging research field (<xref ref-type="bibr" rid="B132">Nicholson et al., 1999</xref>; <xref ref-type="bibr" rid="B182">Wang et al., 2023a</xref>). The research objects are metabolites, which are mostly small molecule substances with a molecular mass range of &#x2264;1,000 Da, such as small organics: acids, amino acids, nucleotides, sugars, lipids, vitamins, etc. Metabolites are the end products of cellular processes and can directly reflect the physiological state of an organism. Liquid chromatography coupled to mass spectrometry (LC-MS) was first used to study thyroid cancer in serum samples in 2011 (<xref ref-type="bibr" rid="B194">Yao et al., 2011</xref>). DIA workflow was applied for metabolomics in 2017 (<xref ref-type="bibr" rid="B201">Zhou et al., 2017</xref>).</p>
<p>MS-based metabolomics involves the separation, detection, and characterization of metabolites, providing comprehensive coverage of the metabolome. The workflow is shown in <xref ref-type="fig" rid="F2">Figure 2</xref>.</p>
<sec id="s2-2-1">
<title>2.2.1 Sample preparation</title>
<p>The first step in MS-based metabolomics involves the preparation of biological samples. Metabolites can be extracted from various biological matrices, such as plasma, urine, tissues, or cell cultures, using extraction methods optimized for different classes of metabolites.</p>
<p>Sample preparation is critical to preserving the integrity of the metabolome and avoiding contamination or degradation. The extracted metabolites are often subjected to concentrate to improve the detection of low-abundance compounds.</p>
</sec>
<sec id="s2-2-2">
<title>2.2.2 Metabolite separation</title>
<p>Prior to mass spectrometric analysis, metabolites are typically separated using chromatographic techniques to reduce sample complexity. The most common techniques are Gas Chromatography (GC) and Liquid Chromatography (LC).</p>
<p>Gas Chromatography-Mass Spectrometry (GC-MS) is particularly well-suited for analyzing volatile and semi-volatile compounds. In GC-MS, metabolites are vaporized and separated in a gas phase before being ionized and detected by a mass spectrometer.</p>
<p>Liquid Chromatography-Mass Spectrometry (LC-MS) is more versatile and can handle a broader range of metabolites, including polar, non-volatile, and thermally labile compounds. LC-MS separates metabolites in a liquid phase based on their interaction with the stationary phase and then ionizes them for mass spectrometric detection.</p>
</sec>
<sec id="s2-2-3">
<title>2.2.3 Ionization of metabolites</title>
<p>The ionization of metabolites is a crucial step in mass spectrometry, as it converts neutral molecules into charged ions that can be detected. Common ionization methods include Electrospray Ionization (ESI) and Atmospheric Pressure Chemical Ionization (APCI) for LC-MS, and Electron Ionization (EI) for GC-MS.</p>
<p>ESI is widely used in LC-MS due to its ability to ionize a wide range of metabolites, particularly those that are polar and easily ionizable. ESI produces ions by applying a high voltage to the liquid sample, resulting in charged droplets that release ions as they evaporate.</p>
<p>EI, commonly used in GC-MS, involves bombarding gas-phase molecules with high-energy electrons, leading to ionization and fragmentation. The resulting fragment ions provide structural information about the metabolite.</p>
</sec>
<sec id="s2-2-4">
<title>2.2.4 Mass analysis and detection</title>
<p>Once ionized, metabolites are introduced into the mass analyzer, where they are separated based on their m/z ratio. Unlike proteomics, metabolomics is divided into positive and negative ion modes due to the different properties of the compounds. Various mass analyzers are used in metabolomics, including Quadrupole, Time-of-Flight (TOF), Orbitrap, and Ion Trap analyzers.</p>
<p>High-resolution mass analyzers, such as the Orbitrap and TOF, are particularly valuable in metabolomics for their ability to accurately measure the m/z of metabolites and distinguish between compounds with very similar masses.</p>
</sec>
<sec id="s2-2-5">
<title>2.2.5 Data acquisition and processing</title>
<p>The mass spectrometer generates a mass spectrum, which provides information on the m/z ratios and intensities of detected ions. This data is then processed using specialized software to identify and quantify metabolites.</p>
<p>The identification of metabolites is typically performed by matching the acquired mass spectra against reference libraries, databases or, such as HMDB, Compound Discover, METLIN and SMPDB (<xref ref-type="bibr" rid="B190">Xiao et al., 2012</xref>). Accurate mass measurements and fragmentation patterns are used to deduce the molecular structure of unknown metabolites.</p>
<p>Metabolites can be quantified either relatively, by comparing the intensity of ion signals between samples, or absolutely, using calibration curves with known standards.</p>
<p>MS is a major platform for clinical metabolomics due to its excellent sensitivity, selectivity, and wide dynamic range (<xref ref-type="bibr" rid="B48">Ding and Feng, 2023</xref>). MS-based metabolomics can simultaneously detect and quantify thousands of metabolite features (<xref ref-type="bibr" rid="B7">Alseekh et al., 2021</xref>). Common MS-based metabolomics methods include GC-MS and LC-MS. Compared with GC-MS, LC-MS generates extensive data, has high sensitivity, and can measure a wide range of metabolites. Due to the feasibility of liquid chromatography (LC) in separating a wide range of metabolites with broad polarity, combining LC with high-resolution MS systems consistently detects and quantifies thousands of metabolic features, even from minimal sample amounts such as 10 mg of tissue, 50 uL of urine, or as few as half a million cells (<xref ref-type="bibr" rid="B61">Guo et al., 2022a</xref>). LC-MS-based metabolomics has gained increasing attention for identifying disease biomarkers and providing unique insights into pathophysiological processes (<xref ref-type="bibr" rid="B48">Ding and Feng, 2023</xref>; <xref ref-type="bibr" rid="B143">Randall et al., 2023</xref>).</p>
<p>Mass spectrometry imaging (MSI) technology is also widely used in the study of the spatiotemporal distribution of various metabolites, peptides and proteins in animal/plant tissues due to its advantages such as label-free, non-specific, high sensitivity, high chemical coverage, and simultaneous detection of elements/molecules.</p>
</sec>
</sec>
<sec id="s2-3">
<title>2.3 Mass spectrometry-based multi-omics applications in thyroid diseases</title>
<p>High-throughput techniques, exemplified by MS, play a crucial role in the measurement of metabolomic and proteomic data (<xref ref-type="bibr" rid="B144">Reel et al., 2021</xref>). Collectively, these &#x201c;-omics&#x201d; data hold the potential to significantly advance precision medicine, particularly in the context of biomarker-driven approaches for conditions such as endocrine diseases, diabetes, cancer, cardiovascular disease, respiratory disorders, and Alzheimer&#x2019;s disease (<xref ref-type="bibr" rid="B144">Reel et al., 2021</xref>).</p>
<p>Regarding thyroid diseases, understanding the pathogenesis is essential for improving diagnostic accuracy, precise risk stratification, and enabling personalized treatment (<xref ref-type="bibr" rid="B103">Li et al., 2023a</xref>). In recent years, with the continuous development of MS, various omics analysis methods based on different sample types (cells, tissues, serum, and urine) have been applied to the study of thyroid disease, actively promoting the development of accurate diagnosis and treatment of thyroid disease by clarifying the pathogenesis, diagnostic grading, prognosis prediction and targeted therapy (<xref ref-type="bibr" rid="B103">Li et al., 2023a</xref>).</p>
<p>Biomarkers refer to &#x201c;an indicator that can be objectively detected and evaluated and can be used as an indicator of normal biological processes, pathological processes, or pharmacological responses to therapeutic intervention&#x201d; and are of great significance for screening, diagnosing, or monitoring diseases (<xref ref-type="bibr" rid="B25">Biomarkers, 2001</xref>; <xref ref-type="bibr" rid="B124">Mischak et al., 2010</xref>; <xref ref-type="bibr" rid="B78">Joshi et al., 2024</xref>). The exploration of biomarker discovery holds promise in identifying potential markers for early disease detection, prognosis assessment, predicting and monitoring treatment responses (<xref ref-type="bibr" rid="B76">Jimenez and Verheul, 2014</xref>). The identification and validation of reliable biomarkers will continue to help improve our understanding of thyroid disease and refine treatment strategies (<xref ref-type="bibr" rid="B45">Davis et al., 2020</xref>; <xref ref-type="bibr" rid="B30">Califf, 2018</xref>).</p>
<p>Misdiagnosis is common in the diagnosis of thyroid disease (<xref ref-type="bibr" rid="B172">Walsh, 2016</xref>). Therefore, it is necessary to identify biomarkers for specific thyroid disease states. MS-based proteomics and metabolomics have been widely used for the discovery of potential biomarkers in the research of thyroid disease.</p>
<p>Much of the published proteomic studies of thyroid disease have compared the protein profiles of thyroid disease groups with healthy thyroid groups to find potential protein markers (<xref ref-type="bibr" rid="B136">Paron et al., 2003</xref>). Tissues and cell lines of thyroid are always used for differential proteomics. In a 1997 study, Galectin-3 was proposed to be a potential biomarker of malignant thyroid tumors, especially papillary carcinomas (<xref ref-type="bibr" rid="B54">Fern&#xe1;ndez et al., 1997</xref>). This finding has been confirmed by several other independent researches using different proteomic approaches: MALDI-MSI (<xref ref-type="bibr" rid="B136">Paron et al., 2003</xref>), two-dimensional gel electrophoresis and LC-MS (<xref ref-type="bibr" rid="B167">Torres-Cabala et al., 2004</xref>). S100 family proteins are comprised of 21 small isoforms, and many of them implicated in important cellular functions such as proliferation, motility and survival (<xref ref-type="bibr" rid="B116">Martinez-Aguilar et al., 2015</xref>). Several papers have been published confirming them as potential biomarkers in thyroid cancer by proteomic approaches (<xref ref-type="bibr" rid="B167">Torres-Cabala et al., 2004</xref>; <xref ref-type="bibr" rid="B148">Nishimura et al., 1997</xref>; <xref ref-type="bibr" rid="B174">Wang et al., 2021</xref>). Torres-Cabala, C. et al. identified a new protein, S100C, which is highly expressed in PTC by two-dimensional gel electrophoresis and LC-MS (<xref ref-type="bibr" rid="B167">Torres-Cabala et al., 2004</xref>). S100A6 was found to be expressed at a significantly higher level in PTC compared with other tumor groups or normal tissues by LC-MS based proteomics (<xref ref-type="bibr" rid="B158">Sofiadis et al., 2010</xref>). <xref ref-type="bibr" rid="B133">Nipp et al. (2012)</xref> confirmed S100A10 and S100A6 as biomarkers of PTC with lymph node metastasis identified by MALDI-MSI proteomic approach. This result also demonstrated the potential application of MALDI-MSI proteomic approach in identifying biomarkers in thyroid cancer.</p>
<p>In recent years, exosomes, small membrane microvesicles derived from endosomal cells, have attracted great interest in the proteomics of thyroid diseases due to their role in transporting proteins, lipids and nucleic acids into target cells (<xref ref-type="bibr" rid="B198">Zhang et al., 2019</xref>). Transport of molecules via exosomes is one of the factors in the development of thyroid cancer, and the transported molecules can serve as cancer biomarkers (<xref ref-type="bibr" rid="B165">Surman et al., 2024</xref>). <xref ref-type="bibr" rid="B111">Luo et al. (2018)</xref> compared proteome profiles of serum-purified exosomes (SPEs) from PTC patients with LNM, PTC patients without LNM, and healthy donors. The results showed that specific proteins related to cancer cell metastasis, such as SRC, TLN1, ITGB2, and CAPNS1, were overexpressed in the SPEs of PTC patients with LNM (<xref ref-type="bibr" rid="B111">Luo et al., 2018</xref>). In the study of Xi Jia et al., the screened differentially expressed proteins, such as MAP1S, VAMP8, IF5, RSU1, ACTB and CXCL7, were mainly enriched in the immune system and metabolic system that can be seen as potential biomarkers, indicating that plasma exosomes may play an important role in the systemic immune imbalance of autoimmune thyroid diseases (AITDs) (<xref ref-type="bibr" rid="B75">Jia et al., 2021</xref>).</p>
<p>Proteomics can not only provide biomarkers for diagnosis but also reveal potential therapeutic targets. For example, protein HSP90 was found to be overexpressed in thyroid cancer (<xref ref-type="bibr" rid="B137">Pearl et al., 2008</xref>; <xref ref-type="bibr" rid="B109">Liu et al., 2017</xref>). HSP90 regulates protein degradation of several growth-mediating kinases such as BRAF and RET which are well known for the role they play in carcinogenesis (<xref ref-type="bibr" rid="B56">Gild et al., 2016</xref>). Several studies have shown that inhibition of HSP90 can not only attenuate cell proliferation but also improve the efficacy of radioiodine therapy in thyroid cancer patients (<xref ref-type="bibr" rid="B56">Gild et al., 2016</xref>; <xref ref-type="bibr" rid="B115">Marsee et al., 2004</xref>; <xref ref-type="bibr" rid="B185">Wickenberg et al., 2024</xref>; <xref ref-type="bibr" rid="B184">White et al., 2016</xref>).</p>
<p>Since tumors significantly alter major metabolic pathways, metabolomics is also rapidly becoming an important method for identifying cancer biomarkers. Alterations of the metabolome can be reflected in both tissues and biological fluids. Most chromatography-based metabolomics studies focus on biomarkers between disease and normal groups. <xref ref-type="bibr" rid="B67">Huang et al. (2019a)</xref> conducted metabolomic studies using 1,540 clinical serum and plasma samples, along with 114 clinical tissue samples, to characterize the metabolomic profiles of healthy controls and patients with thyroid nodules, including benign thyroid nodules (BTN) and PTC. Their research identified a group of circulating metabolites&#x2014;myo-inositol, &#x3b1;-N-phenylacetyl-L-glutamine, proline betaine, L-glutamic acid, LysoPC (18:0), and LysoPC (18:1)&#x2014;as potential biomarkers. <xref ref-type="bibr" rid="B72">Jajin et al. (2022)</xref> used GC-MS to perform plasma metabolomics profiling of medullary thyroid cancer (MTC) patients. Results showed that linoleic acid, linolenic acid, and leucine can be used as potential biomarkers for early detection of MTC. These findings provide a basis for the diagnosis and management of thyroid cancer patients from a metabolomics perspective.</p>
<p>Spatially resolved metabolomics integrates MSI and metabolomics technology to accurately measure the types, contents and differential spatial distribution of endogenous or exogenous metabolites in biological tissues and cells and shows great prospect in biomarker discovery of thyroid disease. Jialing <xref ref-type="bibr" rid="B196">Zhang et al. (2017b)</xref> used desorption electrospray ionization mass spectrometry imaging (DESI-MSI) to analyze metastatic thyroid cancer in human lymph node tissues and the results showed that the relative abundance of ceramide and glycerophosphoinositide increased.</p>
<p>
<xref ref-type="bibr" rid="B187">Wojakowska et al. (2018)</xref> used MALDI-MSI to analysis of lipid distribution directly in formalin-fixed tissue. The results showed that the abundance of phosphatidylcholine (32:0, 32:1, 34:1 and 36:3), sphingomyelin (34:1 and 36:1) and phosphatidic acid (36:2 and 36:3) were significantly higher in cancer tissues than them in non-cancer tissues (<xref ref-type="bibr" rid="B187">Wojakowska et al., 2018</xref>).</p>
<p>Luojiao <xref ref-type="bibr" rid="B68">Huang et al. (2019b)</xref> used the air-flow assisted desorption electrospray ionization (AFADESI) MSI to investigated the metabolic characteristics of different microregions of PTC and results showed that phenylalanine, leucine and tyrosine were expressed at the highest levels in tumors, with a trend of gradually decreasing from tumors to stromal tissues and normal tissues, while creatinine was the opposite.</p>
<p>Biomarker discovery can contribute to molecular subtyping in thyroid disease. The integration of MS-based multi-omics is a powerful tool for elucidating complex molecular signatures of various cancer subtypes (<xref ref-type="bibr" rid="B176">Wang et al., 2023b</xref>). This approach not only enhances our understanding of the mechanisms of action of various molecules within cancer but also facilitates more targeted and personalized therapeutic interventions for specific subtypes (<xref ref-type="bibr" rid="B24">Berger and Mardis, 2018</xref>).</p>
<p>
<xref ref-type="bibr" rid="B117">Martinez-Aguilar et al. (2016)</xref> applied DIA MS for quantitative analysis of expression levels for over 1,600 proteins across 32 specimens, discerning differences between normal thyroid tissue and the three prevalent thyroid gland tumors: follicular adenoma, follicular carcinoma, and papillary carcinoma. Proteomic pathway analysis revealed that changes in papillary carcinomas are associated with disruption of cell contacts (loss of E-cadherin), actin cytoskeletal dynamics, and loss of differentiation markers, characteristics of the aggressive phenotype (<xref ref-type="bibr" rid="B117">Martinez-Aguilar et al., 2016</xref>).</p>
<p>
<xref ref-type="bibr" rid="B186">Wojakowska et al. (2015)</xref> used the GC-MS method to extract, identify, and semi-quantitate metabolites in formalin-fixed paraffin-embedded (FFPE) tissue specimens from five different types of thyroid malignancies, benign follicular adenoma and normal thyroid and concluded that multicomponent metabolomic signatures can be used to classify different subtypes of follicular thyroid lesions.</p>
<p>MS-based multi-omics have significantly increased in recent years and enabled mapping of biochemical changes in thyroid disease and hence can provide an opportunity to develop predictive biomarkers that can trigger earlier interventions (<xref ref-type="bibr" rid="B177">Wang et al., 2013</xref>). MS can directly quantify thyroid analytes and its high resolution can enhance the accuracy and detection (<xref ref-type="bibr" rid="B74">Jasem et al., 2024</xref>). Biomarkers of thyroid disease screened out by MS-based proteomics and metabolomics can not only provide a basis for clinical diagnosis, but also provide insights into the biological mechanisms of thyroid disease. It can be used to distinguish different types of thyroid cancer, which is beneficial for classifying benign and malignant cancers for treatment, such as using different dosing strategies, thereby achieving precision medicine.</p>
</sec>
</sec>
<sec id="s3">
<title>3 Classic machine learning models and multi-omics applications in thyroid disease</title>
<p>This section will present several classic machine learning models and offer an overview of how these models contribute to the study of thyroid diseases.</p>
<sec id="s3-1">
<title>3.1 Classic machine learning models in data analysis</title>
<p>Machine learning (ML) is the science of developing algorithms and statistical models, which is a subset of artificial intelligence (<xref ref-type="bibr" rid="B156">Smith et al., 2023</xref>). Computer systems utilize these algorithms and models to perform tasks without explicit instructions, enabling machines to undertake activities requiring human intelligence, such as diagnosis, planning, and prediction, based on established patterns and reasoning (<xref ref-type="bibr" rid="B125">Mohammadzadeh et al., 2024</xref>). In recent years, the exponential growth of biomedical data has driven many applications of ML techniques to address new challenges in biology and clinical research (<xref ref-type="bibr" rid="B13">Auslander et al., 2021</xref>). ML methods are favored in statistical analysis because of their inherent nonlinear data representation and ability to quickly process large datasets (<xref ref-type="bibr" rid="B108">Liebal et al., 2020</xref>). ML algorithms are employed for training, key feature identification, and group classification (<xref ref-type="bibr" rid="B70">Huang et al., 2018</xref>).</p>
<p>Generally, ML can be categorized into four main types: unsupervised, supervised, semi-supervised, and reinforcement learning (<xref ref-type="fig" rid="F3">Figure 3</xref>). Current research in clinical diseases predominantly focuses on unsupervised and supervised learning algorithms, which will be the focus of this review (<xref ref-type="bibr" rid="B138">Perakakis et al., 2018</xref>).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Classification of ML learning algorithms.</p>
</caption>
<graphic xlink:href="fmolb-11-1483326-g003.tif"/>
</fig>
<p>This section examines the role of ML in handling and analyzing the vast and complex datasets generated by MS-based multi-omics approaches. It discusses specific algorithms and techniques for data processing, feature selection, and classification, emphasizing their importance in identifying potential biomarkers and therapeutic targets.</p>
<sec id="s3-1-1">
<title>3.1.1 Unsupervised learning</title>
<p>Unsupervised learning involves using datasets that contain only input data and attempts to find structure in the data by grouping or clustering the data points (<xref ref-type="bibr" rid="B8">Angra and Ahuja, 2017</xref>). Unsupervised learning algorithms are primarily employed for dimensionality reduction, clustering, and association tasks (<xref ref-type="bibr" rid="B11">Arjmand et al., 2022</xref>). Four common unsupervised algorithms include principal component analysis (PCA), t-distributed stochastic neighbor embedding (t-SNE), uniform manifold approximation and projection (UMAP), and hierarchical clustering (HCL).</p>
<sec id="s3-1-1-1">
<title>3.1.1.1 Principal component analysis (PCA)</title>
<p>The complexity of multivariate data often necessitates the use of dimensionality reduction methods to simplify the information. Dimensionality reduction of high-dimensional data plays a crucial role in downstream tasks such as pattern recognition, classification, and clustering (<xref ref-type="bibr" rid="B91">Kim et al., 2018</xref>). Principal component analysis (PCA) is a classic unsupervised dimensionality reduction method that identifies hidden features in data, providing the most significant signals, and is often used in machine learning. (<xref ref-type="bibr" rid="B91">Kim et al., 2018</xref>; <xref ref-type="bibr" rid="B40">Chen and Gao, 2016</xref>; <xref ref-type="bibr" rid="B112">Ma and Dai, 2011</xref>). PCA simplifies complex data and makes the analysis process easier. Essentially, PCA is an &#x201c;unsupervised&#x201d; method that analyzes data purely based on its characteristics, without knowing the grouping of each sample. PCA effectively identifies the &#x201c;main&#x201d; elements and structures in the data, removes noise and redundancy, reduces the dimensionality of complex data, and reveals the simple structure hidden behind the complex data (<xref ref-type="bibr" rid="B161">Sugimoto et al., 2012</xref>). PCA is widely used in MS-based multi-omics data analysis, particularly for data dimensionality and achieving data visualization (<xref ref-type="bibr" rid="B161">Sugimoto et al., 2012</xref>). The results are often visualized using scatter plots.</p>
<p>PCA is commonly applied in clinical analysis to reveal differences between samples, with the distance between samples on the horizontal and vertical axes representing the similarity distance of the samples under the influence of the principal components (PC1 and PC2).</p>
<p>For example, in a single-cell proteomics study of hepatocytes by <xref ref-type="bibr" rid="B150">Rosenberger et al. (2023)</xref>, PCA was used to reduce the dimensionality of proteomics data, resulting in clear hepatocyte partitioning and demonstrating the biological validity of the data. Similarly, <xref ref-type="bibr" rid="B191">Xu et al. (2022)</xref> applied PCA to validate the metabolic profile of mouse liver tissue in a study on the mechanism of action of Huang Qin decoction for treating diabetic liver injury.</p>
<p>PCA is particularly suitable for initial exploratory data analysis, especially when linear relationships are presumed in the data and the interpretability of components is crucial (<xref ref-type="bibr" rid="B19">Beattie and Esmonde-White, 2021</xref>; <xref ref-type="bibr" rid="B71">Ivosev et al., 2008</xref>). It is also preferred in scenarios where computational efficiency is a priority. However, PCA may not adequately capture complex nonlinear interactions present in biological data.</p>
</sec>
<sec id="s3-1-1-2">
<title>3.1.1.2 t-distributed stochastic neighbor embedding (t-SNE)</title>
<p>t-distributed Stochastic Neighbor Embedding (t-SNE) is a nonlinear dimensionality reduction technique primarily designed for data visualization and excels at identifying and discovering complex nonlinear structures in data (<xref ref-type="bibr" rid="B42">Cieslak et al., 2020</xref>). It converts high-dimensional data into a low-dimensional space, typically two or three dimensions while preserving the local structure of the data (<xref ref-type="bibr" rid="B42">Cieslak et al., 2020</xref>; <xref ref-type="bibr" rid="B44">Da Silva Lopes et al., 2020</xref>). t-SNE focuses on preserving the relative distances between similar data points, making it effective for revealing clusters and patterns (<xref ref-type="bibr" rid="B35">Chatzimparmpas et al., 2020</xref>).</p>
<p>In the study by <xref ref-type="bibr" rid="B107">Liang et al. (2022)</xref>, 1,681 proteins were analyzed through proteomics in 258 HCM patients. t-SNE was utilized to visualize and reduce the dimensionality of the data, revealing that the four molecular subtypes were well separated.</p>
<p>t-SNE is ideal for visualizing small to medium-sized datasets where the primary goal is to understand and explore local structures and clustering. It is particularly suitable for high-dimensional data with complex, nonlinear relationships (<xref ref-type="bibr" rid="B57">Gisbrecht et al., 2015</xref>). However, it is relatively slow, especially when applied to large datasets.</p>
</sec>
<sec id="s3-1-1-3">
<title>3.1.1.3 Uniform manifold approximation and projection (UMAP)</title>
<p>Uniform manifold approximation and projection (UMAP), an algorithm developed by McInnes et al., is a nonlinear dimensionality reduction technique (<xref ref-type="bibr" rid="B110">Lundberg and Lee, 2017</xref>). It is another nonlinear dimensionality reduction method particularly effective at preserving both local and some global structures of the data (<xref ref-type="bibr" rid="B21">Becht et al., 2018</xref>; <xref ref-type="bibr" rid="B193">Yang et al., 2021</xref>). UMAP is based on manifold learning techniques and constructs a high-dimensional graph representation of the data, which is subsequently optimized to create a low-dimensional embedding (<xref ref-type="bibr" rid="B119">McInnes et al., 2018</xref>).</p>
<p>Like t-SNE, UMAP is also effective in capturing complex nonlinear relationships in the data. In general, UMAP is faster and more scalable than t-SNE and it better preserves both local and global structures.</p>
<p>UMAP is preferred for large datasets requiring a balance between local and global structure preservation (<xref ref-type="bibr" rid="B151">Sainburg et al., 2021</xref>). It is effective for visualizing complex data structures and works well for high-dimensional data (<xref ref-type="bibr" rid="B21">Becht et al., 2018</xref>). Compared to PCA, this method is more complex and can be challenging to understand and debug. Although UMAP is faster than t-SNE, it still requires significant computational resources for very large datasets (<xref ref-type="bibr" rid="B149">Roca et al., 2023</xref>).</p>
</sec>
<sec id="s3-1-1-4">
<title>3.1.1.4 Hierarchical clustering (HCL)</title>
<p>A crucial component of unsupervised learning is the clustering algorithm. Traditionally, cluster analysis is classified as unsupervised learning because it does not involve class labels or quantitative response variables, which are characteristic of supervised learning methods such as classification and regression (<xref ref-type="bibr" rid="B135">Pan et al., 2013</xref>). Cluster analysis is a series of different algorithms that divide observation data into different categories or clusters based on distance functions (<xref ref-type="bibr" rid="B26">Blekherman et al., 2011</xref>). The goal is to partition the data into groups such that the distance between samples within each group is smaller than the distance between samples in different groups (<xref ref-type="bibr" rid="B26">Blekherman et al., 2011</xref>). Hierarchical clustering (HCL) is a clustering method frequently used in marker screening and enables visualization of gene, protein, and metabolite features (<xref ref-type="bibr" rid="B139">Picard et al., 2023</xref>; <xref ref-type="bibr" rid="B59">Granato et al., 2018</xref>). The results of HCL are commonly visualized using heatmaps.</p>
<p>In biomedical informatics, HCL is often applied to cluster protein sequence data. Proteins with similar structures also have similar functions. Proteins with similar functions can be grouped into categories through clustering, aiding in the study of protein functions. In clinical analysis, hierarchical clustering is utilized to intuitively display relationships between groups and highlights expression differences of characteristic substances.</p>
<p>In the study of MS-based urine proteomics of gastric lesions by <xref ref-type="bibr" rid="B51">Fan et al. (2022)</xref>, HCL was used to partition 139 differential proteins with VIP&#x3e;1 into six clusters, revealing dynamic changes from precancerous lesions dynamic changes in gastric cancer.</p>
<p>In an MS-based metabolomics study of cancer cell lines by <xref ref-type="bibr" rid="B101">Li et al. (2019)</xref>, HCL was employed to assess metabolic similarities between cell lines.</p>
<p>For MS-based spatial proteomics, dimensionality reduction and clustering methods such as PCA, t-SNE and HCL are effective for quality control of MS-based spatial proteomic data and for examining organelle separation (<xref ref-type="bibr" rid="B66">Huang et al., 2022</xref>; <xref ref-type="bibr" rid="B84">Karimpour-Fard et al., 2015</xref>; <xref ref-type="bibr" rid="B126">Mou et al., 2022</xref>; <xref ref-type="bibr" rid="B147">Ringner, 2008</xref>).</p>
</sec>
</sec>
<sec id="s3-1-2">
<title>3.1.2 Supervised learning</title>
<p>Supervised learning relies on labeled datasets to train algorithms on a predefined classification system and to infer the functional relationship between input features and output labels based on this training. The algorithm learns a function from the training dataset that enables prediction of outcomes for new data. In essence, supervised learning involves determining whether the objective is to predict outcomes based on known input-output pairs. A significant category within supervised learning is classification problems. In the classification problems, the target variables are discrete rather than continuous. Examples include tumor size, patient age, and the benign or malignant status of the tumor.</p>
<p>The process of model training with ML algorithms involves three steps: data splitting, parameter estimation using the training set, and performance evaluation using the test set.<list list-type="simple">
<list-item>
<p>a. Data Splitting</p>
</list-item>
</list>
</p>
<p>Typically, the dataset used to train a ML model is divided into a training set and a test set, with a common ratio of 70:30 (<xref ref-type="bibr" rid="B55">Galal et al., 2022</xref>). A validation set is often included for model performance evaluation and hyperparameter tuning, ensuring optimal results under the given data conditions. In this scenario, the data can be divided into 60% training, 20% validation, and 20% test sets (<xref ref-type="bibr" rid="B55">Galal et al., 2022</xref>).<list list-type="simple">
<list-item>
<p>b. Parameter Estimation Using Training Data</p>
</list-item>
</list>
</p>
<p>Parameter estimation is a critical step in model training. The goal of using training set to estimate model parameters is to create a model that accurately captures the underlying information in the data so that it can make reliable predictions about new data.<list list-type="simple">
<list-item>
<p>c. Comprehensive Evaluation Using Test Data</p>
</list-item>
</list>
</p>
<p>The test set evaluates the overall performance of the final model. After final parameter adjustments, the test set is used to evaluate the performance of the model comprehensively, assessing for issues such as overfitting or underfitting. If no issues are identified, the model can be applied to the project.</p>
<p>Common supervised algorithms include partial least squares discriminant analysis (PLS-DA), decision trees (DTs), random forest (RF), support vector machine (SVM), K-Nearest Neighbor (kN), and eXtreme Gradient Boosting (XGBoost).</p>
<sec id="s3-1-2-1">
<title>3.1.2.1 partial least squares discriminant analysis (PLS-DA)</title>
<p>Partial least squares discriminant analysis (PLS-DA) is also a dimensionality reduction algorithm. Unlike PCA, PLS is a &#x201c;supervised&#x201d; mode of partial least squares analysis, meaning that the grouping relationships of the samples are known, allowing for better selection of characteristic variables that distinguish each group and determination of relationships between the samples. DA stands for discriminant analysis. PLS-DA employs the partial least squares regression method to &#x201c;reduce the dimensionality&#x201d; of the data, establish a regression model, and conduct discriminant analysis on the regression results. PLS-DA is particularly suitable for selecting and interpreting metabolite signatures when studying biological systems (<xref ref-type="bibr" rid="B43">D&#x27;Andrea et al., 2023</xref>).</p>
<p>In an MS-based urine proteomics study of gastric lesions by <xref ref-type="bibr" rid="B51">Fan et al. (2022)</xref>, PLS-DA was used to analyze the proteomics data of different groups and screen out 139 differential proteins with VIP&#x3e;1.</p>
<p>In the study by <xref ref-type="bibr" rid="B43">D&#x27;Andrea et al. (2023)</xref>, the PLS-DA model was confirmed through cross-validation, and the average variable importance in projection (VIP) score was used to identify metabolites that differed among sample classes.</p>
</sec>
<sec id="s3-1-2-2">
<title>3.1.2.2 Decision trees (DTs)</title>
<p>Decision trees (DTs) employ ML techniques to address classification and prediction problems. Nodes and leaves are the primary elements that form a decision tree (<xref ref-type="bibr" rid="B36">Chaubey et al., 2020</xref>). Nodes test specific properties, and leaves represent a class (<xref ref-type="bibr" rid="B120">Mesari&#x107; and &#x160;ebalj, 2016</xref>). Common decision trees include the ID3 tree, the C4.5 tree (information gain rate), and the CART tree (Gini coefficient) (<xref ref-type="bibr" rid="B80">Ross, 1993</xref>; <xref ref-type="bibr" rid="B99">Leo et al., 1984</xref>).</p>
<p>The ID3 algorithm is one of the classic decision tree algorithms. The C4.5 algorithm is an improvement upon the ID3 algorithm and can handle discontinuous features (<xref ref-type="bibr" rid="B129">Navada et al., 2011</xref>). The ID3 and the C4.5 algorithm are primarily used to address classification problems, but cannot be used to apply regression problems (<xref ref-type="bibr" rid="B155">Singh and Giri, 2014</xref>). The CART algorithm can manage both classification and regression problems.</p>
<p>
<xref ref-type="bibr" rid="B53">Fannes et al. (2013)</xref> introduced CP-DT (Decision Tree Cleavage Prediction), an algorithm based on an ensemble of decision trees trained on publicly available peptide identification data from the PRIDE database. The study demonstrated that CP-DT can accurately predict trypsin cleavage (<xref ref-type="bibr" rid="B53">Fannes et al., 2013</xref>).</p>
<p>Decision tree algorithms are fast, however, they are generally not as accurate as other models.</p>
</sec>
<sec id="s3-1-2-3">
<title>3.1.2.3 Random forest (RF)</title>
<p>Random forest (RF) is a regression tree technique that employs bootstrap aggregation and predictor randomization to achieve a degree of predictive accuracy (<xref ref-type="bibr" rid="B160">Steven, 2017</xref>). Proposed by Breiman in 2001, RF employs randomization to create numerous decision trees and is a widely used tool for classification and regression in bioinformatics and related fields (<xref ref-type="bibr" rid="B160">Steven, 2017</xref>; <xref ref-type="bibr" rid="B73">Janitza et al., 2016</xref>). Compared to a single decision tree, a random forest exhibits stronger generalization performance. In classification problems, the outputs of these decision trees are voted and aggregated into one output; in regression problems, they are averaged and aggregated into one output (<xref ref-type="bibr" rid="B160">Steven, 2017</xref>). RF classification is a widely used supervised learning method for developing predictive models in many research settings (<xref ref-type="bibr" rid="B159">Speiser et al., 2019</xref>).</p>
<p>The random forest algorithm is simple and easy to implement, applicable to both classification and regression problems (<xref ref-type="bibr" rid="B160">Steven, 2017</xref>). It has the following features.<list list-type="simple">
<list-item>
<p>a. It can handle numerous input variables, and the more data features present, the more stable the model (<xref ref-type="bibr" rid="B23">Belgiu and Dr&#x103;gu&#x163;, 2016</xref>).</p>
</list-item>
<list-item>
<p>b. It can evaluate feature importance while determining the category (<xref ref-type="bibr" rid="B9">Archer and Kimes, 2008</xref>; <xref ref-type="bibr" rid="B90">Khalilia et al., 2011</xref>).</p>
</list-item>
<list-item>
<p>c. It can estimate valuable data and maintain a certain degree of accuracy even when a significant portion of the data is missing.</p>
</list-item>
</list>
</p>
<p>
<xref ref-type="bibr" rid="B90">Khalilia et al. (2011)</xref> utilized National Inpatient Sample (NIS) data from the Healthcare Cost and Utilization Project (HCUP) to train RF classifiers for predicting eight disease categories. The results demonstrated good performance (<xref ref-type="bibr" rid="B90">Khalilia et al., 2011</xref>).</p>
<p>However, RF does not perform as well for regression problems as it does for classification and may not produce good classification results for small or low-dimensional datasets (datasets with fewer features).</p>
</sec>
<sec id="s3-1-2-4">
<title>3.1.2.4 Support vector machine (SVM)</title>
<p>Support vector machine (SVM) is a supervised algorithm that learns from examples to assign labels to objects (<xref ref-type="bibr" rid="B28">Boser et al., 1992</xref>). Compared to other ML methods, SVM is highly effective at identifying subtle patterns in complex data sets (<xref ref-type="bibr" rid="B12">Aruna and SP, 2011</xref>). The purpose of SVM is to create a decision boundary between two categories, facilitating the prediction of a label based on one or more feature vectors (<xref ref-type="bibr" rid="B188">WS, 2006</xref>). This decision boundary, called a hyperplane, should be oriented as far away as possible from the nearest data point for each class, referred to a support vector (<xref ref-type="bibr" rid="B70">Huang et al., 2018</xref>).</p>
<p>The computational complexity of SVM depends on the number of support vectors rather than the dimension of the sample space, thereby avoiding the &#x201c;curse of dimensionality&#x201d; (<xref ref-type="bibr" rid="B114">Markowetz, 2001</xref>). However, SVM is sensitive to missing data and is difficult for solving multi-classification problems (<xref ref-type="bibr" rid="B33">Cervantes et al., 2020</xref>). In areas where SVM performs poorly, researchers have developed other applications such as SVM for large datasets, multiple classifications, and imbalanced datasets (<xref ref-type="bibr" rid="B33">Cervantes et al., 2020</xref>).</p>
<p>
<xref ref-type="bibr" rid="B118">Mavrogeorgis et al. (2023)</xref> obtained urine peptide data of 1850 healthy controls (HC) and CKD (diabetic nephropathy-DKD, IgA nephropathy-IgAN, vasculitis) participants from the Human Urine Proteome Database. UMAP was combined with SVM for binary (DKD, HC) and multi-class (DKD, HC, IgAN, vasculitis) classification.</p>
</sec>
<sec id="s3-1-2-5">
<title>3.1.2.5 K-Nearest neighbor (k-NN)</title>
<p>K-Nearest Neighbor (k-NN) is a simple and practical supervised learning algorithm frequently used to deal with classification problems (<xref ref-type="bibr" rid="B27">Boateng et al., 2020</xref>). It examines the k nearest sample points closest to the new sample point in the training set, using a specific distance metric, and classifies the new sample point into the category with the most occurrences among the k sample points (<xref ref-type="bibr" rid="B2">Abu Alfeilat et al., 2019</xref>). The parameter k is crucial, and its value should be optimally chosen (<xref ref-type="bibr" rid="B195">Zhang et al., 2017a</xref>). A value that is too low will increase the error rate, while a value that is too high can render the model ineffective (<xref ref-type="bibr" rid="B196">Zhang et al., 2017b</xref>).</p>
<p>The algorithm is simple in principle, easy to understand and implement, applicable to multi-classification problems, and requires no additional processing (<xref ref-type="bibr" rid="B36">Chaubey et al., 2020</xref>). However, k-NN involves substantial computational effort and requires considerable memory resources. Its performance is influenced by the parameter k and it tends to perform poorly on unbalanced datasets.</p>
</sec>
<sec id="s3-1-2-6">
<title>3.1.2.6 eXtreme gradient boosting (XGBoost)</title>
<p>eXtreme Gradient Boosting (XGBoost) is a machine learning model built on a decision tree ensemble and is among the most widely used machine learning algorithms (<xref ref-type="bibr" rid="B85">Kavzoglu and Teke, 2022</xref>). The algorithm has the following features: <list list-type="simple">
<list-item>
<p>a. It excels in processing both structured and unstructured data, frequently achieving higher accuracy compared to other algorithms (<xref ref-type="bibr" rid="B10">Arif Ali et al., 2023</xref>).</p>
</list-item>
<list-item>
<p>b. It relies on on decision tree integration, offers excellent interpretability, and provides insights into the importance of each feature (<xref ref-type="bibr" rid="B85">Kavzoglu and Teke, 2022</xref>).</p>
</list-item>
<list-item>
<p>c. It employs parallel computing technology and demonstrates high computational efficiency in processing large-scale data (<xref ref-type="bibr" rid="B128">Nalluri et al., 2020</xref>).</p>
</list-item>
</list>
</p>
<p>
<xref ref-type="bibr" rid="B106">Li et al. (2024)</xref> developed a model incorporating 17 feature variables using XGBoost, based on the multidimensional data from a retrospective cohort of 274 papillary thyroid carcinoma (PTC) patients. This model demonstrated strong predictive performance in differentiating between low-risk and medium/high-risk PTC cases and was designated as the PTC Preoperative Risk Assessment Classifier (PRAC-PTC).</p>
<p>However, it is sensitive to parameters settings, with the choice of parameters significantly influencing the results (<xref ref-type="bibr" rid="B46">Demir and &#x15e;ahin, 2022</xref>). In some cases, XGBoost may be overly complex and prone to overfitting the training data.</p>
</sec>
</sec>
</sec>
<sec id="s3-2">
<title>3.2 Applications of machine learning in MS-based multi-omics in thyroid disease</title>
<sec id="s3-2-1">
<title>3.2.1 Applications in MS-based multi-omics data analysis</title>
<p>Extracting valuable insights from MS-based multi-omics data presents a significant challenge in bioinformatics (<xref ref-type="bibr" rid="B166">Tang et al., 2019</xref>). The complexity and high dimensionality of MS-based multi-omics datasets make traditional analysis methods challenging (<xref ref-type="bibr" rid="B95">Krassowski et al., 2020</xref>). Combining ML methods with MS-based multi-omics analysis mainly involves integrating various ML techniques to manage the complexity and volume of multi-omics data, aiming to enhance both accuracy and interpretability.</p>
<sec id="s3-2-1-1">
<title>3.2.1.1 Missing data imputation</title>
<p>Missing data refers to the situation where data is incomplete due to some reasons during the process of data collection, transmission, and processing (<xref ref-type="bibr" rid="B49">Du et al., 2020</xref>). It is a common problem in MS-based omics data analysis (<xref ref-type="bibr" rid="B69">Huang et al., 2023</xref>). The simplest way to deal with missing values is to remove samples with missing values. However, if there are many missing values, such as the missing data of LC-MS-based omics data may be in the range of 30%&#x2013;50%, a large number of samples will be eliminated, resulting in the loss of more useful information (<xref ref-type="bibr" rid="B108">Liebal et al., 2020</xref>).</p>
<p>Imputation methods provide an alternative way of handling missing data rather than discarding missing values and associated data (<xref ref-type="bibr" rid="B69">Huang et al., 2023</xref>). The mean, median, mode, etc., of the feature can be used to fill the missing values (<xref ref-type="bibr" rid="B50">Emmanuel et al., 2021</xref>). However, these simple methods do not consider the relationship between data variables, which sometimes makes the results of data analysis unreliable. Among the methods for dealing with missing values, many other filling methods consider the relationship between data variables (<xref ref-type="bibr" rid="B17">Baraldi and Enders, 2010</xref>). ML algorithms, such as regression, k-NN, and RF, can help resolve missing data problems in multi-omics datasets by inferring values based on observed patterns in existing data (<xref ref-type="bibr" rid="B50">Emmanuel et al., 2021</xref>; <xref ref-type="bibr" rid="B123">Mirza et al., 2019</xref>).</p>
</sec>
<sec id="s3-2-1-2">
<title>3.2.1.2 Dimensionality reduction</title>
<p>MS-based multi-omics data may have multiple layers of variables and a large number of attributes, so-called high-dimensional data (<xref ref-type="bibr" rid="B11">Arjmand et al., 2022</xref>). While high-dimensional data will cause great trouble for subsequent data processing (<xref ref-type="bibr" rid="B31">Cao and Lin, 2015</xref>), dimensionality reduction is a crucial step (<xref ref-type="bibr" rid="B52">Fanaee and Thoresen, 2019</xref>). It aims to reduce the number of variables considered, making the data more manageable and easier to analyze while retaining as much information as possible. Before applying dimensionality reduction, multi-omics data need to be preprocessed, such as normalization and missing value filling, to ensure that the data is in a form suitable for analysis (<xref ref-type="bibr" rid="B146">Reska et al., 2021</xref>). Dimensionality reduction improves computational efficiency, reduces noise while retaining important information, facilitating data processing (<xref ref-type="bibr" rid="B5">Alhassan and Wan Zainon, 2021</xref>). Many ML algorithms can facilitate data processing by reducing data dimensionality while retaining important information, such as PCA, t-SNE, PLS-DA, and UMAP.</p>
</sec>
<sec id="s3-2-1-3">
<title>3.2.1.3 Clustering and classification</title>
<p>Clustering is an unsupervised learning method that groups data based on the attributes of the input features (<xref ref-type="bibr" rid="B144">Reel et al., 2021</xref>). Classification is a supervised learning method that provides predicted output as a discrete class (<xref ref-type="bibr" rid="B144">Reel et al., 2021</xref>). ML algorithms can group samples into clusters or classify them based on distinct patterns present in multi-omics data which can discover subtypes or stratify patients and identify similarities among clustered patients (<xref ref-type="bibr" rid="B58">Goecks et al., 2020</xref>).</p>
</sec>
<sec id="s3-2-1-4">
<title>3.2.1.4 Feature selection</title>
<p>Feature selection is a key step in multi-omics analysis and helps reduce data dimensionality. In this sense, feature selection has similar motivations to dimensionality reduction as described above. Feature selection can remove irrelevant features and reduce the number of features used in the analysis, thereby reducing the difficulty of the learning task (<xref ref-type="bibr" rid="B102">Li et al., 2017a</xref>). It should be noted that the feature selection process must ensure that no important features are lost.</p>
<p>For a multi-omics dataset, a set of attributes is included, some of them may be critical and useful, while others may be useless. Attributes are called features, those that are useful for the current learning task are called relevant features, and those that are useless are called irrelevant features (<xref ref-type="bibr" rid="B93">Kotsiantis, 2011</xref>). The process of selecting a subset of relevant features from a given set of features is called feature selection (<xref ref-type="bibr" rid="B79">Jovi&#x107; et al., 2015</xref>).</p>
<p>Feature selection is an important data preprocessing process. In real machine learning tasks, feature selection is usually performed after obtaining multi-omics data, and then the learner is trained.</p>
<p>In practical applications, feature selection methods are mainly divided into filter, wrapper, and embedded methods (<xref ref-type="bibr" rid="B170">Venkatesh and Anuradha, 2019</xref>).<list list-type="simple">
<list-item>
<p>a. Filter Selection</p>
</list-item>
</list>
</p>
<p>Filter selection first selects features from the data set and then trains the learner (<xref ref-type="bibr" rid="B102">Li et al., 2017a</xref>). The feature selection process is independent of the subsequent learner. It is the simplest and most commonly used method to implement feature selection. The core of the filtering method selection is to sort the features according to their value, to achieve the selection or elimination of any proportion/quantity of features.</p>
<p>Filter selection is computationally efficient and relatively simple to implement, but it ignores the interactions between features (<xref ref-type="bibr" rid="B81">Jiliang et al., 2014</xref>).<list list-type="simple">
<list-item>
<p>b. Wrapper Selection</p>
</list-item>
</list>
</p>
<p>Unlike filter-based feature selection, which does not consider subsequent learners, wrapper selection directly uses the performance of the most important learner as the evaluation criterion for the feature subset (<xref ref-type="bibr" rid="B171">Wald et al., 2013</xref>; <xref ref-type="bibr" rid="B29">Cadenas et al., 2013</xref>).</p>
<p>Since wrapper selection directly optimizes a given learner, it is better than filter selection in terms of the final learner performance (<xref ref-type="bibr" rid="B29">Cadenas et al., 2013</xref>). However, since the learner needs to be trained multiple times during the feature selection process, it requires a huge amount of computation.<list list-type="simple">
<list-item>
<p>c. Embedded selection</p>
</list-item>
</list>
</p>
<p>Embedded selection integrates the feature selection process with the learner training process, that is, feature selection is automatically performed during the learner training process (<xref ref-type="bibr" rid="B105">Li et al., 2017b</xref>). The most commonly used are tree models and a series of ensemble algorithms based on tree models because the model provides important information about feature importance.</p>
<p>Embedded selection combines the advantages of filter selection and wrapper selection in terms of computational cost and performance, but it cannot identify highly relevant features (<xref ref-type="bibr" rid="B145">Remeseiro and Bolon-Canedo, 2019</xref>).</p>
</sec>
</sec>
<sec id="s3-2-2">
<title>3.2.2 Applications in clinical researches</title>
<p>The contribution of ML to thyroid disease is not only in processing data, but also in the classification, clinical diagnosis, treatment, prognosis and risk stratification of thyroid diseases. In clinical researches, ML is beneficial and essential (<xref ref-type="bibr" rid="B92">Komuro et al., 2023</xref>). ML enables efficient analysis of extensive data sets and improve disease diagnosis and classification by building predictive models of disease, and has a particularly important impact on improving MS-based clinical multi-omics research (<xref ref-type="bibr" rid="B138">Perakakis et al., 2018</xref>; <xref ref-type="bibr" rid="B11">Arjmand et al., 2022</xref>). ML models primarily select important features from complex data to construct predictive models and output data as predictive labels based on identified patterns (<xref ref-type="bibr" rid="B131">Ngan et al., 2023</xref>). Using models like decision trees, RF, SVM, and XGBoost to predict outcomes based on data facilitates predictive models, including disease diagnosis, prognosis, and treatment, based on multi-omics data (<xref ref-type="bibr" rid="B142">Quazi, 2022</xref>; <xref ref-type="bibr" rid="B183">Wekesa and Kimwele, 2023</xref>). Validation and evaluation are critical steps in ML for multi-omics analysis to ensure that the models and methods used are reliable and robust. There are several approaches:</p>
<p>Cross-Validation: Use k-fold cross-validation to assess model performance.</p>
<p>External Validation: Validate results with independent datasets to ensure robustness.</p>
<p>Performance Metrics: Use appropriate metrics to evaluate the model (e.g., accuracy, precision, recall, area under curve (AUC), F1-score for classification; R 2, RMSE for regression).</p>
<p>The trained and validated ML models are expected to be able to assess cancer risk and facilitate the development of preoperative cancer diagnosis (<xref ref-type="bibr" rid="B131">Ngan et al., 2023</xref>).</p>
<sec id="s3-2-2-1">
<title>3.2.2.1 Diagnosis and classification</title>
<p>The classification model is the most commonly used type of ML models in clinical researches which can output the type of thyroid disease it predicts based on the input features, such as clinical factors and omics data, thereby providing insights into clinical diagnosis (<xref ref-type="fig" rid="F4">Figure 4</xref>). For thyroid disease prediction, ML methods have been applied in various existing research works. Prediction of thyroid disease at its early stages and categorization into cancer or other thyroid disease is very helpful for treating and recovering the maximum number of patients (<xref ref-type="bibr" rid="B63">Gupta et al., 2024</xref>). MS-based multi-omics have become a powerful technique for biomarker discovery which is significant for clinic (<xref ref-type="bibr" rid="B168">Torun et al., 2022</xref>). However, screening biomarkers from complex MS data requires reliable bioinformatics tools and ML can be a good choice (<xref ref-type="bibr" rid="B168">Torun et al., 2022</xref>). Analyzing large and complex datasets by ML models enables the identification of subtle biomarkers and disease signatures, which leads to earlier and more accurate diagnoses (<xref ref-type="bibr" rid="B130">Ng et al., 2023</xref>). This is particularly beneficial in complex diseases specially cancer, where early detection can significantly improve prognosis. The integration of ML and MS-based multi-omics not only improves the efficiency of biomarker discovery but also helps develop more accurate and reliable diagnostic tools, ultimately advancing the field of precision medicine and improving patient outcomes (<xref ref-type="bibr" rid="B77">Johnson et al., 2021</xref>; <xref ref-type="bibr" rid="B96">Krishnan et al., 2023</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>The workflow of ML for data processing and modeling.</p>
</caption>
<graphic xlink:href="fmolb-11-1483326-g004.tif"/>
</fig>
<p>From the perspective of classification, existing researches mainly focused on binary classification problems in thyroid disease classification based on ML models. <xref ref-type="bibr" rid="B97">Kumari et al. (2024)</xref> used age, gender, and hormone levels as features and combined them with 3 ML models to classify hyperthyroidism and hypothyroidism. Results showed that XGBoost was the top-performing model for this task (<xref ref-type="bibr" rid="B97">Kumari et al., 2024</xref>).</p>
<p>
<xref ref-type="bibr" rid="B6">Al-muwaffaq and Bozkus (2016)</xref> developed the Machine Learning tool for Thyroid Disease Diagnosis (MLTDD) mainly focused on thyroid gland medical diseases caused by underactive or overactive thyroid glands. The prediction accuracy was in range between 98.7% and 99.8% for testing. MLTDD can effectively help to make the right clinical decision.</p>
<p>
<xref ref-type="bibr" rid="B189">Xi et al. (2022)</xref> constructed 6 ML models to predict the malignancy of thyroid nodules. RF and Gradient Boosting Machine (GBM) showed better overall diagnostic accuracy and ability to identify malignant nodules. Their method can be used as additional evidence in the preoperative diagnosis of thyroid cancer.</p>
<p>
<xref ref-type="bibr" rid="B62">Guo et al. (2022b)</xref> constructed a diagnostic model of benign and malignant thyroid tumors. The benign group contained 5 thyroid diseases and the malignant group contained six thyroid diseases. Clinical factors were used as features and RF, XGBoost, LightGBM, and AdaBoost models were constructed. RF model showed the best performance. Their research proposed a model incorporating novel biomarkers which could be a powerful and promising tool for predicting benign and malignant thyroid tumors (<xref ref-type="bibr" rid="B62">Guo et al., 2022b</xref>).</p>
<p>Recently, some researches have begun to focus on multi-classes classification problems. <xref ref-type="bibr" rid="B34">Chaganti et al. (2022)</xref> used ML models to predict five thyroid diseases. Results showed that the extra tree classifier-based selected feature yields the best results with 0.99 accuracy and an F1 score when used with the RF classifier (<xref ref-type="bibr" rid="B34">Chaganti et al., 2022</xref>).</p>
<p>
<xref ref-type="bibr" rid="B63">Gupta et al. (2024)</xref> used ML models to predict ten thyroid diseases. Results suggested that an accuracy of 0.998 can be obtained using the optimized AdaBoost model by differential evolution (<xref ref-type="bibr" rid="B63">Gupta et al., 2024</xref>). These researches applied ML models to a variety of thyroid diseases, which helped to diagnose diseases more conveniently and comprehensively in clinical practice.</p>
<p>ML models can not only be used to classify the types of thyroid disease, but also to determine whether there is a certain gene mutation in the disease. <xref ref-type="bibr" rid="B98">Kwon et al. (2020)</xref> used ML models combined with radiomics to predict the presence or absence of B-Raf proto-oncogene, serine/threonine kinase (BRAF) mutation in PTC and the results showed that the classification accuracy of these models was higher than 60%. Although this research provided a new perspective of application of ML in thyroid disease which focused on the gene mutation, the classification model did not show excellent performance in predicting the presence of BRAF mutation in PTC and need to be further validated in a larger dataset to better assess their potential clinical use.</p>
<p>In addition, ML models can also be used to predict treatment trends and prognosis. <xref ref-type="bibr" rid="B14">Aversano et al. (2021)</xref> combined ten different ML models with parameters related to the person being treated to predict whether the LT4-based treatment needs to be increased or decreased for the patients with hypothyroidism. This study provides reference insights for clinical treatment plans.</p>
<p>
<xref ref-type="bibr" rid="B175">Wang et al. (2024a)</xref> presented ML models based on comprehensive predictors to predict the structural recurrence risk of PTC patients. All the patients were treated with thyroid surgery and radioiodine. Twenty-nine perioperative variables consisting of four dimensions (demographic characteristics and comorbidities, tumor-related variables, lymph node-related variables, and metabolic and inflammatory markers) were analyzed (<xref ref-type="bibr" rid="B175">Wang et al., 2024a</xref>). The results showed that the RF model achieved the expected prediction effect, with good discrimination, calibration, and interpretability, and revealed the potential of ML models in improving the accuracy of risk stratification of PTC patients (<xref ref-type="bibr" rid="B175">Wang et al., 2024a</xref>).</p>
<p>It is also an important task for ML models to classify clinical patient samples based on MS-based multi-omics data. In many cases, it can be used to determine which ion m/z values contribute most to the models, thereby facilitating the identification of biomarkers and further facilitating the diagnosis and classification of thyroid disease (<xref ref-type="bibr" rid="B22">Beck et al., 2024</xref>). Recently, an increasing number of researches have focused on combining ML with MS data for thyroid disease classification, even for further treatment strategies, which have provided broader prospect.</p>
<p>
<xref ref-type="bibr" rid="B163">Sun et al. (2022)</xref> proposed the first protein-based neural network classifier for thyroid nodules. Their research was the first to establish a deep proteome data repository for various thyroid lesions, analyzed a larger sample size and obtained deeper proteome coverage (<xref ref-type="bibr" rid="B163">Sun et al., 2022</xref>). The large-scale thyroid proteome map combined with the neural network model demonstrated the power of the classifier and is expected to be quickly applied to clinical practice to supplement the deficiencies of traditional cytopathology (<xref ref-type="bibr" rid="B163">Sun et al., 2022</xref>). Their recent work (<xref ref-type="bibr" rid="B164">Sun et al., 2024</xref>) established a protein-based model with targeted MS for the diagnosis of FTC and FTA. This model used 24 proteins filtered by XGBoost as features and performed better than gene-based model. The protein model has 95.7% negative predictive value for ruling out malignant nodules (<xref ref-type="bibr" rid="B164">Sun et al., 2024</xref>).</p>
<p>
<xref ref-type="bibr" rid="B178">Wang et al. (2022b)</xref> develop a rapid classification method by ML and MS-based metabolomics to diagnose PTC. The metabolomics of frozen samples were performed by probe electrospray ionization (PESI) mass and SVM and RF models were used. For the classification of PTC from PTC adjacent tissues, SVM performed better than RF. Their another work developed a rapid method to classify the malignant and benign thyroid nodules by PESI-MS-based machine learning (<xref ref-type="bibr" rid="B179">Wang et al., 2022c</xref>). For each FNAB sample, only 10 min is needed to determine its malignancy, which is much easier and faster than traditional diagnosis (<xref ref-type="bibr" rid="B179">Wang et al., 2022c</xref>).</p>
<p>
<xref ref-type="bibr" rid="B39">Chen et al. (2024)</xref> explored the potential of rapid thyroid disease screening using the ZrMOF/Au-assisted LDI-MS platform, enabling rapid screening of malignant thyroid disease from benign patients. The authors constructed a panel of 43 key metabolites as features for ML models to discriminate thyroid cancer from thyroid nodules and NN, RF, LR, and SVM models were used for classification (<xref ref-type="bibr" rid="B39">Chen et al., 2024</xref>). The results showed that NN had the best classification performance.</p>
<p>
<xref ref-type="bibr" rid="B202">Zhu et al. (2024)</xref> combined ML with MS-based proteomics and selected four proteins as features with the highest contributions to predict the efficacy of iodine therapy. This research showed the ability to pre-identify PTC patients who are resistant to radioactive iodine therapy (<xref ref-type="bibr" rid="B202">Zhu et al., 2024</xref>).</p>
<p>The above articles were retrieved by entering &#x201c;machine learning&#x201d; and &#x201c;thyroid disease&#x201d; in Google Scholar and some representative ones involving &#x201c;application of ML in diagnosis of thyroid disease&#x201d; were selected by us. We showed them in <xref ref-type="table" rid="T1">Table 1</xref> in the order we mentioned in this section with three summary measures, sample types, features, and supervised ML models.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Applications of machine learning in diagnosis of thyroid disease.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">References</th>
<th align="center">Year</th>
<th align="center">Sample types</th>
<th align="center">Features</th>
<th align="center">Supervised ML models</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">
<xref ref-type="bibr" rid="B63">Gupta et al. (2024)</xref>
</td>
<td align="center">2024</td>
<td align="center">Concurrent Non-thyroid Illness, Compensated Hypothyroid, Increased Binding Protein, Primary Hypothyroid, etc</td>
<td align="center">not given</td>
<td align="center">RF, SVM, LR, ADA, GBM, CNN, RNN, LSTM</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B97">Kumari et al. (2024)</xref>
</td>
<td align="center">2024</td>
<td align="center">Hyperthyroidism and Hypothyroidism</td>
<td align="center">age, sex, pregnancy, T3, T4, and TSH</td>
<td align="center">RF, SVM, XGB</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B6">Al-muwaffaq and Bozkus (2016)</xref>
</td>
<td align="center">2016</td>
<td align="center">Hyperthyroidism, Hypothyroidism and normal function of the thyroid gland</td>
<td align="center">age, sex, on_thyroxine, query_on_thyroxine, on_antithyroid_medication, sick, pregnant, TSH, T3, T4, T4U, FTIetc.</td>
<td align="center">DT</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B189">Xi et al. (2022)</xref>
</td>
<td align="center">2022</td>
<td align="center">Thyroid Cancer</td>
<td align="center">demographic information, ultrasound features, and blood test results</td>
<td align="center">RF, SVM, LR, LDA, GBM</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B62">Guo et al. (2022b)</xref>
</td>
<td align="center">2022</td>
<td align="center">Benign and Malignant Thyroid Tumors</td>
<td align="center">Peripheral blood indicators, BRAFV600E gene, demographic indicators</td>
<td align="center">RF, XGB, GBM, ADA</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B34">Chaganti et al. (2022)</xref>
</td>
<td align="center">2022</td>
<td align="center">Hashimoto&#x2019;s thyroiditis, binding protein (increased binding protein), Autoimmune Thyroiditis, and Non-Thyroidal Syndrome (NTIS)</td>
<td align="center">age, sex, on_thyroxine, query_on_thyroxine, on_antithyroid_medication, sick, pregnant, TSH, T3, T4, T4U, FTI, TBGetc.</td>
<td align="center">RF, LR, SVM, ADA, GBM</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B98">Kwon et al. (2020)</xref>
</td>
<td align="center">2020</td>
<td align="center">PTC</td>
<td align="center">radiomics features</td>
<td align="center">LR, RF, SVM</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B14">Aversano et al. (2021)</xref>
</td>
<td align="center">2021</td>
<td align="center">Hypothyroidism</td>
<td align="center">personal information, family history, physical characteristics, hormonal and thyroid parameters, parameters relating to blood tests</td>
<td align="center">ADA, XGB, GBM, CAT, DT, RF, ExtraTree, k-NN, Naive Bayes, MLP</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B175">Wang et al. (2024a)</xref>
</td>
<td align="center">2024</td>
<td align="center">PTC</td>
<td align="center">demographic characteristics and comorbidities, tumor-related variables, lymph node (LN)-related variables, metabolic and inflammatory markers</td>
<td align="center">LR, XGB, RF, SVM, NN</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B163">Sun et al. (2022)</xref>
</td>
<td align="center">2022</td>
<td align="center">Thyroid Nodules</td>
<td align="center">MS-based proteomics</td>
<td align="center">NN</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B164">Sun et al. (2024)</xref>
</td>
<td align="center">2024</td>
<td align="center">FTA and FTC</td>
<td align="center">MS-based proteomics</td>
<td align="center">XGB</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B178">Wang et al. (2022b)</xref>
</td>
<td align="center">2022</td>
<td align="center">PTC</td>
<td align="center">MS-based metabolomics</td>
<td align="center">RF, SVM</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B179">Wang et al. (2022c)</xref>
</td>
<td align="center">2022</td>
<td align="center">Thyroid Nodules</td>
<td align="center">MS-based ions</td>
<td align="center">RF, SVM, MLP</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B39">Chen et al. (2024)</xref>
</td>
<td align="center">2024</td>
<td align="center">Thyroid Cancer and Thyroid Nodules</td>
<td align="center">MS-based metabolomics</td>
<td align="center">NN, RF, LR, SVM</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B202">Zhu et al. (2024)</xref>
</td>
<td align="center">2024</td>
<td align="center">Radioactive Iodine Refractory (RAIR) and Non-Radioactive Iodine Refractory (Non-RAIR) PTC</td>
<td align="center">MS-based proteomics</td>
<td align="center">XGB</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>ADA, adaptive boosting; CAT, CatBoosting; CNN, convolutional neural network; DT, decision tree; GBM, gradient boosting machine; k-NN, k-nearest neighbor; LDA, linear discriminant analysis; LR, logistic regression; LSTM, long short-term memory; MLP, multilayer perceptron; NN, neural network; RF, random forest; RNN, recurrent neural network; SVM, support vector machine; XGB, eXtreme Gradient Boosting.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>By analyzing the above research works, we found that patients&#x2019; personal data and hormone parameters are often used as features, such as age, sex, thyroid-stimulating hormone (TSH), total serum triiodothyronine (T3), thyroid binding globulin (TBG) and total serum thyroxin (T4). Among these features, almost every researcher has selected some features for thyroid disease diagnosis work. MS-based proteomics and metabolomics data are also often used but almost only single type is used. In order to analyze thyroid disease more comprehensively, combining metabolomics and proteomics or combining them with other omics data such as genomics and clinical indicators should be further considered in future studies.</p>
</sec>
<sec id="s3-2-2-2">
<title>3.2.2.2 Risk stratification</title>
<p>A significant advantage of ML in the clinic is its ability to facilitate early intervention (<xref ref-type="bibr" rid="B3">Adlung et al., 2021</xref>). By using advanced algorithms and predictive models, ML algorithms can detect potential health risks at an early stage, and effectively classify diseases into different risk categories, which offer a nuanced understanding of the likelihood of patients developing specific health conditions and allowing clinicians to intervene promptly and implement targeted treatments (<xref ref-type="bibr" rid="B20">Beaulieu-Jones et al., 2021</xref>; <xref ref-type="bibr" rid="B41">Choudhury and Asan, 2020</xref>; <xref ref-type="bibr" rid="B162">Sun et al., 2023</xref>). This goes beyond traditional diagnostic methods, providing a more personalized and proactive approach to healthcare (<xref ref-type="bibr" rid="B192">Yadav, 2024</xref>).</p>
<p>Saima Sharleen Islam (<xref ref-type="bibr" rid="B162">Sun et al., 2023</xref>) et al. used 11 ML models to predict thyroid risk and used accuracy and recall as evaluation indicators. The results show that the ANN classifier outperforms the others in terms of accuracy. <xref ref-type="bibr" rid="B199">Zhao et al. (2022a)</xref> et al. used 5 ML models to predict the risk of nodular thyroid disease in coal miners, with the XGB model having the best overall predictive performance.</p>
<p>
<xref ref-type="bibr" rid="B180">Wang et al. (2022a)</xref> presented ML models based on comprehensive predictors to predict the structural recurrence risk of PTC patients. All the patients were treated with thyroid surgery and radioiodine. Twenty-nine perioperative variables consisting of four dimensions (demographic characteristics and comorbidities, tumor-related variables, lymph node-related variables, and metabolic and inflammatory markers) were analyzed <xref ref-type="bibr" rid="B180">Wang et al. (2022a)</xref>. The results showed that the RF model achieved the expected prediction effect, with good discrimination, calibration, and interpretability, and revealed the potential of ML models in improving the accuracy of risk stratification of PTC patients <xref ref-type="bibr" rid="B180">Wang et al. (2022a)</xref>.</p>
<p>MS-based multi-omics data can also be combined with ML for risk stratification in thyroid disease. <xref ref-type="bibr" rid="B106">Li et al. (2024)</xref> first reported a Preoperative Risk Assessment Classifier for PTC (PRAC-PTC) which constructed by ML models used clinical indicators, immune indices, genetic feature, and MS-based proteomics as multidimensional features. The results showed that six proteins (DPP7, PDLIM3, Col12A1, CTSL, TUBB2A, and ITGB5) were identified as the best discriminable proteins between low-risk and intermediate-risk/high-risk PTCs (<xref ref-type="bibr" rid="B106">Li et al., 2024</xref>). XGBoost showed the best performance among these ML models authors used. PRAC-PTC can increase the accuracy of the preoperative risk stratification and decrease unnecessary surgery or overtreatment.</p>
<p>
<xref ref-type="bibr" rid="B173">Wang et al. (2024b)</xref> used different ML algorithms to explore the relationship between mixed-semi-volatile organic compounds (SVOCs) exposure and thyroid nodule. The data was collected by GC-MS/MS. RF and AdaBoost models were selected to screen out the features based on their contribution to the models. Weighted quantile sum (WQS) regression and Bayesian kernel machine regression (BKMR) were used to assess the mixed effects of the SVOCs exposure on thyroid nodule (<xref ref-type="bibr" rid="B173">Wang et al., 2024b</xref>). The results showed that high levels of exposure to SVOCs increase the risk of PTC and nodular goiters (NG), with Fluazifop-butyl and Fenpropathrin playing a major role (<xref ref-type="bibr" rid="B173">Wang et al., 2024b</xref>).</p>
<p>
<xref ref-type="bibr" rid="B181">Wang et al. (2024c)</xref> proposed a ML-based objective method to individual to predict the risk of pediatric papillary thyroid carcinomas (PPTCs). They collected the clinical factors and MS-based proteomics data and nineteen proteins were selected by ML models to construct a protein-based personalized prognostic prediction model which can stratify PPTC patients into high- or low-recurrence risk groups and provide a suggestion for clinical decision-making and individualized treatment.</p>
<p>The combination of ML and MS-based multi-omics data in thyroid disease not only enhances disease risk assessment but also improves the approach to patient care. Through early intervention, patient stratification, and the implementation of targeted preventive measures, ML makes a significant contribution to improving patient health and building a more personalized and efficient clinical treatment system (<xref ref-type="bibr" rid="B88">Khalifa and Albadawy, 2024</xref>; <xref ref-type="bibr" rid="B89">Khalifa et al., 2024</xref>).</p>
</sec>
</sec>
</sec>
</sec>
<sec id="s4"> <title>4 Summary</title>
<p>In the 21st century, the development of medical science has entered the era of big data, with ML algorithms, as a cornerstone of artificial intelligence, beginning to emerge in clinical disease research (<xref ref-type="bibr" rid="B104">Li et al., 2023b</xref>). From the clinical perspective, the application of ML in thyroid disease can contribute to the classification, diagnosis, treatment and prognosis. MS-based multi-omics analysis utilizing ML technology, offers significant prospects for early disease detection and prevention. However, there are currently limited examples of successful application of such technologies into clinical practice (<xref ref-type="bibr" rid="B87">Kelly et al., 2019</xref>). There are also many challenges must be addressed. In the biomarker field, the primary challenge is not in data analysis, but in the collection of comprehensive clinical data for each particular patient (<xref ref-type="bibr" rid="B47">Desaire et al., 2022</xref>; <xref ref-type="bibr" rid="B121">Arzyeh et al., 2020</xref>). The success of ML algorithms in the medical field largely depends on the quality, diversity, and completeness of the training data (<xref ref-type="bibr" rid="B152">Sarker, 2021</xref>). While the number of samples in some researches are not small, collecting more data will increase the diversity of patients. Models trained on broader and more diverse datasets will generalize better to new patients when deployed in real-world scenarios (<xref ref-type="bibr" rid="B189">Xi et al., 2022</xref>). Most researches mainly use publicly available datasets, and many datasets have the problem of class imbalance, with a very small number of samples in a certain class. Meanwhile, this phenomenon also leads to the results not being universal. When ML models are applied to such datasets, the models will overfit to the majority class, resulting in incorrect predictions for the minority class. The other limitation is that only a few types of thyroid diseases have been used to classification problems in existing studies, and most studies focus on binary classification, which has caused certain limitations in the application of ML to clinical applications of thyroid diseases. In disease research, this entails collecting detailed information about a patient&#x2019;s medical history, genetic profile, treatment response, and long-term outcomes. Furthermore, patient privacy and data security must be carefully managed and addressed. As data volume increases, it is imperative to implement robust measures to protect patient privacy and uphold ethical standards (<xref ref-type="bibr" rid="B1">Abouelmehdi et al., 2018</xref>).</p>
<p>In summary, while ML holds substantial for clinical disease researches, it also encounters significant challenges to widespread adoption. Addressing these challenges will pave the way for realizing the full potential of ML in enhancing disease diagnosis, prognosis, and personalized treatment strategies.</p>
</sec>
</body>
<back>
<sec sec-type="author-contributions" id="s5">
<title>Author contributions</title>
<p>YC: Writing&#x2013;original draft, Writing&#x2013;review and editing. MZ: Writing&#x2013;review and editing. YG: Writing&#x2013;review and editing. ZZ: Writing&#x2013;review and editing, Resources. XZ: Conceptualization, Writing&#x2013;review and editing, Supervision, Funding acquisition, Resources.</p>
</sec>
<sec sec-type="funding-information" id="s6">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research, authorship, and/or publication of this article.</p>
</sec>
<ack>
<p>Thanks are given to ZZ for assistance with histopathologic information for endocrine tumors and to XZ for valuable discussions.</p>
</ack>
<sec sec-type="COI-statement" id="s7">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s8">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abouelmehdi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Beni-Hessane</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Khaloufi</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Big healthcare data: preserving security and privacy</article-title>. <source>J. Big Data</source> <volume>5</volume> (<issue>1</issue>), <fpage>1</fpage>. <pub-id pub-id-type="doi">10.1186/s40537-017-0110-7</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abu Alfeilat</surname>
<given-names>H. A.</given-names>
</name>
<name>
<surname>Hassanat</surname>
<given-names>A. B. A.</given-names>
</name>
<name>
<surname>Lasassmeh</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Tarawneh</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Alhasanat</surname>
<given-names>M. B.</given-names>
</name>
<name>
<surname>Eyal Salman</surname>
<given-names>H. S.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Effects of distance measure choice on K-nearest neighbor classifier performance: a review</article-title>. <source>Big Data</source> <volume>7</volume> (<issue>4</issue>), <fpage>221</fpage>&#x2013;<lpage>248</lpage>. <pub-id pub-id-type="doi">10.1089/big.2018.0175</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Adlung</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Cohen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mor</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Elinav</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Machine learning in clinical decision making</article-title>. <source>Med</source> <volume>2</volume> (<issue>6</issue>), <fpage>642</fpage>&#x2013;<lpage>665</lpage>. <pub-id pub-id-type="doi">10.1016/j.medj.2021.04.006</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alber</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Buganza Tepole</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cannon</surname>
<given-names>W. R.</given-names>
</name>
<name>
<surname>De</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dura-Bernal</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Garikipati</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Integrating machine learning and multiscale modeling-perspectives, challenges, and opportunities in the biological, biomedical, and behavioral sciences</article-title>. <source>NPJ Digit. Med.</source> <volume>2</volume>, <fpage>115</fpage>. <pub-id pub-id-type="doi">10.1038/s41746-019-0193-y</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alhassan</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Wan Zainon</surname>
<given-names>W. M. N.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Review of feature selection, dimensionality reduction and classification for chronic disease diagnosis</article-title>. <source>IEEE Access</source> <volume>9</volume>, <fpage>87310</fpage>&#x2013;<lpage>87317</lpage>. <pub-id pub-id-type="doi">10.1109/access.2021.3088613</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Al-muwaffaq</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Bozkus</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>MLTDD: use of machine learning techniques for diagnosis of thyroid gland disorder</article-title>. <source>Comput. Sci. and Inf. Technol. ( CS and IT )</source>, <fpage>67</fpage>&#x2013;<lpage>73</lpage>. <pub-id pub-id-type="doi">10.5121/csit.2016.60507</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alseekh</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Aharoni</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Brotman</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Contrepois</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>D&#x27;Auria</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ewald</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Mass spectrometry-based metabolomics: a guide for annotation, quantification and best reporting practices</article-title>. <source>Nat. Methods</source> <volume>18</volume> (<issue>7</issue>), <fpage>747</fpage>&#x2013;<lpage>756</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-021-01197-1</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Angra</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ahuja</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>Machine learning and its applications: a review</article-title>,&#x201d; in <conf-name>2017 International Conference on Big Data Analytics and Computational Intelligence (ICBDAC)</conf-name>, <conf-date>23-25 March 2017</conf-date>, <fpage>57</fpage>&#x2013;<lpage>60</lpage>. <pub-id pub-id-type="doi">10.1109/icbdaci.2017.8070809</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Archer</surname>
<given-names>K. J.</given-names>
</name>
<name>
<surname>Kimes</surname>
<given-names>R. V.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Empirical characterization of random forest variable importance measures</article-title>. <source>Comput. Statistics and Data Analysis</source> <volume>52</volume> (<issue>4</issue>), <fpage>2249</fpage>&#x2013;<lpage>2260</lpage>. <pub-id pub-id-type="doi">10.1016/j.csda.2007.08.015</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arif Ali</surname>
<given-names>Z. H.</given-names>
</name>
<name>
<surname>Abduljabbar</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Tahir</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Bibo Sallow</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Almufti</surname>
<given-names>S. M.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>eXtreme gradient boosting algorithm with machine learning: a review</article-title>. <source>Acad. J. Nawroz Univ.</source> <volume>12</volume> (<issue>2</issue>), <fpage>320</fpage>&#x2013;<lpage>334</lpage>. <pub-id pub-id-type="doi">10.25007/ajnu.v12n2a1612</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arjmand</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Hamidpour</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Tayanloo-Beik</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Goodarzi</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Aghayan</surname>
<given-names>H. R.</given-names>
</name>
<name>
<surname>Adibi</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Machine learning: a new prospect in multi-omics data analysis of cancer</article-title>. <source>Front. Genet.</source> <volume>13</volume>, <fpage>824451</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2022.824451</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aruna</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sp</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>A novel SVM based CSSFFS feature selection algorithm for detecting breast cancer</article-title>. <source>Int. J. Comput. Appl.</source> <volume>31</volume> (<issue>8</issue>), <fpage>14</fpage>&#x2013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.5120/3844-5346</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Auslander</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Gussow</surname>
<given-names>A. B.</given-names>
</name>
<name>
<surname>Koonin</surname>
<given-names>E. V.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Incorporating machine learning into established bioinformatics frameworks</article-title>. <source>Int. J. Mol. Sci.</source> <volume>22</volume> (<issue>6</issue>), <fpage>2903</fpage>. <pub-id pub-id-type="doi">10.3390/ijms22062903</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aversano</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Bernardi</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Cimitile</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Iammarino</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Macchia</surname>
<given-names>P. E.</given-names>
</name>
<name>
<surname>Nettore</surname>
<given-names>I. C.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Thyroid Disease Treatment prediction with machine learning approaches</article-title>. <source>Procedia Comput. Sci.</source> <volume>19</volume>, <fpage>1031</fpage>&#x2013;<lpage>1040</lpage>. <pub-id pub-id-type="doi">10.1016/j.procs.2021.08.106</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Babu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Snyder</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Multi-omics profiling for health</article-title>. <source>Mol. Cell. Proteomics</source> <volume>22</volume> (<issue>6</issue>), <fpage>100561</fpage>. <pub-id pub-id-type="doi">10.1016/j.mcpro.2023.100561</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ball</surname>
<given-names>L. E.</given-names>
</name>
<name>
<surname>Agana</surname>
<given-names>B. A.</given-names>
</name>
<name>
<surname>Comte-Walters</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bethard</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Burnette</surname>
<given-names>B. B.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>An introduction to mass spectrometry-based proteomics</article-title>. <source>Encycl. Cell. Biol.</source>, <fpage>132</fpage>&#x2013;<lpage>140</lpage>. <pub-id pub-id-type="doi">10.1016/b978-0-12-821618-7.00143-7</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baraldi</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>Enders</surname>
<given-names>C. K.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>An introduction to modern missing data analyses</article-title>. <source>J. Sch. Psychol.</source> <volume>48</volume> (<issue>1</issue>), <fpage>5</fpage>&#x2013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.1016/j.jsp.2009.10.001</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Basolo</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Macerola</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Poma</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Torregrossa</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>The 5(th) edition of WHO classification of tumors of endocrine organs: changes in the diagnosis of follicular-derived thyroid carcinoma</article-title>. <source>Endocrine</source> <volume>80</volume> (<issue>3</issue>), <fpage>470</fpage>&#x2013;<lpage>476</lpage>. <pub-id pub-id-type="doi">10.1007/s12020-023-03336-4</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beattie</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Esmonde-White</surname>
<given-names>F. W. L.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Exploration of principal component analysis: deriving principal component analysis visually using spectra</article-title>. <source>Appl. Spectrosc.</source> <volume>75</volume> (<issue>4</issue>), <fpage>361</fpage>&#x2013;<lpage>375</lpage>. <pub-id pub-id-type="doi">10.1177/0003702820987847</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beaulieu-Jones</surname>
<given-names>B. K.</given-names>
</name>
<name>
<surname>Yuan</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Brat</surname>
<given-names>G. A.</given-names>
</name>
<name>
<surname>Beam</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Weber</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Ruffin</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Machine learning for patient risk stratification: standing on, or looking over, the shoulders of clinicians?</article-title> <source>NPJ Digit. Med.</source> <volume>4</volume> (<issue>1</issue>), <fpage>62</fpage>. <pub-id pub-id-type="doi">10.1038/s41746-021-00426-3</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Becht</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>McInnes</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Healy</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Dutertre</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Kwok</surname>
<given-names>I. W. H.</given-names>
</name>
<name>
<surname>Ng</surname>
<given-names>L. G.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Dimensionality reduction for visualizing single-cell data using UMAP</article-title>. <source>Nat. Biotechnol.</source> <volume>37</volume>, <fpage>38</fpage>&#x2013;<lpage>44</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.4314</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beck</surname>
<given-names>A. G.</given-names>
</name>
<name>
<surname>Muhoberac</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Randolph</surname>
<given-names>C. E.</given-names>
</name>
<name>
<surname>Beveridge</surname>
<given-names>C. H.</given-names>
</name>
<name>
<surname>Wijewardhane</surname>
<given-names>P. R.</given-names>
</name>
<name>
<surname>Kenttamaa</surname>
<given-names>H. I.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Recent developments in machine learning for mass spectrometry</article-title>. <source>ACS Meas. Sci. Au</source> <volume>4</volume> (<issue>3</issue>), <fpage>233</fpage>&#x2013;<lpage>246</lpage>. <pub-id pub-id-type="doi">10.1021/acsmeasuresciau.3c00060</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Belgiu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Dr&#x103;gu&#x163;</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Random forest in remote sensing: a review of applications and future directions</article-title>. <source>ISPRS J. Photogrammetry Remote Sens.</source> <volume>114</volume>, <fpage>24</fpage>&#x2013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1016/j.isprsjprs.2016.01.011</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Berger</surname>
<given-names>M. F.</given-names>
</name>
<name>
<surname>Mardis</surname>
<given-names>E. R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>The emerging clinical relevance of genomics in cancer medicine</article-title>. <source>Nat. Rev. Clin. Oncol.</source> <volume>15</volume> (<issue>6</issue>), <fpage>353</fpage>&#x2013;<lpage>365</lpage>. <pub-id pub-id-type="doi">10.1038/s41571-018-0002-6</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Biomarkers</surname>
<given-names>D. W. G.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Biomarkers and surrogate endpoints: preferred definitions and conceptual framework</article-title>. <source>Clin. Pharmacol. Ther.</source> <volume>69</volume> (<issue>3</issue>), <fpage>89</fpage>&#x2013;<lpage>95</lpage>. <pub-id pub-id-type="doi">10.1067/mcp.2001.113989</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Blekherman</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Laubenbacher</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Cortes</surname>
<given-names>D. F.</given-names>
</name>
<name>
<surname>Mendes</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Torti</surname>
<given-names>F. M.</given-names>
</name>
<name>
<surname>Akman</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Bioinformatics tools for cancer metabolomics</article-title>. <source>Metabolomics</source> <volume>7</volume> (<issue>3</issue>), <fpage>329</fpage>&#x2013;<lpage>343</lpage>. <pub-id pub-id-type="doi">10.1007/s11306-010-0270-3</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boateng</surname>
<given-names>E. Y.</given-names>
</name>
<name>
<surname>Otoo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Abaye</surname>
<given-names>D. A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Basic tenets of classification algorithms K-Nearest-Neighbor, support vector machine, random forest and neural network: a review</article-title>. <source>J. Data Analysis Inf. Process.</source> <volume>08</volume> (<issue>04</issue>), <fpage>341</fpage>&#x2013;<lpage>357</lpage>. <pub-id pub-id-type="doi">10.4236/jdaip.2020.84020</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boser</surname>
<given-names>B. E.</given-names>
</name>
<name>
<surname>Guyon</surname>
<given-names>I. M.</given-names>
</name>
<name>
<surname>Vapnik</surname>
<given-names>V. N.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>A training algorithm for optimal margin classifiers</article-title>. <source>Proc. fifth Annu. workshop Comput. Learn. theory</source>, <fpage>144</fpage>&#x2013;<lpage>152</lpage>. <pub-id pub-id-type="doi">10.1145/130385.130401</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cadenas</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Garrido</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Mart&#xed;nez</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Feature subset selection Filter&#x2013;Wrapper based on low quality data</article-title>. <source>Expert Syst. Appl.</source> <volume>40</volume> (<issue>16</issue>), <fpage>6241</fpage>&#x2013;<lpage>6252</lpage>. <pub-id pub-id-type="doi">10.1016/j.eswa.2013.05.051</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Califf</surname>
<given-names>R. M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Biomarker definitions and their applications</article-title>. <source>Exp. Biol. Med. (Maywood)</source> <volume>243</volume> (<issue>3</issue>), <fpage>213</fpage>&#x2013;<lpage>221</lpage>. <pub-id pub-id-type="doi">10.1177/1535370217750088</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Extreme learning machines on high dimensional and large data applications: a survey</article-title>. <source>Math. Problems Eng.</source> <volume>2015</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1155/2015/103796</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Caria</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Dettori</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Frau</surname>
<given-names>D. V.</given-names>
</name>
<name>
<surname>Lichtenzstejn</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Pani</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Vanni</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Characterizing the three-dimensional organization of telomeres in papillary thyroid carcinoma cells</article-title>. <source>J. Cell. Physiol.</source> <volume>234</volume> (<issue>4</issue>), <fpage>5175</fpage>&#x2013;<lpage>5185</lpage>. <pub-id pub-id-type="doi">10.1002/jcp.27321</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cervantes</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Garcia-Lamont</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Rodr&#xed;guez-Mazahua</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Lopez</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A comprehensive survey on support vector machine classification: applications, challenges and trends</article-title>. <source>Neurocomputing</source> <volume>408</volume>, <fpage>189</fpage>&#x2013;<lpage>215</lpage>. <pub-id pub-id-type="doi">10.1016/j.neucom.2019.10.118</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chaganti</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Rustam</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>De La Torre Diez</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Mazon</surname>
<given-names>J. L. V.</given-names>
</name>
<name>
<surname>Rodriguez</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Ashraf</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Thyroid disease prediction using selective features and machine learning techniques</article-title>. <source>Cancers (Basel)</source> <volume>14</volume> (<issue>16</issue>), <fpage>3914</fpage>. <pub-id pub-id-type="doi">10.3390/cancers14163914</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chatzimparmpas</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Martins</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Kerren</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>t-viSNE: interactive assessment and interpretation of t-SNE projections</article-title>. <source>IEEE Trans. Vis. Comput. Graph</source> <volume>26</volume> (<issue>8</issue>), <fpage>2696</fpage>&#x2013;<lpage>2714</lpage>. <pub-id pub-id-type="doi">10.1109/TVCG.2020.2986996</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chaubey</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Bisen</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Arjaria</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yadav</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Thyroid disease prediction using machine learning approaches</article-title>. <source>Natl. Acad. Sci. Lett.</source> <volume>44</volume> (<issue>3</issue>), <fpage>233</fpage>&#x2013;<lpage>238</lpage>. <pub-id pub-id-type="doi">10.1007/s40009-020-00979-z</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2023b</year>). <article-title>Applications of multi-omics analysis in human diseases</article-title>. <source>MedComm</source> <volume>4</volume> (<issue>4</issue>), <fpage>e315</fpage>. <pub-id pub-id-type="doi">10.1002/mco2.315</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Lang</surname>
<given-names>B. H. H.</given-names>
</name>
<name>
<surname>McLeod</surname>
<given-names>D. S. A.</given-names>
</name>
<name>
<surname>Newbold</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Haymart</surname>
<given-names>M. R.</given-names>
</name>
</person-group> (<year>2023a</year>). <article-title>Thyroid cancer</article-title>. <source>Lancet</source> <volume>401</volume> (<issue>10387</issue>), <fpage>1531</fpage>&#x2013;<lpage>1544</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(23)00020-X</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Qu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jia</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>High-performance metabolic profiling of high-risk thyroid nodules by ZrMOF hybrids</article-title>. <source>ACS Nano</source> <volume>18</volume> (<issue>32</issue>), <fpage>21336</fpage>&#x2013;<lpage>21346</lpage>. <pub-id pub-id-type="doi">10.1021/acsnano.4c05700</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>X. W.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>J. X.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Big data bioinformatics</article-title>. <source>Methods</source> <volume>111</volume>, <fpage>1</fpage>&#x2013;<lpage>2</lpage>. <pub-id pub-id-type="doi">10.1016/j.ymeth.2016.11.017</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Choudhury</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Asan</surname>
<given-names>O.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Role of artificial intelligence in patient safety outcomes: systematic literature review</article-title>. <source>JMIR Med. Inf.</source> <volume>8</volume> (<issue>7</issue>), <fpage>e18599</fpage>. <pub-id pub-id-type="doi">10.2196/18599</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cieslak</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Castelfranco</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Roncalli</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Lenz</surname>
<given-names>P. H.</given-names>
</name>
<name>
<surname>Hartline</surname>
<given-names>D. K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>t-Distributed Stochastic Neighbor Embedding (t-SNE): a tool for eco-physiological transcriptomic analysis</article-title>. <source>Mar. Genomics</source> <volume>51</volume>, <fpage>100723</fpage>. <pub-id pub-id-type="doi">10.1016/j.margen.2019.100723</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>D&#x27;Andrea</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Jing</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Peyrottes</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Guigonis</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Graslin</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Lindenthal</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Pilot study on the use of untargeted metabolomic fingerprinting of liquid-cytology fluids as a diagnostic tool of malignancy for thyroid nodules</article-title>. <source>Metabolites</source> <volume>13</volume> (<issue>7</issue>), <fpage>782</fpage>. <pub-id pub-id-type="doi">10.3390/metabo13070782</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Da Silva Lopes</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Doria Neto</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>De Medeiros Martins</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Parallel t-SNE applied to data visualization in smart cities</article-title>. <source>IEEE Access</source> <volume>8</volume>, <fpage>11482</fpage>&#x2013;<lpage>11490</lpage>. <pub-id pub-id-type="doi">10.1109/access.2020.2964413</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davis</surname>
<given-names>K. D.</given-names>
</name>
<name>
<surname>Aghaeepour</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Ahn</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Angst</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Borsook</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Brenton</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Discovery and validation of biomarkers to aid the development of safe and effective pain therapeutics: challenges and opportunities</article-title>. <source>Nat. Rev. Neurol.</source> <volume>16</volume> (<issue>7</issue>), <fpage>381</fpage>&#x2013;<lpage>400</lpage>. <pub-id pub-id-type="doi">10.1038/s41582-020-0362-2</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Demir</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>&#x15e;ahin</surname>
<given-names>E. K.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Liquefaction prediction with robust machine learning algorithms (SVM, RF, and XGBoost) supported by genetic algorithm-based feature selection and parameter optimization from the perspective of data processing</article-title>. <source>Environ. Earth Sci.</source> <volume>81</volume> (<issue>18</issue>), <fpage>459</fpage>. <pub-id pub-id-type="doi">10.1007/s12665-022-10578-4</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Desaire</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Go</surname>
<given-names>E. P.</given-names>
</name>
<name>
<surname>Hua</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Advances, obstacles, and opportunities for machine learning in proteomics</article-title>. <source>Cell. Rep. Phys. Sci.</source> <volume>3</volume> (<issue>10</issue>), <fpage>101069</fpage>. <pub-id pub-id-type="doi">10.1016/j.xcrp.2022.101069</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ding</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>Y.-Q.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Mass spectrometry-based metabolomics for clinical study: recent progresses and applications</article-title>. <source>TrAC Trends Anal. Chem.</source> <volume>158</volume>, <fpage>116896</fpage>. <pub-id pub-id-type="doi">10.1016/j.trac.2022.116896</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Du</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Missing data problem in the monitoring system: a review</article-title>. <source>IEEE Sensors J.</source> <volume>20</volume> (<issue>23</issue>), <fpage>13984</fpage>&#x2013;<lpage>13998</lpage>. <pub-id pub-id-type="doi">10.1109/jsen.2020.3009265</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Emmanuel</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Maupong</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Mpoeleng</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Semong</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Mphago</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Tabona</surname>
<given-names>O.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A survey on missing data in machine learning</article-title>. <source>J. Big Data</source> <volume>8</volume> (<issue>1</issue>), <fpage>140</fpage>. <pub-id pub-id-type="doi">10.1186/s40537-021-00516-9</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fan</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z. W.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>N. R.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>L. H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z. C.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Urine proteomic signatures predicting the progression from premalignancy to malignant gastric cancer</article-title>. <source>EBioMedicine</source> <volume>86</volume>, <fpage>104340</fpage>. <pub-id pub-id-type="doi">10.1016/j.ebiom.2022.104340</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fanaee</surname>
<given-names>T. H.</given-names>
</name>
<name>
<surname>Thoresen</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Multi-insight visualization of multi-omics data via ensemble dimension reduction and tensor factorization</article-title>. <source>Bioinformatics</source> <volume>35</volume> (<issue>10</issue>), <fpage>1625</fpage>&#x2013;<lpage>1633</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bty847</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fannes</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Vandermarliere</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Schietgat</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Degroeve</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Martens</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ramon</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Predicting tryptic cleavage from proteomics data using decision tree ensembles</article-title>. <source>J. Proteome Res.</source> <volume>12</volume> (<issue>5</issue>), <fpage>2253</fpage>&#x2013;<lpage>2259</lpage>. <pub-id pub-id-type="doi">10.1021/pr4001114</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fern&#xe1;ndez</surname>
<given-names>P. L.</given-names>
</name>
<name>
<surname>Merino</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>G&#xf3;mez</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Campo</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Medina</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Castronovo</surname>
<given-names>V.</given-names>
</name>
<etal/>
</person-group> (<year>1997</year>). <article-title>Galectin-3 and laminin expression in neoplastic and non-neoplastic thyroid tissue</article-title>. <source>J. Pathol.</source> <volume>181</volume> (<issue>1</issue>), <fpage>80</fpage>&#x2013;<lpage>86</lpage>. <pub-id pub-id-type="doi">10.1002/(SICI)1096-9896(199701)181:1&#x3c;80::AID-PATH699&#x3e;3.0.CO;2-E</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Galal</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Talal</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Moustafa</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Applications of machine learning in metabolomics: disease modeling and classification</article-title>. <source>Front. Genet.</source> <volume>13</volume>, <fpage>1017340</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2022.1017340</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gild</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Bullock</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pon</surname>
<given-names>C. K.</given-names>
</name>
<name>
<surname>Robinson</surname>
<given-names>B. G.</given-names>
</name>
<name>
<surname>Clifton-Bligh</surname>
<given-names>R. J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Destabilizing RET in targeted treatment of thyroid cancers</article-title>. <source>Endocr. Connect.</source> <volume>5</volume> (<issue>1</issue>), <fpage>10</fpage>&#x2013;<lpage>19</lpage>. <pub-id pub-id-type="doi">10.1530/EC-15-0098</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gisbrecht</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Schulz</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hammer</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Parametric nonlinear dimensionality reduction using kernel t-SNE</article-title>. <source>Neurocomputing</source> <volume>147</volume>, <fpage>71</fpage>&#x2013;<lpage>82</lpage>. <pub-id pub-id-type="doi">10.1016/j.neucom.2013.11.045</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goecks</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jalili</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Heiser</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Gray</surname>
<given-names>J. W.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>How machine learning will transform biomedicine</article-title>. <source>Cell.</source> <volume>181</volume> (<issue>1</issue>), <fpage>92</fpage>&#x2013;<lpage>101</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2020.03.022</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Granato</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Santos</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Escher</surname>
<given-names>G. B.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>B. L.</given-names>
</name>
<name>
<surname>Maggio</surname>
<given-names>R. M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Use of principal component analysis (PCA) and hierarchical cluster analysis (HCA) for multivariate association between bioactive compounds and functional properties in foods: a critical perspective</article-title>. <source>Trends Food Sci. and Technol.</source> <volume>72</volume>, <fpage>83</fpage>&#x2013;<lpage>90</lpage>. <pub-id pub-id-type="doi">10.1016/j.tifs.2017.12.006</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guarino</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Castellone</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Avilla</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Melillo</surname>
<given-names>R. M.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Thyroid cancer and inflammation</article-title>. <source>Mol. Cell. Endocrinol.</source> <volume>321</volume> (<issue>1</issue>), <fpage>94</fpage>&#x2013;<lpage>102</lpage>. <pub-id pub-id-type="doi">10.1016/j.mce.2009.10.003</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Xing</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Huan</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2022a</year>). <article-title>Addressing big data challenges in mass spectrometry-based metabolomics</article-title>. <source>Chem. Commun. (Camb)</source> <volume>58</volume> (<issue>72</issue>), <fpage>9979</fpage>&#x2013;<lpage>9990</lpage>. <pub-id pub-id-type="doi">10.1039/d2cc03598g</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>Y.-y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.-j.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Gong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.-x.</given-names>
</name>
<etal/>
</person-group> (<year>2022b</year>). <article-title>Machine learning for identifying benign and malignant of thyroid tumors: a retrospective study of 2,423 patients</article-title>. <source>Front. Public Health</source> <volume>10</volume>, <fpage>960740</fpage>. <pub-id pub-id-type="doi">10.3389/fpubh.2022.960740</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gupta</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Rustam</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Kanwal</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Aljedaani</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Alfarhood</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Safran</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Detecting thyroid disease using optimized machine learning model based on differential evolution</article-title>. <source>Int. J. Comput. Intell. Syst.</source> <volume>17</volume> (<issue>1</issue>), <fpage>3</fpage>. <pub-id pub-id-type="doi">10.1007/s44196-023-00388-2</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Halder</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Verma</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Biswas</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Srivastava</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Recent advances in mass-spectrometry based proteomics software, tools and databases</article-title>. <source>Drug Discov. Today Technol.</source> <volume>39</volume>, <fpage>69</fpage>&#x2013;<lpage>79</lpage>. <pub-id pub-id-type="doi">10.1016/j.ddtec.2021.06.007</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Noble</surname>
<given-names>W. S.</given-names>
</name>
<name>
<surname>Wolf-Yadlin</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Technical advances in proteomics: new developments in data-independent acquisition</article-title>. <source>F1000Res</source> <volume>5</volume>, <fpage>419</fpage>. <pub-id pub-id-type="doi">10.12688/f1000research.7042.1</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>PSL-LCCL: a resource for subcellular protein localization in liver cancer cell line SK_HEP1</article-title>. <source>Database</source> <volume>2022</volume>, <fpage>baab087</fpage>. <pub-id pub-id-type="doi">10.1093/database/baab087</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>F. Q.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F. X.</given-names>
</name>
<name>
<surname>Alolga</surname>
<given-names>R. N.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>M. J.</given-names>
</name>
<etal/>
</person-group> (<year>2019a</year>). <article-title>Serum-plasma matched metabolomics for comprehensive characterization of benign thyroid nodule and papillary thyroid carcinoma</article-title>. <source>Int. J. Cancer</source> <volume>144</volume> (<issue>4</issue>), <fpage>868</fpage>&#x2013;<lpage>876</lpage>. <pub-id pub-id-type="doi">10.1002/ijc.31925</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Mao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2019b</year>). <article-title>A graphical data processing pipeline for mass spectrometry imaging-based spatially resolved metabolomics on tumor heterogeneity</article-title>. <source>Anal. Chim. Acta</source> <volume>1077</volume>, <fpage>183</fpage>&#x2013;<lpage>190</lpage>. <pub-id pub-id-type="doi">10.1016/j.aca.2019.05.068</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Gong</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>H. W.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Deep learning methods for omics data imputation</article-title>. <source>Biol. (Basel)</source> <volume>12</volume> (<issue>10</issue>), <fpage>1313</fpage>. <pub-id pub-id-type="doi">10.3390/biology12101313</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Pacheco</surname>
<given-names>P. P.</given-names>
</name>
<name>
<surname>Narrandes</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Applications of support vector machine (SVM) learning in cancer genomics</article-title>. <source>Cancer Genomics and Proteomics</source> <volume>15</volume> (<issue>1</issue>), <fpage>41</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.21873/cgp.20063</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ivosev</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Burton</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Bonner</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Dimensionality reduction and visualization in principal component analysis</article-title>. <source>Anal. Chem.</source> <volume>80</volume>, <fpage>4933</fpage>&#x2013;<lpage>4944</lpage>. <pub-id pub-id-type="doi">10.1021/ac800110w</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jajin</surname>
<given-names>M. G.</given-names>
</name>
<name>
<surname>Abooshahab</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Hooshmand</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Moradi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Siadat</surname>
<given-names>S. D.</given-names>
</name>
<name>
<surname>Mirzazadeh</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Gas chromatography-mass spectrometry-based untargeted metabolomics reveals metabolic perturbations in medullary thyroid carcinoma</article-title>. <source>Sci. Rep.</source> <volume>12</volume> (<issue>1</issue>), <fpage>8397</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-022-12590-x</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Janitza</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Tutz</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Boulesteix</surname>
<given-names>A.-L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Random forest for ordinal responses: prediction and variable selection</article-title>. <source>Comput. Statistics and Data Analysis</source> <volume>96</volume>, <fpage>57</fpage>&#x2013;<lpage>73</lpage>. <pub-id pub-id-type="doi">10.1016/j.csda.2015.10.005</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jasem</surname>
<given-names>N. M.</given-names>
</name>
<name>
<surname>Kadhim</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Sharba M</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Assessing thyroid function: a review of biochemical markers and testing strategies</article-title>. <source>Int. J. Med. Sci. Dent. Health</source> <volume>10</volume> (<issue>02</issue>), <fpage>130</fpage>&#x2013;<lpage>150</lpage>. <pub-id pub-id-type="doi">10.55640/ijmsdh-10-02-17</pub-id>
</citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jia</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhai</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J. A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Circulating exosome involves in the pathogenesis of autoimmune thyroid diseases through immunomodulatory proteins</article-title>. <source>Front. Immunol.</source> <volume>12</volume>, <fpage>730089</fpage>. <pub-id pub-id-type="doi">10.3389/fimmu.2021.730089</pub-id>
</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jimenez</surname>
<given-names>C. R.</given-names>
</name>
<name>
<surname>Verheul</surname>
<given-names>H. M. W.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Mass spectrometry-based proteomics:from cancer biology to protein biomarkers, drug targets, and clinical applications</article-title>. <source>Am. Soc. Clin. Oncol. Educ. Book</source> <volume>34</volume>, <fpage>e504</fpage>&#x2013;<lpage>e510</lpage>. <pub-id pub-id-type="doi">10.14694/EdBook_AM.2014.34.e504</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johnson</surname>
<given-names>K. B.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>W. Q.</given-names>
</name>
<name>
<surname>Weeraratne</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Frisse</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Misulis</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Rhee</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Precision medicine, AI, and the future of personalized health care</article-title>. <source>Clin. Transl. Sci.</source> <volume>14</volume> (<issue>1</issue>), <fpage>86</fpage>&#x2013;<lpage>93</lpage>. <pub-id pub-id-type="doi">10.1111/cts.12884</pub-id>
</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Joshi</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Garapati</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Ghose</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Kandasamy</surname>
<given-names>R. K.</given-names>
</name>
<name>
<surname>Pandey</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Recent progress in mass spectrometry-based urinary proteomics</article-title>. <source>Clin. Proteomics</source> <volume>21</volume> (<issue>1</issue>), <fpage>14</fpage>. <pub-id pub-id-type="doi">10.1186/s12014-024-09462-z</pub-id>
</citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jovi&#x107;</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Brki&#x107;</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Bogunovi&#x107;</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>A review of feature selection methods with applications</article-title>. <source>2015 38th Int. Convention Inf. Commun. Technol. Electron. Microelectron.</source>, <fpage>1200</fpage>&#x2013;<lpage>1205</lpage>. <pub-id pub-id-type="doi">10.1109/MIPRO.2015.7160458</pub-id>
</citation>
</ref>
<ref id="B80">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ross</surname>
<given-names>Q. J.</given-names>
</name>
</person-group> (<year>1993</year>). <source>C4.5: programs for machine learning</source>. <publisher-loc>San Francisco</publisher-loc>: <publisher-name>Morgan Kaufmann Publishers</publisher-name>.</citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiliang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Salem</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Huan</surname>
<given-names>L</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Feature selection for classification:A review</article-title>. <source>Data Classif. Algorithms Appl.</source> <volume>37</volume>. <pub-id pub-id-type="doi">10.1201/b17320</pub-id>
</citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ko</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Mersha</surname>
<given-names>T. B.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A roadmap for multi-omics data integration using deep learning</article-title>. <source>Brief. Bioinform</source> <volume>23</volume> (<issue>1</issue>), <fpage>bbab454</fpage>. <pub-id pub-id-type="doi">10.1093/bib/bbab454</pub-id>
</citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kappler</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Lehmann</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Mass-spectrometric multi-omics linked to function &#x2013; state-of-the-art investigations of mitochondria in systems medicine</article-title>. <source>TrAC Trends Anal. Chem.</source> <volume>119</volume>, <fpage>115635</fpage>. <pub-id pub-id-type="doi">10.1016/j.trac.2019.115635</pub-id>
</citation>
</ref>
<ref id="B84">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Karimpour-Fard</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Epperson</surname>
<given-names>L. E.</given-names>
</name>
<name>
<surname>Hunter</surname>
<given-names>L. E.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>A survey of computational tools for downstream analysis of proteomic and other omic datasets</article-title>. <source>Hum. Genomics</source> <volume>9</volume> (<issue>1</issue>), <fpage>28</fpage>. <pub-id pub-id-type="doi">10.1186/s40246-015-0050-2</pub-id>
</citation>
</ref>
<ref id="B85">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kavzoglu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Teke</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Predictive performances of ensemble machine learning algorithms in landslide susceptibility mapping using random forest, extreme gradient boosting (XGBoost) and natural gradient boosting (NGBoost)</article-title>. <source>Arabian J. Sci. Eng.</source> <volume>47</volume> (<issue>6</issue>), <fpage>7367</fpage>&#x2013;<lpage>7385</lpage>. <pub-id pub-id-type="doi">10.1007/s13369-022-06560-8</pub-id>
</citation>
</ref>
<ref id="B86">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kawashima</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Watanabe</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Umeyama</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Nakajima</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hattori</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Honda</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Optimization of data-independent acquisition mass spectrometry for deep and highly sensitive proteomic analysis</article-title>. <source>Int. J. Mol. Sci.</source> <volume>20</volume> (<issue>23</issue>), <fpage>5932</fpage>. <pub-id pub-id-type="doi">10.3390/ijms20235932</pub-id>
</citation>
</ref>
<ref id="B87">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kelly</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Karthikesalingam</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Suleyman</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Corrado</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Key challenges for delivering clinical impact with artificial intelligence</article-title>. <source>BMC Med.</source> <volume>17</volume> (<issue>1</issue>), <fpage>195</fpage>. <pub-id pub-id-type="doi">10.1186/s12916-019-1426-2</pub-id>
</citation>
</ref>
<ref id="B88">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khalifa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Albadawy</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Artificial intelligence for diabetes: enhancing prevention, diagnosis, and effective management</article-title>. <source>Comput. Methods Programs Biomed. Update</source> <volume>5</volume>, <fpage>100141</fpage>. <pub-id pub-id-type="doi">10.1016/j.cmpbup.2024.100141</pub-id>
</citation>
</ref>
<ref id="B89">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khalifa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Albadawy</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Iqbal</surname>
<given-names>U.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Advancing clinical decision support: the role of artificial intelligence across six domains</article-title>. <source>Comput. Methods Programs Biomed. Update</source> <volume>5</volume>, <fpage>100142</fpage>. <pub-id pub-id-type="doi">10.1016/j.cmpbup.2024.100142</pub-id>
</citation>
</ref>
<ref id="B90">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khalilia</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chakraborty</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Popescu</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Predicting disease risks from highly imbalanced data using random forest</article-title>. <source>BMC Med. Inf. Decis. Mak.</source> <volume>11</volume> (<issue>51</issue>), <fpage>51</fpage>. <pub-id pub-id-type="doi">10.1186/1472-6947-11-51</pub-id>
</citation>
</ref>
<ref id="B91">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Huo</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tseng</surname>
<given-names>G. C.</given-names>
</name>
<name>
<surname>Bar-Joseph</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Meta-analytic principal component analysis in integrative omics application</article-title>. <source>Bioinformatics</source> <volume>34</volume> (<issue>8</issue>), <fpage>1321</fpage>&#x2013;<lpage>1328</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx765</pub-id>
</citation>
</ref>
<ref id="B92">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Komuro</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kusumoto</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hashimoto</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Yuasa</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Machine learning in cardiology: clinical application and basic research</article-title>. <source>J. Cardiol.</source> <volume>82</volume> (<issue>2</issue>), <fpage>128</fpage>&#x2013;<lpage>133</lpage>. <pub-id pub-id-type="doi">10.1016/j.jjcc.2023.04.020</pub-id>
</citation>
</ref>
<ref id="B93">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kotsiantis</surname>
<given-names>S. B.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>RETRACTED ARTICLE: feature selection for machine learning classification problems: a recent overview</article-title>. <source>Artif. Intell. Rev.</source> <volume>42</volume> (<issue>1</issue>), <fpage>157</fpage>. <pub-id pub-id-type="doi">10.1007/s10462-011-9230-1</pub-id>
</citation>
</ref>
<ref id="B94">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kowalczyk</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ciborowski</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kisluk</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kretowski</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Barbas</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Mass spectrometry based proteomics and metabolomics in personalized oncology</article-title>. <source>Biochim. Biophys. Acta Mol. Basis Dis.</source> <volume>1866</volume> (<issue>5</issue>), <fpage>165690</fpage>. <pub-id pub-id-type="doi">10.1016/j.bbadis.2020.165690</pub-id>
</citation>
</ref>
<ref id="B95">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krassowski</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Das</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Sahu</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Misra</surname>
<given-names>B. B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>State of the field in multi-omics research: from computational needs to data mining and sharing</article-title>. <source>Front. Genet.</source> <volume>11</volume>, <fpage>610798</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2020.610798</pub-id>
</citation>
</ref>
<ref id="B96">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krishnan</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Pathania</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gosavi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Abhishek</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Parchani</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Artificial intelligence in clinical medicine: catalyzing a sustainable global healthcare paradigm</article-title>. <source>Front. Artif. Intell.</source> <volume>6</volume>, <fpage>1227091</fpage>. <pub-id pub-id-type="doi">10.3389/frai.2023.1227091</pub-id>
</citation>
</ref>
<ref id="B97">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kumari</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kaur</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Rakhra</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Deka</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Byeon</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Asenso</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Explainable artificial intelligence and machine learning algorithms for classification of thyroid disease</article-title>. <source>Discov. Appl. Sci.</source> <volume>6</volume> (<issue>7</issue>), <fpage>360</fpage>. <pub-id pub-id-type="doi">10.1007/s42452-024-06068-w</pub-id>
</citation>
</ref>
<ref id="B98">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kwon</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Shin</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Cho</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hahn</surname>
<given-names>S. Y.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>K. W.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Radiomics study of thyroid ultrasound for predicting BRAF mutation in papillary thyroid carcinoma: preliminary results</article-title>. <source>AJNR Am. J. Neuroradiol.</source> <volume>41</volume> (<issue>4</issue>), <fpage>700</fpage>&#x2013;<lpage>705</lpage>. <pub-id pub-id-type="doi">10.3174/ajnr.A6505</pub-id>
</citation>
</ref>
<ref id="B99">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Leo</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Jerome</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Olshe</surname>
<given-names>R.A.</given-names>
</name>
</person-group> (<year>1984</year>). <source>Classification and regression trees</source>. <publisher-loc>New York</publisher-loc>: <publisher-name>Chapman and Hall</publisher-name>, <fpage>582</fpage>&#x2013;<lpage>588</lpage>.</citation>
</ref>
<ref id="B100">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leung Kwan</surname>
<given-names>K. K.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>T. Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Q. Y.</given-names>
</name>
<name>
<surname>Xia Dong</surname>
<given-names>T. T.</given-names>
</name>
<name>
<surname>Lam</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Keung Tsim</surname>
<given-names>K. W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Mass spectrometry-based multi-omics analysis reveals the thermogenetic regulation of herbal medicine in rat model of yeast-induced fever</article-title>. <source>J. Ethnopharmacol.</source> <volume>279</volume>, <fpage>114382</fpage>. <pub-id pub-id-type="doi">10.1016/j.jep.2021.114382</pub-id>
</citation>
</ref>
<ref id="B101">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ning</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ghandi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kryukov</surname>
<given-names>G. V.</given-names>
</name>
<name>
<surname>Gopal</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Deik</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>The landscape of cancer cell line metabolism</article-title>. <source>Nat. Med.</source> <volume>25</volume> (<issue>5</issue>), <fpage>850</fpage>&#x2013;<lpage>860</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-019-0404-8</pub-id>
</citation>
</ref>
<ref id="B102">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Morstatter</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Trevino</surname>
<given-names>R. P.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2017a</year>). <article-title>Feature selection: a data perspective</article-title>. <source>ACM Comput. Surv.</source> <volume>50</volume> (<issue>6</issue>), <fpage>1</fpage>&#x2013;<lpage>45</lpage>. <pub-id pub-id-type="doi">10.1145/3136625</pub-id>
</citation>
</ref>
<ref id="B103">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mi</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ran</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Sui</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2023a</year>). <article-title>Identification of potential diagnostic and prognostic biomarkers for papillary thyroid microcarcinoma (PTMC) based on TMT-labeled LC-MS/MS and machine learning</article-title>. <source>J. Endocrinol. Invest.</source> <volume>46</volume> (<issue>6</issue>), <fpage>1131</fpage>&#x2013;<lpage>1143</lpage>. <pub-id pub-id-type="doi">10.1007/s40618-022-01960-x</pub-id>
</citation>
</ref>
<ref id="B104">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Leng</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mao</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2023b</year>). <article-title>New perspectives on cancer clinical research in the era of big data and machine learning</article-title>. <source>Surg. Oncol.</source> <volume>52</volume>, <fpage>102009</fpage>. <pub-id pub-id-type="doi">10.1016/j.suronc.2023.102009</pub-id>
</citation>
</ref>
<ref id="B105">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2017b</year>). <article-title>Recent advances in feature selection and its applications</article-title>. <source>Knowl. Inf. Syst.</source> <volume>53</volume> (<issue>3</issue>), <fpage>551</fpage>&#x2013;<lpage>577</lpage>. <pub-id pub-id-type="doi">10.1007/s10115-017-1059-8</pub-id>
</citation>
</ref>
<ref id="B106">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Risk stratification of papillary thyroid cancers using multidimensional machine learning</article-title>. <source>Int. J. Surg.</source> <volume>110</volume> (<issue>1</issue>), <fpage>372</fpage>&#x2013;<lpage>384</lpage>. <pub-id pub-id-type="doi">10.1097/js9.0000000000000814</pub-id>
</citation>
</ref>
<ref id="B107">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liang</surname>
<given-names>L. W.</given-names>
</name>
<name>
<surname>Raita</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hasegawa</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Fifer</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Maurer</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Reilly</surname>
<given-names>M. P.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Proteomics profiling reveals a distinct high-risk molecular subtype of hypertrophic cardiomyopathy</article-title>. <source>Heart</source> <volume>108</volume> (<issue>22</issue>), <fpage>1807</fpage>&#x2013;<lpage>1814</lpage>. <pub-id pub-id-type="doi">10.1136/heartjnl-2021-320729</pub-id>
</citation>
</ref>
<ref id="B108">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liebal</surname>
<given-names>U. W.</given-names>
</name>
<name>
<surname>Phan</surname>
<given-names>A. N. T.</given-names>
</name>
<name>
<surname>Sudhakar</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Raman</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Blank</surname>
<given-names>L. M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Machine learning applications for mass spectrometry-based metabolomics</article-title>. <source>Metabolites</source> <volume>10</volume> (<issue>6</issue>), <fpage>243</fpage>. <pub-id pub-id-type="doi">10.3390/metabo10060243</pub-id>
</citation>
</ref>
<ref id="B109">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>HSP90 inhibitor NVP-AUY922 induces cell apoptosis by disruption of the survivin in papillary thyroid carcinoma cells</article-title>. <source>Biochem. Biophys. Res. Commun.</source> <volume>487</volume> (<issue>2</issue>), <fpage>313</fpage>&#x2013;<lpage>319</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbrc.2017.04.056</pub-id>
</citation>
</ref>
<ref id="B110">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lundberg</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S.-I.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>A unified approach to interpreting model predictions</article-title>. <source>Adv. neural Inf. Process. Syst.</source>, <fpage>4768</fpage>&#x2013;<lpage>4777</lpage>. <pub-id pub-id-type="doi">10.48550/arXiv.1705.07874</pub-id>
</citation>
</ref>
<ref id="B111">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Proteomics study of serum exosomes from papillary thyroid cancer patients</article-title>. <source>Endocr. Relat. Cancer</source> <volume>25</volume> (<issue>10</issue>), <fpage>879</fpage>&#x2013;<lpage>891</lpage>. <pub-id pub-id-type="doi">10.1530/ERC-17-0547</pub-id>
</citation>
</ref>
<ref id="B112">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ma</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Principal component analysis based methods in bioinformatics studies</article-title>. <source>Brief. Bioinform</source> <volume>12</volume> (<issue>6</issue>), <fpage>714</fpage>&#x2013;<lpage>722</lpage>. <pub-id pub-id-type="doi">10.1093/bib/bbq090</pub-id>
</citation>
</ref>
<ref id="B113">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Manochkumar</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cherukuri</surname>
<given-names>A. K.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Almansour</surname>
<given-names>A. I.</given-names>
</name>
<name>
<surname>Ramamoorthy</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Efferth</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A critical review of machine-learning for &#x201c;multi-omics&#x201d; marine metabolite datasets</article-title>. <source>Comput. Biol. Med.</source> <volume>165</volume>, <fpage>107425</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.107425</pub-id>
</citation>
</ref>
<ref id="B114">
<citation citation-type="thesis">
<person-group person-group-type="author">
<name>
<surname>Markowetz</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2001</year>). <source>Support vector machines in bioinformatics</source> (<publisher-loc>Heidelberg</publisher-loc>: <publisher-name>University of Heidelberg</publisher-name>). <comment>
<italic>Master&#x27;s thesis</italic>
</comment>.</citation>
</ref>
<ref id="B115">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marsee</surname>
<given-names>D. K.</given-names>
</name>
<name>
<surname>Venkateswaran</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Tao</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Vadysirisack</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Vandre</surname>
<given-names>D. D.</given-names>
</name>
<etal/>
</person-group> (<year>2004</year>). <article-title>Inhibition of heat shock protein 90, a novel RET/PTC1-associated protein, increases radioiodide accumulation in thyroid cells</article-title>. <source>J. Biol. Chem.</source> <volume>279</volume> (<issue>42</issue>), <fpage>43990</fpage>&#x2013;<lpage>43997</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.M407503200</pub-id>
</citation>
</ref>
<ref id="B116">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Martinez-Aguilar</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Clifton-Bligh</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Molloy</surname>
<given-names>M. P.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>A multiplexed, targeted mass spectrometry assay of the S100 protein family uncovers the isoform-specific expression in thyroid tumours</article-title>. <source>BMC Cancer</source> <volume>15</volume>, <fpage>199</fpage>. <pub-id pub-id-type="doi">10.1186/s12885-015-1217-x</pub-id>
</citation>
</ref>
<ref id="B117">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Martinez-Aguilar</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Clifton-Bligh</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Molloy</surname>
<given-names>M. P.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Proteomics of thyroid tumours provides new insights into their molecular composition and changes associated with malignancy</article-title>. <source>Sci. Rep.</source> <volume>6</volume>, <fpage>23660</fpage>. <pub-id pub-id-type="doi">10.1038/srep23660</pub-id>
</citation>
</ref>
<ref id="B118">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mavrogeorgis</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Mischak</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Latosinska</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Vlahou</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Schanstra</surname>
<given-names>J. P.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Uniform manifold approximation and projection-based assessment of chronic kidney disease aetiologies based on urinary peptidomics</article-title>. <comment>medRxiv</comment>. <pub-id pub-id-type="doi">10.1101/2023.05.19.23290228</pub-id>
</citation>
</ref>
<ref id="B119">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McInnes</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Healy</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Saul</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Gro&#xdf;berger</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>UMAP: uniform manifold approximation and projection</article-title>. <source>J. Open Source Softw.</source> <volume>3</volume> (<issue>29</issue>), <fpage>861</fpage>. <pub-id pub-id-type="doi">10.21105/joss.00861</pub-id>
</citation>
</ref>
<ref id="B120">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mesari&#x107;</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>&#x160;ebalj</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Decision trees for predicting the academic success of students</article-title>. <source>Croat. Operational Res. Rev.</source> <volume>7</volume> (<issue>2</issue>), <fpage>367</fpage>&#x2013;<lpage>388</lpage>. <pub-id pub-id-type="doi">10.17535/crorr.2016.0025</pub-id>
</citation>
</ref>
<ref id="B121">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arzyeh</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Tristan</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Peter</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Andrew</surname>
<given-names>L B.</given-names>
</name>
<name>
<surname>Irene</surname>
<given-names>Y C.</given-names>
</name>
<name>
<surname>Rajesh</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A review of challenges and opportunities in machine learning for health</article-title>. <source>AMIA Jt. Summits Transl. Sci.</source>, <fpage>191</fpage>&#x2013;<lpage>200</lpage>. <pub-id pub-id-type="doi">10.48550/arXiv.1806.00388</pub-id>
</citation>
</ref>
<ref id="B122">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Migisha</surname>
<given-names>N. P. V.</given-names>
</name>
<name>
<surname>Heo</surname>
<given-names>C. E.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>J. Y.</given-names>
</name>
<name>
<surname>Chae</surname>
<given-names>S. Y.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Vu</surname>
<given-names>H. M.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Mass spectrometry-based proteomics of single cells and organoids: the new generation of cancer research</article-title>. <source>TrAC Trends Anal. Chem.</source> <volume>130</volume>, <fpage>116005</fpage>. <pub-id pub-id-type="doi">10.1016/j.trac.2020.116005</pub-id>
</citation>
</ref>
<ref id="B123">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mirza</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Chung</surname>
<given-names>N. C.</given-names>
</name>
<name>
<surname>Ping</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Machine learning and integrative analysis of biomedical big data</article-title>. <source>Genes. (Basel)</source> <volume>10</volume> (<issue>2</issue>), <fpage>87</fpage>. <pub-id pub-id-type="doi">10.3390/genes10020087</pub-id>
</citation>
</ref>
<ref id="B124">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mischak</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Allmaier</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Apweiler</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Attwood</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Baumann</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Benigni</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>Recommendations for biomarker identification and qualification in clinical proteomics</article-title>. <source>Sci. Transl. Med.</source> <volume>2</volume> (<issue>46</issue>), <fpage>46ps42</fpage>. <pub-id pub-id-type="doi">10.1126/scitranslmed.3001249</pub-id>
</citation>
</ref>
<ref id="B125">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Mohammadzadeh</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Fran&#xe7;oise</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Gouiff&#xe8;s</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Caramiaux</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2024</year>). &#x201c;<article-title>Studying collaborative interactive machine teaching in image classification</article-title>,&#x201d; in <conf-name>Proceedings of the 29th International Conference on Intelligent User Interfaces</conf-name>, <conf-loc>USA</conf-loc>, <conf-date>January 13 - 16, 2004</conf-date>, <fpage>195</fpage>&#x2013;<lpage>208</lpage>. <pub-id pub-id-type="doi">10.1145/3640543.3645204</pub-id>
</citation>
</ref>
<ref id="B126">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mou</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Application of machine learning in spatial proteomics</article-title>. <source>J. Chem. Inf. Model.</source> <volume>62</volume> (<issue>23</issue>), <fpage>5875</fpage>&#x2013;<lpage>5895</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.2c01161</pub-id>
</citation>
</ref>
<ref id="B127">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mullur</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y. Y.</given-names>
</name>
<name>
<surname>Brent</surname>
<given-names>G. A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Thyroid hormone regulation of metabolism</article-title>. <source>Physiol. Rev.</source> <volume>94</volume> (<issue>2</issue>), <fpage>355</fpage>&#x2013;<lpage>382</lpage>. <pub-id pub-id-type="doi">10.1152/physrev.00030.2013</pub-id>
</citation>
</ref>
<ref id="B128">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nalluri</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pentela</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Eluri</surname>
<given-names>N. R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A scalable tree boosting system:XG boost</article-title>. <source>Int. J. Res. Stud. Sci. Eng. Technol.</source> <volume>7</volume> (<issue>12</issue>), <fpage>36</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.22259/2349-476X.0712005</pub-id>
</citation>
</ref>
<ref id="B129">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Navada</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ansari</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>Patil</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sonkamble</surname>
<given-names>B. A.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Overview of use of decision tree algorithms in machine learning</article-title>. <source>IEEE Control Syst. Graduate Res. Colloquium</source>, <fpage>37</fpage>&#x2013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.1109/ICSGRC.2011.5991826</pub-id>
</citation>
</ref>
<ref id="B130">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ng</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Masarone</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Watson</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Barnes</surname>
<given-names>M. R.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>The benefits and pitfalls of machine learning for biomarker discovery</article-title>. <source>Cell. Tissue Res.</source> <volume>394</volume> (<issue>1</issue>), <fpage>17</fpage>&#x2013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1007/s00441-023-03816-z</pub-id>
</citation>
</ref>
<ref id="B131">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ngan</surname>
<given-names>H.-L.</given-names>
</name>
<name>
<surname>Lam</surname>
<given-names>K.-Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Machine learning facilitates the application of mass spectrometry-based metabolomics to clinical analysis: a review of early diagnosis of high mortality rate cancers</article-title>. <source>TrAC Trends Anal. Chem.</source> <volume>168</volume>, <fpage>117333</fpage>. <pub-id pub-id-type="doi">10.1016/j.trac.2023.117333</pub-id>
</citation>
</ref>
<ref id="B132">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nicholson</surname>
<given-names>J. K.</given-names>
</name>
<name>
<surname>Lindon</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Holmes</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>&#x27;Metabonomics&#x27;: understanding the metabolic responses of living systems to pathophysiological stimuli via multivariate statistical analysis of biological NMR spectroscopic data</article-title>. <source>Xenobiotica</source> <volume>29</volume> (<issue>11</issue>), <fpage>1181</fpage>&#x2013;<lpage>1189</lpage>. <pub-id pub-id-type="doi">10.1080/004982599238047</pub-id>
</citation>
</ref>
<ref id="B133">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nipp</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Elsner</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Balluff</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Meding</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sarioglu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ueffing</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>S100-A10, thioredoxin, and S100-A6 as biomarkers of papillary thyroid carcinoma with lymph node metastasis identified by MALDI imaging</article-title>. <source>J. Mol. Med. Berl.</source> <volume>90</volume> (<issue>2</issue>), <fpage>163</fpage>&#x2013;<lpage>174</lpage>. <pub-id pub-id-type="doi">10.1007/s00109-011-0815-6</pub-id>
</citation>
</ref>
<ref id="B134">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Omur</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Baran</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>An update on molecular biology of thyroid cancers</article-title>. <source>Crit. Rev. Oncology/Hematology</source> <volume>90</volume> (<issue>3</issue>), <fpage>233</fpage>&#x2013;<lpage>252</lpage>. <pub-id pub-id-type="doi">10.1016/j.critrevonc.2013.12.007</pub-id>
</citation>
</ref>
<ref id="B135">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pan</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Cluster analysis:unsupervised learning via supervised learning with a non-convex penalty</article-title>. <source>J. Mach. Learn. Res.</source> <volume>14</volume> (<issue>7</issue>), <fpage>1865</fpage>.</citation>
</ref>
<ref id="B136">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paron</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Scaloni</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pines</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bachi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>F. T.</given-names>
</name>
<name>
<surname>Puppin</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2003</year>). <article-title>Nuclear localization of Galectin-3 in transformed thyroid cells: a role in transcriptional regulation</article-title>. <source>Biochem. Biophys. Res. Commun.</source> <volume>302</volume> (<issue>3</issue>), <fpage>545</fpage>&#x2013;<lpage>553</lpage>. <pub-id pub-id-type="doi">10.1016/s0006-291x(03)00151-7</pub-id>
</citation>
</ref>
<ref id="B137">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pearl</surname>
<given-names>L. H.</given-names>
</name>
<name>
<surname>Prodromou</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Workman</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>The Hsp90 molecular chaperone: an open and shut case for treatment</article-title>. <source>Biochem. J.</source> <volume>410</volume> (<issue>3</issue>), <fpage>439</fpage>&#x2013;<lpage>453</lpage>. <pub-id pub-id-type="doi">10.1042/BJ20071640</pub-id>
</citation>
</ref>
<ref id="B138">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perakakis</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Yazdani</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Karniadakis</surname>
<given-names>G. E.</given-names>
</name>
<name>
<surname>Mantzoros</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Omics, big data and machine learning as tools to propel understanding of biological mechanisms and to discover novel diagnostics and therapeutics</article-title>. <source>Metabolism</source> <volume>87</volume>, <fpage>A1-A9</fpage>&#x2013;<lpage>A9</lpage>. <pub-id pub-id-type="doi">10.1016/j.metabol.2018.08.002</pub-id>
</citation>
</ref>
<ref id="B139">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Picard</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Felsberg</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Langini</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Stachura</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Macas</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Integrative multi-omics reveals two biologically distinct groups of pilocytic astrocytoma</article-title>. <source>Acta Neuropathol.</source> <volume>146</volume> (<issue>4</issue>), <fpage>551</fpage>&#x2013;<lpage>564</lpage>. <pub-id pub-id-type="doi">10.1007/s00401-023-02626-5</pub-id>
</citation>
</ref>
<ref id="B140">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qian</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Xue</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Mass spectrometry-based proteomics of epithelial ovarian cancers: a clinical perspective</article-title>. <source>Mol. Cell. Proteomics</source> <volume>22</volume> (<issue>7</issue>), <fpage>100578</fpage>. <pub-id pub-id-type="doi">10.1016/j.mcpro.2023.100578</pub-id>
</citation>
</ref>
<ref id="B141">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qiu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Small molecule metabolites: discovery of biomarkers and therapeutic targets</article-title>. <source>Signal Transduct. Target Ther.</source> <volume>8</volume> (<issue>1</issue>), <fpage>132</fpage>. <pub-id pub-id-type="doi">10.1038/s41392-023-01399-3</pub-id>
</citation>
</ref>
<ref id="B142">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Quazi</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Artificial intelligence and machine learning in precision and genomic medicine</article-title>. <source>Med. Oncol.</source> <volume>39</volume> (<issue>8</issue>), <fpage>120</fpage>. <pub-id pub-id-type="doi">10.1007/s12032-022-01711-1</pub-id>
</citation>
</ref>
<ref id="B143">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Randall</surname>
<given-names>L. V.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>D. H.</given-names>
</name>
<name>
<surname>Abdelrazig</surname>
<given-names>S. M. A.</given-names>
</name>
<name>
<surname>Bollard</surname>
<given-names>N. J.</given-names>
</name>
<name>
<surname>Hemingway-Arnold</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hyde</surname>
<given-names>R. M.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Predicting lameness in dairy cattle using untargeted liquid chromatography-mass spectrometry-based metabolomics and machine learning</article-title>. <source>J. Dairy Sci.</source> <volume>106</volume>, <fpage>7033</fpage>&#x2013;<lpage>7042</lpage>. <pub-id pub-id-type="doi">10.3168/jds.2022-23118</pub-id>
</citation>
</ref>
<ref id="B144">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reel</surname>
<given-names>P. S.</given-names>
</name>
<name>
<surname>Reel</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Pearson</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Trucco</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Jefferson</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Using machine learning approaches for multi-omics data analysis: a review</article-title>. <source>Biotechnol. Adv.</source> <volume>49</volume>, <fpage>107739</fpage>. <pub-id pub-id-type="doi">10.1016/j.biotechadv.2021.107739</pub-id>
</citation>
</ref>
<ref id="B145">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Remeseiro</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Bolon-Canedo</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A review of feature selection methods in medical applications</article-title>. <source>Comput. Biol. Med.</source> <volume>112</volume>, <fpage>103375</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2019.103375</pub-id>
</citation>
</ref>
<ref id="B146">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reska</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Czajkowski</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Jurczuk</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Boldak</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Kwedlo</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Bauer</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Integration of solutions and services for multi-omics data analysis towards personalized medicine</article-title>. <source>Biocybern. Biomed. Eng.</source> <volume>41</volume> (<issue>4</issue>), <fpage>1646</fpage>&#x2013;<lpage>1663</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbe.2021.10.005</pub-id>
</citation>
</ref>
<ref id="B147">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ringner</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>What is principal component analysis?</article-title> <source>Nat. Biotechnol.</source> <volume>26</volume> (<issue>3</issue>), <fpage>303</fpage>&#x2013;<lpage>304</lpage>. <pub-id pub-id-type="doi">10.1038/nbt0308-303</pub-id>
</citation>
</ref>
<ref id="B148">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nishimura</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Yokose</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Mukai</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>S-100 protein is a differentiation marker in thyroid carcinoma of follicular cell origin:an immunohistochemical study</article-title>. <source>Pathol. Int.</source> <volume>47</volume> (<issue>10</issue>), <fpage>673</fpage>&#x2013;<lpage>679</lpage>. <pub-id pub-id-type="doi">10.1111/j.1440-1827.1997.tb04440.x</pub-id>
</citation>
</ref>
<ref id="B149">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roca</surname>
<given-names>C. P.</given-names>
</name>
<name>
<surname>Burton</surname>
<given-names>O. T.</given-names>
</name>
<name>
<surname>Neumann</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tareen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Whyte</surname>
<given-names>C. E.</given-names>
</name>
<name>
<surname>Gergelits</surname>
<given-names>V.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>A cross entropy test allows quantitative statistical comparison of t-SNE and UMAP representations</article-title>. <source>Cell. Rep. Methods</source> <volume>3</volume> (<issue>1</issue>), <fpage>100390</fpage>. <pub-id pub-id-type="doi">10.1016/j.crmeth.2022.100390</pub-id>
</citation>
</ref>
<ref id="B150">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rosenberger</surname>
<given-names>F. A.</given-names>
</name>
<name>
<surname>Thielert</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Strauss</surname>
<given-names>M. T.</given-names>
</name>
<name>
<surname>Schweizer</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ammar</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Madler</surname>
<given-names>S. C.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Spatial single-cell mass spectrometry defines zonation of the hepatocyte proteome</article-title>. <source>Nat. Methods</source> <volume>20</volume> (<issue>10</issue>), <fpage>1530</fpage>&#x2013;<lpage>1536</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-023-02007-6</pub-id>
</citation>
</ref>
<ref id="B151">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sainburg</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>McInnes</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Gentner</surname>
<given-names>T. Q.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Parametric UMAP embeddings for representation and semisupervised learning</article-title>. <source>Neural comput.</source> <volume>33</volume> (<issue>11</issue>), <fpage>2881</fpage>&#x2013;<lpage>2907</lpage>. <pub-id pub-id-type="doi">10.1162/neco_a_01434</pub-id>
</citation>
</ref>
<ref id="B152">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sarker</surname>
<given-names>I. H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Machine learning: algorithms, real-world applications and research directions</article-title>. <source>SN Comput. Sci.</source> <volume>2</volume> (<issue>3</issue>), <fpage>160</fpage>. <pub-id pub-id-type="doi">10.1007/s42979-021-00592-x</pub-id>
</citation>
</ref>
<ref id="B153">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schneider</surname>
<given-names>D. F.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>New developments in the diagnosis and treatment of thyroid cancer</article-title>. <source>CA Cancer J. Clin.</source> <volume>63</volume> (<issue>6</issue>), <fpage>374</fpage>&#x2013;<lpage>394</lpage>. <pub-id pub-id-type="doi">10.3322/caac.21195</pub-id>
</citation>
</ref>
<ref id="B154">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Searle</surname>
<given-names>B. C.</given-names>
</name>
<name>
<surname>Swearingen</surname>
<given-names>K. E.</given-names>
</name>
<name>
<surname>Barnes</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Gessulat</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kuster</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Generating high quality libraries for DIA MS with empirically corrected peptide predictions</article-title>. <source>Nat. Commun.</source> <volume>11</volume> (<issue>1</issue>), <fpage>1548</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-020-15346-1</pub-id>
</citation>
</ref>
<ref id="B155">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singh</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Giri</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Comparative study ID3, cart and C4. 5 decision tree algorithm:a survey</article-title>. <source>Int. J. Adv. Inf. Sci. Technol. (IJAIST)</source> <volume>27</volume> (<issue>27</issue>), <fpage>97</fpage>&#x2013;<lpage>103</lpage>. <pub-id pub-id-type="doi">10.15693/ijaist/2014.v3i7.47-52</pub-id>
</citation>
</ref>
<ref id="B156">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Weathers</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Lewis</surname>
<given-names>S. L.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>An overview of clinical machine learning applications in neurology</article-title>. <source>J. Neurological Sci.</source> <volume>455</volume>, <fpage>122799</fpage>. <pub-id pub-id-type="doi">10.1016/j.jns.2023.122799</pub-id>
</citation>
</ref>
<ref id="B157">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sofia</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sravani</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>K Lakshmi</surname>
<given-names>D. C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Anomalous development of thyroid gland; a cadaveric study in coastal population of Andhra Pradesh</article-title>. <source>Indian J. Clin. Anat. Physiology</source> <volume>6</volume> (<issue>2</issue>), <fpage>220</fpage>&#x2013;<lpage>223</lpage>. <pub-id pub-id-type="doi">10.18231/j.ijcap.2019.049</pub-id>
</citation>
</ref>
<ref id="B158">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sofiadis</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Dinets</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Orre</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Branca</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Juhlin</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Foukakis</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>Proteomic study of thyroid tumors reveals frequent up-regulation of the Ca2&#x2b; -binding protein S100A6 in papillary thyroid carcinoma</article-title>. <source>Thyroid</source> <volume>20</volume> (<issue>10</issue>), <fpage>1067</fpage>&#x2013;<lpage>1076</lpage>. <pub-id pub-id-type="doi">10.1089/thy.2009.0400</pub-id>
</citation>
</ref>
<ref id="B159">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Speiser</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Miller</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Tooze</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ip</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A comparison of random forest variable selection methods for classification prediction modeling</article-title>. <source>Expert Syst. Appl.</source> <volume>134</volume>, <fpage>93</fpage>&#x2013;<lpage>101</lpage>. <pub-id pub-id-type="doi">10.1016/j.eswa.2019.05.028</pub-id>
</citation>
</ref>
<ref id="B160">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Steven</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Random forest</article-title>. <source>J. Insur. Med.</source> <volume>47</volume> (<issue>1</issue>), <fpage>31</fpage>&#x2013;<lpage>39</lpage>. <pub-id pub-id-type="doi">10.17849/insm-47-01-31-39.1</pub-id>
</citation>
</ref>
<ref id="B161">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sugimoto</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kawakami</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Robert</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Soga</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tomita</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Bioinformatics tools for mass spectroscopy-based metabolomic data processing and analysis</article-title>. <source>Curr. Bioinforma.</source> <volume>7</volume> (<issue>1</issue>), <fpage>96</fpage>&#x2013;<lpage>108</lpage>. <pub-id pub-id-type="doi">10.2174/157489312799304431</pub-id>
</citation>
</ref>
<ref id="B162">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Salerno</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Sujimongkol</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Use of machine learning to assess the prognostic utility of radiomic features for in-hospital COVID-19 mortality</article-title>. <source>Sci. Rep.</source> <volume>13</volume> (<issue>1</issue>), <fpage>7318</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-023-34559-0</pub-id>
</citation>
</ref>
<ref id="B163">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Selvarajan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Artificial intelligence defines protein-based classification of thyroid nodules</article-title>. <source>Cell. Discov.</source> <volume>8</volume> (<issue>1</issue>), <fpage>85</fpage>. <pub-id pub-id-type="doi">10.1038/s41421-022-00442-x</pub-id>
</citation>
</ref>
<ref id="B164">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>A diagnostic protein assay for differentiating follicular thyroid adenoma and carcinoma</article-title>. <comment>medRxiv</comment>. <pub-id pub-id-type="doi">10.1101/2024.09.26.24314403</pub-id>
</citation>
</ref>
<ref id="B165">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Surman</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wilczak</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Jankowska</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Skupien-Rabian</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Przybylo</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Shotgun proteomics of thyroid carcinoma exosomes - insight into the role of exosomal proteins in carcinogenesis and thyroid homeostasis</article-title>. <source>Biochim. Biophys. Acta Gen. Subj.</source> <volume>1868</volume> (<issue>9</issue>), <fpage>130672</fpage>. <pub-id pub-id-type="doi">10.1016/j.bbagen.2024.130672</pub-id>
</citation>
</ref>
<ref id="B166">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Khateeb</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Recent advances of deep learning in bioinformatics and computational biology</article-title>. <source>Front. Genet.</source> <volume>10</volume>, <fpage>214</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2019.00214</pub-id>
</citation>
</ref>
<ref id="B167">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Torres-Cabala</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Panizo-Santos</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Krutzsch</surname>
<given-names>H. C.</given-names>
</name>
<name>
<surname>Barazi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Namba</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sakaguchi</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2004</year>). <article-title>Differential expression of S100C in thyroid lesions</article-title>. <source>Int. J. Surg. Pathol.</source> <volume>12</volume> (<issue>2</issue>), <fpage>107</fpage>&#x2013;<lpage>115</lpage>. <pub-id pub-id-type="doi">10.1177/106689690401200203</pub-id>
</citation>
</ref>
<ref id="B168">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Torun</surname>
<given-names>F. M.</given-names>
</name>
<name>
<surname>Virreira Winter</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Doll</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Riese</surname>
<given-names>F. M.</given-names>
</name>
<name>
<surname>Vorobyev</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mueller-Reif</surname>
<given-names>J. B.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Transparent exploration of machine learning for biomarker discovery from proteomics and omics data</article-title>. <source>J. Proteome Res.</source> <volume>22</volume> (<issue>2</issue>), <fpage>359</fpage>&#x2013;<lpage>367</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jproteome.2c00473</pub-id>
</citation>
</ref>
<ref id="B169">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vanderpump</surname>
<given-names>M. P.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The epidemiology of thyroid disease</article-title>. <source>Br. Med. Bull.</source> <volume>99</volume>, <fpage>39</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1093/bmb/ldr030</pub-id>
</citation>
</ref>
<ref id="B170">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Venkatesh</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Anuradha</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A review of feature selection and its methods</article-title>. <source>Cybern. Inf. Technol.</source> <volume>19</volume> (<issue>1</issue>), <fpage>3</fpage>&#x2013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.2478/cait-2019-0001</pub-id>
</citation>
</ref>
<ref id="B171">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Wald</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Khoshgoftaar</surname>
<given-names>T. M.</given-names>
</name>
<name>
<surname>Napolitano</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2013</year>). &#x201c;<article-title>How the choice of wrapper learner and performance metric affects subset evaluation</article-title>,&#x201d; in <conf-name>2013 IEEE 25th International Conference on Tools with Artificial Intelligence</conf-name>, <conf-date>4-6 Nov. 2013</conf-date>, <fpage>426</fpage>&#x2013;<lpage>432</lpage>. <pub-id pub-id-type="doi">10.1109/ictai.2013.70</pub-id>
</citation>
</ref>
<ref id="B172">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Walsh</surname>
<given-names>J. P.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Managing thyroid disease in general practice</article-title>. <source>Med. J. Aust.</source> <volume>205</volume> (<issue>4</issue>), <fpage>179</fpage>&#x2013;<lpage>184</lpage>. <pub-id pub-id-type="doi">10.5694/mja16.00545</pub-id>
</citation>
</ref>
<ref id="B173">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2024b</year>). <article-title>Risk of papillary thyroid carcinoma and nodular goiter associated with exposure to semi-volatile organic compounds: a multi-pollutant assessment based on machine learning algorithms</article-title>. <source>Sci. Total Environ.</source> <volume>915</volume>, <fpage>169962</fpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2024.169962</pub-id>
</citation>
</ref>
<ref id="B174">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H. N.</given-names>
</name>
<name>
<surname>Cui</surname>
<given-names>X. Q.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>S. Y.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>S100A1 is a potential biomarker for papillary thyroid carcinoma diagnosis and prognosis</article-title>. <source>J. Cancer</source> <volume>12</volume> (<issue>19</issue>), <fpage>5760</fpage>&#x2013;<lpage>5771</lpage>. <pub-id pub-id-type="doi">10.7150/jca.51855</pub-id>
</citation>
</ref>
<ref id="B175">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Qiu</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2024a</year>). <article-title>Development and validation of prediction models for papillary thyroid cancer structural recurrence using machine learning approaches</article-title>. <source>BMC Cancer</source> <volume>24</volume> (<issue>1</issue>), <fpage>427</fpage>. <pub-id pub-id-type="doi">10.1186/s12885-024-12146-4</pub-id>
</citation>
</ref>
<ref id="B176">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Gimple</surname>
<given-names>R. C.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2023b</year>). <article-title>Integrative multi-omics approaches to explore immune cell functions: challenges and opportunities</article-title>. <source>iScience</source> <volume>26</volume> (<issue>4</issue>), <fpage>106359</fpage>. <pub-id pub-id-type="doi">10.1016/j.isci.2023.106359</pub-id>
</citation>
</ref>
<ref id="B177">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Power of metabolomics in diagnosis and biomarker discovery of hepatocellular carcinoma</article-title>. <source>Hepatology</source> <volume>57</volume> (<issue>5</issue>), <fpage>2072</fpage>&#x2013;<lpage>2077</lpage>. <pub-id pub-id-type="doi">10.1002/hep.26130</pub-id>
</citation>
</ref>
<ref id="B178">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Shima</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2022b</year>). <article-title>Rapid diagnosis of papillary thyroid carcinoma with machine learning and probe electrospray ionization mass spectrometry</article-title>. <source>J. Mass Spectrom.</source> <volume>57</volume> (<issue>6</issue>), <fpage>e4831</fpage>. <pub-id pub-id-type="doi">10.1002/jms.4831</pub-id>
</citation>
</ref>
<ref id="B179">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Di</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2022c</year>). <article-title>Fast classification of thyroid nodules with ultrasound guided-fine needle biopsy samples and machine learning</article-title>. <source>Appl. Sci.</source> <volume>12</volume> (<issue>11</issue>), <fpage>5364</fpage>. <pub-id pub-id-type="doi">10.3390/app12115364</pub-id>
</citation>
</ref>
<ref id="B180">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lih</surname>
<given-names>T. M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Kuczler</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2022a</year>). <article-title>Optimized data-independent acquisition approach for proteomic analysis at single-cell level</article-title>. <source>Clin. Proteomics</source> <volume>19</volume> (<issue>1</issue>), <fpage>24</fpage>. <pub-id pub-id-type="doi">10.1186/s12014-022-09359-9</pub-id>
</citation>
</ref>
<ref id="B181">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Lyu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2024c</year>). <article-title>An individualized protein-based prognostic model to stratify pediatric patients with papillary thyroid carcinoma</article-title>. <source>Nat. Commun.</source> <volume>15</volume> (<issue>1</issue>), <fpage>3560</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-024-47926-w</pub-id>
</citation>
</ref>
<ref id="B182">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Xiong</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2023a</year>). <article-title>Advances in mass spectrometry-based multi-scale metabolomic methodologies and their applications in biological and clinical investigations</article-title>. <source>Sci. Bull. (Beijing)</source> <volume>68</volume>, <fpage>2268</fpage>&#x2013;<lpage>2284</lpage>. <pub-id pub-id-type="doi">10.1016/j.scib.2023.08.047</pub-id>
</citation>
</ref>
<ref id="B183">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wekesa</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Kimwele</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A review of multi-omics data integration through deep learning approaches for disease diagnosis, prognosis, and treatment</article-title>. <source>Front. Genet.</source> <volume>14</volume>, <fpage>1199087</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2023.1199087</pub-id>
</citation>
</ref>
<ref id="B184">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>White</surname>
<given-names>P. T.</given-names>
</name>
<name>
<surname>Subramanian</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Gallagher</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Novel HSP90 inhibitors effectively target functions of thyroid cancer stem cell preventing migration and invasion</article-title>. <source>Surgery</source> <volume>159</volume> (<issue>1</issue>), <fpage>142</fpage>&#x2013;<lpage>151</lpage>. <pub-id pub-id-type="doi">10.1016/j.surg.2015.07.050</pub-id>
</citation>
</ref>
<ref id="B185">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wickenberg</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mercier</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Yap</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Walker</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Baker</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>LaPointe</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Hsp90 inhibition leads to an increase in surface expression of multiple immunological receptors in cancer cells</article-title>. <source>Front. Mol. Biosci.</source> <volume>11</volume>, <fpage>1334876</fpage>. <pub-id pub-id-type="doi">10.3389/fmolb.2024.1334876</pub-id>
</citation>
</ref>
<ref id="B186">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wojakowska</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Chekan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Marczak</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Polanski</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Lange</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Pietrowska</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Detection of metabolites discriminating subtypes of thyroid cancer: molecular profiling of FFPE samples using the GC/MS approach</article-title>. <source>Mol. Cell. Endocrinol.</source> <volume>417</volume>, <fpage>149</fpage>&#x2013;<lpage>157</lpage>. <pub-id pub-id-type="doi">10.1016/j.mce.2015.09.021</pub-id>
</citation>
</ref>
<ref id="B187">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wojakowska</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cole</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Chekan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bednarczyk</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Maksymiak</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Oczko-Wojciechowska</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Discrimination of papillary thyroid cancer from non-cancerous thyroid tissue based on lipid profiling by mass spectrometry imaging</article-title>. <source>Endokrynol. Pol.</source> <volume>69</volume> (<issue>1</issue>), <fpage>2</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.5603/EP.a2018.0003</pub-id>
</citation>
</ref>
<ref id="B188">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ws</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>What is a support vector machine?</article-title> <source>Nat. Biotechnol.</source> <volume>24</volume> (<issue>12</issue>), <fpage>1565</fpage>&#x2013;<lpage>1557</lpage>. <pub-id pub-id-type="doi">10.1038/nbt1206-1565</pub-id>
</citation>
</ref>
<ref id="B189">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xi</surname>
<given-names>N. M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Improving the diagnosis of thyroid cancer by machine learning and clinical data</article-title>. <source>Sci. Rep.</source> <volume>12</volume> (<issue>1</issue>), <fpage>11143</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-022-15342-z</pub-id>
</citation>
</ref>
<ref id="B190">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiao</surname>
<given-names>J. F.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ressom</surname>
<given-names>H. W.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Metabolite identification and quantitation in LC-MS/MS-based metabolomics</article-title>. <source>Trends Anal. Chem.</source> <volume>32</volume>, <fpage>1</fpage>&#x2013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1016/j.trac.2011.08.009</pub-id>
</citation>
</ref>
<ref id="B191">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Integrating network pharmacology and metabolomics to elucidate the mechanism of action of Huang Qin decoction for treament of diabetic liver injury</article-title>. <source>Front. Pharmacol.</source> <volume>13</volume>, <fpage>899043</fpage>. <pub-id pub-id-type="doi">10.3389/fphar.2022.899043</pub-id>
</citation>
</ref>
<ref id="B192">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yadav</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Transformative frontiers: a comprehensive review of emerging technologies in modern healthcare</article-title>. <source>Cureus</source> <volume>16</volume>, <fpage>e56538</fpage>. <pub-id pub-id-type="doi">10.7759/cureus.56538</pub-id>
</citation>
</ref>
<ref id="B193">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Gong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Dimensionality reduction by UMAP reinforces sample heterogeneity analysis in bulk transcriptomic data</article-title>. <source>Cell. Rep.</source> <volume>36</volume> (<issue>4</issue>), <fpage>109442</fpage>. <pub-id pub-id-type="doi">10.1016/j.celrep.2021.109442</pub-id>
</citation>
</ref>
<ref id="B194">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yao</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Serum metabolic profiling and features of papillary thyroid carcinoma and nodular goiter</article-title>. <source>Mol. Biosyst.</source> <volume>7</volume> (<issue>9</issue>), <fpage>2608</fpage>&#x2013;<lpage>2614</lpage>. <pub-id pub-id-type="doi">10.1039/c1mb05029j</pub-id>
</citation>
</ref>
<ref id="B195">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Feider</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Nagi</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Carter</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Suliburk</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2017a</year>). <article-title>Detection of metastatic breast and thyroid cancer in lymph nodes by desorption electrospray ionization mass spectrometry imaging</article-title>. <source>J. Am. Soc. Mass Spectrom.</source> <volume>28</volume> (<issue>6</issue>), <fpage>1166</fpage>&#x2013;<lpage>1174</lpage>. <pub-id pub-id-type="doi">10.1007/s13361-016-1570-2</pub-id>
</citation>
</ref>
<ref id="B196">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zong</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2017b</year>). <article-title>Learning k for kNN Classification</article-title>. <source>ACM Trans. Intelligent Syst. Technol.</source> <volume>8</volume> (<issue>3</issue>), <fpage>1</fpage>&#x2013;<lpage>19</lpage>. <pub-id pub-id-type="doi">10.1145/2990508</pub-id>
</citation>
</ref>
<ref id="B197">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>V. C.</given-names>
</name>
<name>
<surname>Rong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Deep convolutional neural networks in thyroid disease detection: a multi-classification comparison by ultrasonography and computed tomography</article-title>. <source>Comput. Methods Programs Biomed.</source> <volume>220</volume>, <fpage>106823</fpage>. <pub-id pub-id-type="doi">10.1016/j.cmpb.2022.106823</pub-id>
</citation>
</ref>
<ref id="B198">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>W. H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Exosomes: biogenesis, biologic function and clinical potential</article-title>. <source>Cell. Biosci.</source> <volume>9</volume>, <fpage>19</fpage>. <pub-id pub-id-type="doi">10.1186/s13578-019-0282-2</pub-id>
</citation>
</ref>
<ref id="B199">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2022a</year>). <article-title>Molecular network strategy in multi-omics and mass spectrometry imaging</article-title>. <source>Curr. Opin. Chem. Biol.</source> <volume>70</volume>, <fpage>102199</fpage>. <pub-id pub-id-type="doi">10.1016/j.cbpa.2022.102199</pub-id>
</citation>
</ref>
<ref id="B200">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2022b</year>). <article-title>Predicting the risk of nodular thyroid disease in coal miners based on different machine learning models</article-title>. <source>Front. Med. (Lausanne)</source> <volume>9</volume>, <fpage>1037944</fpage>. <pub-id pub-id-type="doi">10.3389/fmed.2022.1037944</pub-id>
</citation>
</ref>
<ref id="B201">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Development of data-independent acquisition workflows for metabolomic analysis on a quadrupole-orbitrap platform</article-title>. <source>Talanta</source> <volume>164</volume>, <fpage>128</fpage>&#x2013;<lpage>136</lpage>. <pub-id pub-id-type="doi">10.1016/j.talanta.2016.11.048</pub-id>
</citation>
</ref>
<ref id="B202">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Feature screening of radioactive iodine-refractory thyroid carcinoma based on proteomics analysis and artificial intelligence</article-title>. <source>SSRN</source>. <pub-id pub-id-type="doi">10.2139/ssrn.4865048</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>