<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1346242</article-id>
<article-id pub-id-type="doi">10.3389/fmolb.2024.1346242</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Molecular Biosciences</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Deep learning-based identification of esophageal cancer subtypes through analysis of high-resolution histopathology images</article-title>
<alt-title alt-title-type="left-running-head">Aalam et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fmolb.2024.1346242">10.3389/fmolb.2024.1346242</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Aalam</surname>
<given-names>Syed Wajid</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2590935/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ahanger</surname>
<given-names>Abdul Basit</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2608634/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Masoodi</surname>
<given-names>Tariq A.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1725510/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bhat</surname>
<given-names>Ajaz A.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/537745/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Akil</surname>
<given-names>Ammira S. Al-Shabeeb</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/636492/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Khan</surname>
<given-names>Meraj Alam</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Assad</surname>
<given-names>Assif</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Macha</surname>
<given-names>Muzafar A.</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/954838/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Bhat</surname>
<given-names>Muzafar Rasool</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2608117/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Computer Science</institution>, <institution>Islamic University of Science and Technology</institution>, <addr-line>Awantipora</addr-line>, <country>India</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Human Immunology Department</institution>, <institution>Research Branch</institution>, <institution>Sidra Medicine</institution>, <addr-line>Doha</addr-line>, <country>Qatar</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Human Genetics-Precision Medicine in Diabetes</institution>, <institution>Obesity and Cancer Program</institution>, <institution>Sidra Medicine</institution>, <addr-line>Doha</addr-line>, <country>Qatar</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>DigiBiomics Inc</institution>, <addr-line>Mississauga</addr-line>, <addr-line>ON</addr-line>, <country>Canada</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Department of Computer Science and Engineering, Islamic University of Science and Technology</institution>, <addr-line>Awantipora</addr-line>, <country>India</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>Watson-Crick Centre for Molecular Medicine</institution>, <institution>Islamic University of Science and Technology</institution>, <addr-line>Awantipora</addr-line>, <country>India</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/908478/overview">Xin Zhang</ext-link>, Jiangmen Central Hospital, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/711875/overview">Nguyen Quoc Khanh Le</ext-link>, Taipei Medical University, Taiwan</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1605426/overview">Shigao Huang</ext-link>, Air Force Medical University, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Muzafar Rasool Bhat, <email>Muzafar.rasool@islamicuniversity.edu.in</email>; Muzafar A. Macha, <email>muzafar.macha@iust.ac.in</email>, <email>muzafar.aiiims@gmail.com</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>19</day>
<month>03</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>11</volume>
<elocation-id>1346242</elocation-id>
<history>
<date date-type="received">
<day>29</day>
<month>11</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>23</day>
<month>02</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Aalam, Ahanger, Masoodi, Bhat, Akil, Khan, Assad, Macha and Bhat.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Aalam, Ahanger, Masoodi, Bhat, Akil, Khan, Assad, Macha and Bhat</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Esophageal cancer (EC) remains a significant health challenge globally, with increasing incidence and high mortality rates. Despite advances in treatment, there remains a need for improved diagnostic methods and understanding of disease progression. This study addresses the significant challenges in the automatic classification of EC, particularly in distinguishing its primary subtypes: adenocarcinoma and squamous cell carcinoma, using histopathology images. Traditional histopathological diagnosis, while being the gold standard, is subject to subjectivity and human error and imposes a substantial burden on pathologists. This study proposes a binary class classification system for detecting EC subtypes in response to these challenges. The system leverages deep learning techniques and tissue-level labels for enhanced accuracy. We utilized 59 high-resolution histopathological images from The Cancer Genome Atlas (TCGA) Esophageal Carcinoma dataset (TCGA-ESCA). These images were preprocessed, segmented into patches, and analyzed using a pre-trained ResNet101 model for feature extraction. For classification, we employed five machine learning classifiers: Support Vector Classifier (SVC), Logistic Regression (LR), Decision Tree (DT), AdaBoost (AD), Random Forest (RF), and a Feed-Forward Neural Network (FFNN). The classifiers were evaluated based on their prediction accuracy on the test dataset, yielding results of 0.88 (SVC and LR), 0.64 (DT and AD), 0.82 (RF), and 0.94 (FFNN). Notably, the FFNN classifier achieved the highest Area Under the Curve (AUC) score of 0.92, indicating its superior performance, followed closely by SVC and LR, with a score of 0.87. This suggested approach holds promising potential as a decision-support tool for pathologists, particularly in regions with limited resources and expertise. The timely and precise detection of EC subtypes through this system can substantially enhance the likelihood of successful treatment, ultimately leading to reduced mortality rates in patients with this aggressive cancer.</p>
</abstract>
<kwd-group>
<kwd>histopathology</kwd>
<kwd>deep learning</kwd>
<kwd>machine learning</kwd>
<kwd>transfer learning</kwd>
<kwd>image processing</kwd>
<kwd>whole slide image</kwd>
<kwd>patching</kwd>
<kwd>normalization</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Molecular Diagnostics and Therapeutics</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Esophageal cancer (EC), which has seen a concerning rise in prevalence over the past 4&#xa0;decades (<xref ref-type="bibr" rid="B38">Napier et al., 2014</xref>), now ranks as the eighth most common cancer and the sixth leading cause of cancer-related mortality worldwide (<xref ref-type="bibr" rid="B40">Pakzad et al., 2016</xref>). This aggressive disease presents a formidable challenge, with 5-year survival rates between 15% and 25% (<xref ref-type="bibr" rid="B43">Pennathur et al., 2013</xref>). In 2020 alone, approximately 600,000 new EC cases were reported, tragically resulting in an estimated 540,000 fatalities (<xref ref-type="bibr" rid="B53">Sung et al., 2021</xref>). The origins of this malignancy typically lie in the mucosa, the innermost layer of the esophagus, and from there, it can infiltrate various vital organs, including the stomach, liver, lungs, chest, blood vessels, and lymph nodes. EC comprises two primary subtypes: Esophageal Squamous Cell Carcinoma (SCC) and Adenocarcinoma (ADC), along with a handful of relatively uncommon small-cell carcinomas like melanoma, sarcoma and lymphoma (<xref ref-type="bibr" rid="B1">Abbas and Krasna, 2017</xref>; <xref ref-type="bibr" rid="B61">Yang et al., 2020</xref>).</p>
<p>In medical diagnostics, histopathological image analysis is the gold standard for cancer diagnosis (<xref ref-type="bibr" rid="B16">Gurcan et al., 2009</xref>; <xref ref-type="bibr" rid="B54">Tomaszewski, 2021</xref>). Histopathological images provide a comprehensive view of diseases, capturing many cytological features that furnish detailed diagnostic insights. These features encompass heightened mitotic activity, cellular enlargement, nuclear hyperchromasia, irregular nuclear chromatin distribution, prominent and sizable nucleoli, cellular and nuclear pleomorphism, increased cellularity, abnormalities in nuclear membranes, cellular discohesiveness, and the presence of tumor necrosis in the background, also known as tumor diathesis. Unlike mammography or CT scans, these cytological characteristics are not easily discernible through other imaging techniques (<xref ref-type="bibr" rid="B3">Al-Abbadi, 2011</xref>). Nevertheless, conventional methods employed to analyze histopathology whole-slide images (WSI) have limitations, notably in time consumption and observer variability. Traditionally, pathologists scrutinize tissue samples under a microscope, having stained them with Haematoxylin and Eosin (H&#x26;E) to enhance tissue organ contrast (<xref ref-type="bibr" rid="B20">He et al., 2012</xref>). However, this labour-intensive visual inspection and subjective interpretive process require pathologists to examine multiple regions of interest within each slide.</p>
<p>Furthermore, the inherent subjectivity in visual interpretation can introduce variations among different observers, leading to inconsistent diagnoses and assessments (<xref ref-type="bibr" rid="B4">Allison et al., 2014</xref>). Hence, a compelling need exists for more efficient and objective approaches to WSI analysis, such as advanced digital pathology techniques that leverage image analysis algorithms, artificial intelligence, and machine learning. These cutting-edge methods aim to automate and streamline the analysis process, diminishing the reliance on manual examination and enhancing efficiency, consistency, and accuracy in evaluating histopathology WSI.</p>
<p>Artificial intelligence (AI) and deep learning (DL) diagnostic systems are becoming increasingly popular, opening up new possibilities in image analysis (<xref ref-type="bibr" rid="B15">Guo et al., 2023</xref>; <xref ref-type="bibr" rid="B36">Muller et al., 2023</xref>; <xref ref-type="bibr" rid="B58">Wang et al., 2023</xref>; <xref ref-type="bibr" rid="B60">Xiao et al., 2023</xref>). By harnessing shape and texture attributes alongside higher-order spatial features that capture intricate pixel-level relationships, these systems elevate images into high-dimensional features, vastly enhancing their capability for detection and classification (<xref ref-type="bibr" rid="B29">Kumar et al., 2012</xref>). While feature extraction-based classification systems, which rely on handcrafted features to characterize cancer subtypes, have seen advancements, researchers increasingly recognize the potency of deep neural networks (DNN) for automatic feature extraction and comprehensive visual analysis (<xref ref-type="bibr" rid="B27">Kermany et al., 2018</xref>; <xref ref-type="bibr" rid="B49">Shimizu and Nakayama, 2020</xref>; <xref ref-type="bibr" rid="B64">Zhou et al., 2020</xref>). Unlike traditional manual approaches, deep learning&#x2019;s automatic feature extraction through multiple non-linear transformation layers empowers it to capture a broad spectrum of generalizable and high-level features, particularly suited for intricate tasks like medical image analysis. Remarkably, both DL and machine learning (ML) have been deployed in intriguing ways for the diagnosis, prognosis prediction (<xref ref-type="bibr" rid="B55">Tran et al., 2021</xref>), and classification of various cancer types, utilizing diverse imaging modalities such as histopathology, CT scans, and MRI imaging. Their ability to handle vast medical data and discern complex patterns promises to revolutionize cancer diagnosis and treatment. In the context of EC patients, correct staging, treatment planning, and prognostication are pivotal for improving patient outcomes and survival rates (<xref ref-type="bibr" rid="B22">Huang et al., 2022</xref>). Unfortunately, EC is frequently diagnosed at advanced stages, owing to its non-specific early symptoms and the challenge of accessing the esophagus, resulting in a bleak prognosis. Thus, the importance of early detection cannot be overstated, as it holds the key to timely interventions, exploration of a broader range of treatment options, and, ultimately, better long-term survival for patients.</p>
<p>A recent investigation (<xref ref-type="bibr" rid="B57">Wagner and Cosgrove, 2023</xref>) utilized ResNet-18 for endometrial subtype classification, employing Tissue level annotation of WSIs from the (TCGA-UCEC) dataset. This study achieved the best AUC of 0.82 in predicting the subtypes of cancer. In another research (<xref ref-type="bibr" rid="B63">Zhao et al., 2023</xref>), a DL model based on ResNet50, utilizing 523 annotated whole-slide images, demonstrated the capability to classify invasive non-mucinous lung adenocarcinoma subtypes with an AUC of 0.80. A study has employed transfer learning to extract features, subsequently utilizing various machine learning models for classification, achieving an accuracy of 0.93 (<xref ref-type="bibr" rid="B30">Kumar A and Mubarak, 2022</xref>). Another study presents a two-stage deep transfer learning method for subclass classification in histopathology images, overcoming limitations in traditional patch-based approaches. While employing patch-based classification, the results are aggregated for slide-level classification. The study attains automatic classification of epithelial ovarian carcinoma WSIs with an accuracy of 0.87 (<xref ref-type="bibr" rid="B59">Wang et al., 2020</xref>).</p>
<p>Contemporary studies on esophageal cancer (EC) subtype classification predominantly rely on patch-level annotations, introducing different challenges. The reliance on such annotations has been associated with inter-observer variability and limitations in capturing the comprehensive spatial and morphological distinctions inherent in esophageal cancer tissues (<xref ref-type="bibr" rid="B41">Paul and Mukherjee, 2015</xref>). The imperative for direct pathologist involvement in the annotation process not only imposes heightened time and resource demands but also intensifies the potential for divergent annotation practices. The repeated emphasis on direct pathologist involvement extends the temporal and resource investment and underscores the susceptibility to variations in annotation practices. These variations further challenge the integration and comparability of results across diverse research studies, hindering the establishment of a cohesive and standardized understanding of EC subtypes (<xref ref-type="bibr" rid="B11">Evans et al., 2023</xref>).</p>
<p>Addressing this gap, we aimed to develop an advanced DL-based automated diagnostic system, leveraging state-of-the-art deep learning techniques for feature engineering and machine learning, to accurately classify different subtypes of esophageal cancer using H&#x26;E images of the esophagus. While adhering to fundamental predictive modelling procedures, we have introduced an innovative approach by incorporating a median-based technique to effectively address the inherent variability in the number of tumor tiles across Whole Slide Images (WSIs) and demonstrate resilience to outliers, enhancing the stability and reliability of our model. We trained our model on a dataset comprising 42 high-resolution WSI and subsequently validated it using 17 additional images.</p>
</sec>
<sec sec-type="methods" id="s2">
<title>Methodology</title>
<sec id="s2-1">
<title>Data collection</title>
<p>The Cancer Genome Atlas Esophageal Carcinoma Collection (TCGA-ESCA) cohort comprises diagnostic and tissue slides for 182 subjects. Diagnostic slides, which provide detailed information about tissue phenotypic heterogeneity (<xref ref-type="bibr" rid="B9">Chen et al., 2022</xref>), were exclusively focused upon due to their significance in histologic analysis. This study did not consider tissue slides, often used for genomic analysis (<xref ref-type="bibr" rid="B17">Gutman et al., 2013</xref>). As such, only 156 subjects with diagnostics slides available in TCGA-ESCA were selected, as shown in <xref ref-type="fig" rid="F1">Figure 1</xref>. Following rigorous filtering criteria by excluding the WSIs with poor visual quality, extensive blurring, abnormal staining, and ink marks. Finally, 59 high-quality diagnostic WSIs were obtained from the TCGA-ESCA cohort. This curated dataset, consisting of H&#x26;E stained WSIs categorized into SCC and ADC, ensured consistency and quality for subsequent research and analysis. Significantly, the TCGA cohort&#x2019;s open accessibility without authentication requirements greatly facilitated our investigative activities.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Exclusion criteria: The complete data selection process, incorporating exclusion criteria and showcasing the data distribution in train and test sets.</p>
</caption>
<graphic xlink:href="fmolb-11-1346242-g001.tif"/>
</fig>
</sec>
<sec id="s2-2">
<title>Preprocessing of histopathology images</title>
<p>Training DNN and ML models directly on entire gigapixel H&#x26;E WSI presents substantial computational challenges with current standard computing resources. We adopted strategies such as tiling and down-sampling (<xref ref-type="bibr" rid="B52">Srinidhi et al., 2021</xref>). High-resolution images are broken down into smaller, more manageable patches. Within these WSIs, there were both informative and non-informative regions. The Canny edge detection algorithm was employed for its ability to differentiate and outline tissue boundaries, leveraging its capability to identify noisy edges effectively. The method offers criteria of strong edge detection, precise localization, and single response, making it a suitable choice for our purpose (<xref ref-type="bibr" rid="B8">Canny, 1986</xref>). Subsequently, masks were generated to demarcate the boundary between the background and the tissue (foreground) using a graph-based segmentation method. The method was chosen due to its adeptness in handling pixel intensity variations, ensuring resilience against challenges posed by staining and tissue characteristic variations, and fostering consistent and reliable boundary demarcation (<xref ref-type="bibr" rid="B12">Felzenszwalb and Huttenlocher, 2004</xref>). These mask images were then organized into a grid of tiles based on specified dimensions to form patches. Patches comprising background information were discarded, while those primarily containing tissue (foreground) information were retained for further analysis. Various techniques, including random sampling, Otsu, and adaptive thresholding, can be used to eliminate background tiles (<xref ref-type="bibr" rid="B39">Otsu, 1979</xref>; <xref ref-type="bibr" rid="B26">Kalton, 2011</xref>; <xref ref-type="bibr" rid="B46">Roy et al., 2014</xref>). We utilized the Otsu method, a widely used thresholding algorithm (<xref ref-type="bibr" rid="B14">Goh et al., 2018</xref>; <xref ref-type="bibr" rid="B23">Huang et al., 2021</xref>; <xref ref-type="bibr" rid="B50">Singh et al., 2021</xref>), to discard unwanted background images from the generated patch set due to its thresholding capability for varying image characteristics, allowing for optimal discrimination between tissue and background in an unsupervised manner. Tiles containing less than 10% tissue were excluded and classified as background by setting the threshold to 0.1. Histology images were preprocessed using PyHIST (<xref ref-type="bibr" rid="B37">Mu&#xf1;oz-Aguirre et al., 2020</xref>), a TIFF/SVS file format segmentation tool. Nonoverlapping patches measuring 512 &#xd7; 512 pixels were extracted from each WSI, and H&#x26;E images with a magnification greater than &#xd7;20 were only considered for this study.</p>
</sec>
<sec id="s2-3">
<title>Data normalization</title>
<p>Histopathology images exhibit inherent color variations stemming from differences in staining concentration, varied equipment usage, and occasional inconsistencies in tissue sectioning. These color disparities within WSI introduce increased variability into the training data, potentially impacting the model&#x2019;s efficacy during training. Various methods exist for image color normalization, including the Reinhard Algorithm (RA) (<xref ref-type="bibr" rid="B45">Reinhard et al., 2001</xref>), Histogram Specification (<xref ref-type="bibr" rid="B24">Hussain et al., 2018</xref>), and Structure-Preserving Color Normalization (<xref ref-type="bibr" rid="B56">Vahadane et al., 2016</xref>), with RA notably demonstrating superior performance in DL models. The RA method computes a chosen reference image&#x2019;s mean and standard deviation. During the color correction process, the color characteristics of one image are aligned with those of another. Careful consideration was given to the reference image selection, as normalization outcomes can be influenced if the chosen reference image exhibits darker colors (<xref ref-type="bibr" rid="B47">Roy et al., 2021</xref>). The application of Reinhard color normalization to our dataset is based on established practices in the literature (<xref ref-type="bibr" rid="B31">Lakshmanan et al., 2019</xref>; <xref ref-type="bibr" rid="B44">Qu et al., 2021</xref>), demonstrating its superior performance compared to other techniques. This normalization method effectively mitigated the complexity of the extracted features, thereby enhancing the overall quality of our analysis.</p>
</sec>
<sec id="s2-4">
<title>Model training and evaluation</title>
<p>We employed a two-step approach for classification, as outlined in <xref ref-type="fig" rid="F2">Figure 2</xref>. In the initial step, we performed feature extraction on all the tiles within the WSI using a pre-trained CNN (ResNet101) (<xref ref-type="bibr" rid="B19">He et al., 2016</xref>). This process generated a 2048-dimensional feature vector for each tile in the WSI. Consequently, we constructed a feature matrix of size N x 2048 for each subject, where N represents the number of tumor tiles within the WSI. This variable significantly differs across WSIs. The variance in the number of patches generated during the tiling process impacts the model&#x2019;s prediction efficiency. To address this, we calculated the median of the stacked feature vectors from all the WSI tiles along the vertical axis, thereby creating a single feature vector with a size of 2048. These feature vectors were subsequently input into various classification algorithms to predict the EC subtypes. The experimentation was conducted on an NVIDIA Tesla V100 GPU with 32&#xa0;GB memory, boasting 15,360 CUDA Cores and a processing power of 2.976 TFLOPS. On average, normalization per tile required 0.25&#xa0;s, and Feature extraction exhibited an average time of 0.03&#xa0;s per tile. These metrics underscore the computational efficiency of the algorithms on the specified high-performance GPU architecture. We employed performance metrics such as Accuracy, AUC, Recall, F1-score, and Precision to assess the proposed model&#x2019;s efficacy in classifying EC subtypes. Accuracy provides a comprehensive assessment of correctness in both classes, particularly effective in balanced class distributions. AUC evaluates the model&#x2019;s discriminatory ability across various thresholds. Recall quantifies the model&#x2019;s efficacy in identifying positive instances out of total positive instances, which is crucial in scenarios prioritizing sensitivity. Precision measures the accuracy of actual positive predictions, offering insights into the model&#x2019;s specificity. Lastly, the F1 score strikes a balance between precision and recall, furnishing the evaluation of overall model performance in classification tasks.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Experimentation pipeline: The process involves taking each color-normalized tile and passing it through a pre-trained model to obtain a 2048-dimensional feature vector. These feature vectors from all tiles belonging to the same patient are then combined into a single feature vector of size 2048 and used as input for various machine-learning models to make predictions about esophageal cancer (EC) subtypes.</p>
</caption>
<graphic xlink:href="fmolb-11-1346242-g002.tif"/>
</fig>
<p>During the model training and evaluation, we utilized a Feed-Forward Neural Network (FFNN) configured with only two layers. The first layer, with a size of 2048, was designed to accept the input feature vector, preserving compatibility with the size of the extracted features obtained during the feature extraction process using pretrained models. The second layer was employed for classification, strategically reintegrating the last layer of the pretrained model, which was initially removed during the feature extraction process. This approach allows for an efficient utilization of the deep hierarchical representations learned by the model. The choice of two dense layers with Rectified Linear Unit (ReLU) activation function (<xref ref-type="bibr" rid="B2">Agarap, 2018</xref>), a learning rate of 10<sup>&#x2013;3</sup> over 800 epochs, and the Adam as optimizer (<xref ref-type="bibr" rid="B28">Kingma and Ba, 2015</xref>) was opted due to the ability of DL to complex information through multiple layers (<xref ref-type="bibr" rid="B6">Bebis and Georgiopoulos, 1994</xref>). In addition to FFNN, we utilized various machine learning classifiers for comparative analysis following the previous studies (<xref ref-type="bibr" rid="B51">Singh et al., 2023</xref>; <xref ref-type="bibr" rid="B48">Saxe and Berlin, 2015</xref>). AdaBoost, an ensemble learning method, was chosen for its ability to combine weak classifiers, such as decision trees, to form a robust classifier (<xref ref-type="bibr" rid="B13">Freund and Schapire, 1997</xref>). Decision Tree, a non-parametric algorithm, was also employed for its tree-like structure and adaptability to handle noise and missing data (<xref ref-type="bibr" rid="B10">Cycles, 1989</xref>). Random Forest, another ensemble method was selected to enhance classification performance by combining multiple decision trees through bootstrap sampling and feature subsetting (<xref ref-type="bibr" rid="B7">BREIMAN, 2021</xref>). Logistic Regression, a binary classification algorithm, served as a widely used and interpretable model, estimating probabilities for esophageal carcinoma subtypes based on input feature vectors (<xref ref-type="bibr" rid="B42">Peng et al., 2002</xref>). Finally, the Support Vector Classifier (SVC), known for its robustness and versatility in handling both linear and non-linearly separable data, was applied for effective classification between esophageal cancer subtypes (<xref ref-type="bibr" rid="B5">Busuttil, 2003</xref>). Each model brought a unique strategy to the analysis, contributing to a comparative analysis of our proposed approach, which provides valuable insights into the suitability of various machine learning algorithms.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec id="s3-1">
<title>High-resolution histopathological dataset of ADC and SCC</title>
<p>Following a meticulous qualitative analysis that excluded small-sized images and those with significant blurring artefacts and ink marks, we systematically organized a dataset comprising 59 high-resolution histopathological H&#x26;E stained images of ADC and ESCC. This dataset was then divided into distinct training and testing sets, maintaining a balanced 70:30 ratio. After extracting WSI tiles and carefully selecting tumor tiles, the training and testing sets for EC comprised 191,798 and 48,665 tiles, respectively. The distribution of these tiles is visually depicted in <xref ref-type="fig" rid="F3">Figure 3</xref> for both the train and test sets. Moreover, the demographic and other characteristics of all patients included in our experimentation are summarized in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Patch Variation and Distribution: This figure visually presents the patch variation after preprocessing, showing the data distribution between training and testing sets. Patch counts range from as high as 6,000 patches per slide to as low as 1,200 patches per slide. The variation is handled by calculating the median of all the features per WSI to form a single feature vector.</p>
</caption>
<graphic xlink:href="fmolb-11-1346242-g003.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Patient characteristics on the 59 cases from TCGA - ESCA cohort.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" colspan="2" align="left">Characteristics</th>
<th colspan="2" align="center">Data set</th>
</tr>
<tr>
<th align="center">ADC</th>
<th align="center">SCC</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="2" align="left">Gender</td>
<td align="left">Male</td>
<td align="center">26</td>
<td align="center">25</td>
</tr>
<tr>
<td align="left">Female</td>
<td align="center">5</td>
<td align="center">3</td>
</tr>
<tr>
<td rowspan="2" align="left">Age</td>
<td align="left">&#x2264;60</td>
<td align="center">9</td>
<td align="center">21</td>
</tr>
<tr>
<td align="left">&#x3e;60</td>
<td align="center">22</td>
<td align="center">7</td>
</tr>
<tr>
<td rowspan="2" align="left">Vital Status</td>
<td align="left">Dead</td>
<td align="center">14</td>
<td align="center">8</td>
</tr>
<tr>
<td align="left">Alive</td>
<td align="center">17</td>
<td align="center">20</td>
</tr>
<tr>
<td rowspan="2" align="left">Alcohol History</td>
<td align="left">Yes</td>
<td align="center">26</td>
<td align="center">19</td>
</tr>
<tr>
<td align="left">No</td>
<td align="center">5</td>
<td align="center">9</td>
</tr>
<tr>
<td rowspan="4" align="left">Location</td>
<td align="left">Lower Third</td>
<td align="center">29</td>
<td align="center">11</td>
</tr>
<tr>
<td align="left">Middle Third</td>
<td align="center">-</td>
<td align="center">12</td>
</tr>
<tr>
<td align="left">Upper third</td>
<td align="center">2</td>
<td align="center">3</td>
</tr>
<tr>
<td align="left">Unspecified Location</td>
<td align="center">-</td>
<td align="center">2</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-2">
<title>Enhancing digital pathology by data-preprocessing</title>
<p>Preprocessing of digital pathology played a crucial role in addressing differences among images, including variations in color, illumination, and imperfections like artefacts or noise (<xref ref-type="fig" rid="F4">Figure 4</xref>). These variations and imperfections can be effectively minimized or corrected by applying preprocessing techniques, ensuring more consistent and reliable image quality across diverse datasets. The advantages of digital pathology still need to be increased to overcome its limitations: WSI requires considerably large storage volumes (since each image can need 2&#x2013;3&#xa0;GB). Moreover, as depicted in <xref ref-type="fig" rid="F5">Figure 5</xref>, these WSIs exhibit undesirable blank backgrounds, which were eliminated during this stage. Despite efforts toward standardization, attaining impeccable color calibration across all samples remains challenging (<xref ref-type="bibr" rid="B34">Lyon et al., 1994</xref>). This challenge drives the adoption and implementation of color normalization techniques, which have led to increased efficiency in our model. <xref ref-type="fig" rid="F6">Figure 6</xref> provides a visual difference before and after color normalization, and the general normalization process is shown in (<xref ref-type="fig" rid="F7">Figure 7</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>WSI Noise and Artefacts: <bold>(A)</bold> an example of noise in WSI (random or unwanted variations in image data), <bold>(B)</bold> an example of artefact in the Whole Slide Image of our dataset. (Artefacts can include staining artefacts, tissue folding or tearing, scanner artefacts, or any other unintended alterations that may occur during slide preparation, scanning, or digitization).</p>
</caption>
<graphic xlink:href="fmolb-11-1346242-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Preprocessing Steps: This figure outlines the preprocessing steps using PyHIST. Panel <bold>(A)</bold> displays an H&#x26;E WSI from TCGA, <bold>(B)</bold> illustrates a mask generated during preprocessing, <bold>(C)</bold> presents a Mask Grid created for patching WSI, and <bold>(D)</bold> shows a zoomed view of tiles selected from the grid.</p>
</caption>
<graphic xlink:href="fmolb-11-1346242-g005.tif"/>
</fig>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Tile Transformation: The figure exhibits the normalization process for ADC and SCC tiles. Panel <bold>(A)</bold> displays an original tile of ADC WSI after patching, <bold>(B)</bold> shows the ADC tile after normalization, <bold>(C)</bold> presents an original tile of SCC WSI after patching, and <bold>(D)</bold> illustrates the SCC tile after normalization.</p>
</caption>
<graphic xlink:href="fmolb-11-1346242-g006.tif"/>
</fig>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Color Normalization Flowchart: The figure provides a flow chart representing the color normalization process for images with different color variations. This process enhances the consistency of color across images, ensuring uniformity in the dataset.</p>
</caption>
<graphic xlink:href="fmolb-11-1346242-g007.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>Performance evaluation and comparative analysis</title>
<p>We utilized confusion matrices, as illustrated in <xref ref-type="fig" rid="F8">Figure 8</xref>, to assess the overall accuracy of our classification models. Calculating recall, precision, and F1 score from the confusion matrix values provided a comprehensive evaluation of model performance for both SCC and ADC classes. This approach aligns with established practices, reflecting evaluation matrices utilized in previous studies (<xref ref-type="bibr" rid="B33">Le and Ou, 2016</xref>; <xref ref-type="bibr" rid="B32">Le et al., 2017</xref>). The FFNN stands out as the top-performing model, achieving an impressive classification rate of 86% for SCC patients and 100% for ADC patients in the validation set. Our feature-based classification method successfully demonstrated the use of machine learning in accurate classification of esophageal squamous cell carcinoma and adenocarcinoma. The SVC and LR models also demonstrated strong performance, achieving prediction accuracies of 86% for SCC patients and 90% for ADC patients. The RFC provided acceptable predictions of 71% for SCC patients and 90% for ADC patients. AdaBoost achieved a perfect prediction rate (100%) for SCC patients but presented the lowest performance of 40% only for ADC patients. The Decision Tree model also exhibited the least effectiveness, with correct classification rates of 85% for SCC patients and 50% for ADC patients.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Confusion matrices illustrating the performance of five ML classifiers [represented as <bold>(A, B, D, E, F)</bold>]. <bold>(C)</bold> shows the confusion matrix of the FFNN classifier with the best values for classifying esophageal cancer subtypes. The matrices display the true positive (TP), true negative (TN), false positive (FP), and false negative (FN) values for each model, offering insights into their predictive capabilities and error distributions.</p>
</caption>
<graphic xlink:href="fmolb-11-1346242-g008.tif"/>
</fig>
<p>Due to the large size, WSIs were divided into smaller patches for analysis, and image features were extracted at a &#xd7;20 magnification level. The results from different ML classification methods, utilizing identical methodology and data distribution, were compared while maintaining the training and test ratio. These classifiers use the feature vectors of size N x 2048 as input, extracted using ResNet101. The evaluation considered essential performance metrics such as precision, recall, F1-score, accuracy, and AUC. The results in <xref ref-type="table" rid="T2">Table 2</xref> demonstrated that the feed-forward neural network (FFNN) model outperformed other ML models with an accuracy of 94.11% and an AUC score of 92%.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Results of WSI classification.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="center">Feature extraction</th>
<th rowspan="2" align="center">Algorithms</th>
<th colspan="2" align="center">Precision</th>
<th colspan="2" align="center">Recall</th>
<th colspan="2" align="center">F1-score</th>
<th rowspan="2" align="center">ACC</th>
<th rowspan="2" align="center">AUC</th>
</tr>
<tr>
<th align="center">SCC</th>
<th align="center">ADC</th>
<th align="center">SCC</th>
<th align="center">ADC</th>
<th align="center">SCC</th>
<th align="center">ADC</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="6" align="center">Resnet101</td>
<td align="center">SVC</td>
<td align="center">0.86</td>
<td align="center">0.9</td>
<td align="center">0.86</td>
<td align="center">0.9</td>
<td align="center">0.86</td>
<td align="center">0.9</td>
<td align="center">0.88</td>
<td align="center">0.87</td>
</tr>
<tr>
<td align="center">LR</td>
<td align="center">0.86</td>
<td align="center">0.9</td>
<td align="center">0.86</td>
<td align="center">0.9</td>
<td align="center">0.86</td>
<td align="center">0.9</td>
<td align="center">0.88</td>
<td align="center">0.87</td>
</tr>
<tr>
<td align="center">DT</td>
<td align="center">0.55</td>
<td align="center">0.83</td>
<td align="center">0.86</td>
<td align="center">0.5</td>
<td align="center">0.67</td>
<td align="center">0.62</td>
<td align="center">0.64</td>
<td align="center">0.68</td>
</tr>
<tr>
<td align="center">AdaBoost</td>
<td align="center">0.54</td>
<td align="center">1</td>
<td align="center">1</td>
<td align="center">0.4</td>
<td align="center">0.7</td>
<td align="center">0.57</td>
<td align="center">0.64</td>
<td align="center">0.7</td>
</tr>
<tr>
<td align="center">RFC</td>
<td align="center">0.6</td>
<td align="center">0.86</td>
<td align="center">0.86</td>
<td align="center">0.6</td>
<td align="center">0.71</td>
<td align="center">0.71</td>
<td align="center">0.82</td>
<td align="center">0.72</td>
</tr>
<tr>
<td align="center">FFNN</td>
<td align="center">1</td>
<td align="center">0.91</td>
<td align="center">0.86</td>
<td align="center">1</td>
<td align="center">0.92</td>
<td align="center">0.95</td>
<td align="center">
<bold>0.94</bold>
</td>
<td align="center">
<bold>0.92</bold>
</td>
</tr>
<tr>
<td rowspan="6" align="center">InceptionV3</td>
<td align="center">SVC</td>
<td align="center">0.75</td>
<td align="center">0.89</td>
<td align="center">0.86</td>
<td align="center">0.80</td>
<td align="center">0.80</td>
<td align="center">0.84</td>
<td align="center">0.82</td>
<td align="center">0.82</td>
</tr>
<tr>
<td align="center">LR</td>
<td align="center">0.70</td>
<td align="center">1.0</td>
<td align="center">1.0</td>
<td align="center">0.70</td>
<td align="center">0.82</td>
<td align="center">0.82</td>
<td align="center">0.82</td>
<td align="center">0.85</td>
</tr>
<tr>
<td align="center">DT</td>
<td align="center">0.67</td>
<td align="center">0.73</td>
<td align="center">0.57</td>
<td align="center">0.80</td>
<td align="center">0.62</td>
<td align="center">0.76</td>
<td align="center">0.71</td>
<td align="center">0.68</td>
</tr>
<tr>
<td align="center">AdaBoost</td>
<td align="center">0.71</td>
<td align="center">0.80</td>
<td align="center">0.71</td>
<td align="center">0.80</td>
<td align="center">0.71</td>
<td align="center">0.80</td>
<td align="center">0.76</td>
<td align="center">0.75</td>
</tr>
<tr>
<td align="center">RFC</td>
<td align="center">0.67</td>
<td align="center">0.73</td>
<td align="center">0.57</td>
<td align="center">0.80</td>
<td align="center">0.62</td>
<td align="center">0.76</td>
<td align="center">0.71</td>
<td align="center">0.68</td>
</tr>
<tr>
<td align="center">FFNN</td>
<td align="center">0.67</td>
<td align="center">0.88</td>
<td align="center">0.86</td>
<td align="center">0.70</td>
<td align="center">0.75</td>
<td align="center">0.78</td>
<td align="center">0.76</td>
<td align="center">0.77</td>
</tr>
<tr>
<td rowspan="6" align="center">Resnet50</td>
<td align="center">SVC</td>
<td align="center">0.80</td>
<td align="center">0.75</td>
<td align="center">0.57</td>
<td align="center">0.90</td>
<td align="center">0.67</td>
<td align="center">0.82</td>
<td align="center">0.76</td>
<td align="center">0.73</td>
</tr>
<tr>
<td align="center">LR</td>
<td align="center">0.62</td>
<td align="center">0.78</td>
<td align="center">0.71</td>
<td align="center">0.70</td>
<td align="center">0.67</td>
<td align="center">0.74</td>
<td align="center">0.71</td>
<td align="center">0.70</td>
</tr>
<tr>
<td align="center">DT</td>
<td align="center">0.57</td>
<td align="center">0.70</td>
<td align="center">0.57</td>
<td align="center">0.70</td>
<td align="center">0.57</td>
<td align="center">0.70</td>
<td align="center">0.65</td>
<td align="center">0.63</td>
</tr>
<tr>
<td align="center">AdaBoost</td>
<td align="center">0.67</td>
<td align="center">0.88</td>
<td align="center">0.86</td>
<td align="center">0.70</td>
<td align="center">0.75</td>
<td align="center">0.78</td>
<td align="center">0.76</td>
<td align="center">0.77</td>
</tr>
<tr>
<td align="center">RFC</td>
<td align="center">0.67</td>
<td align="center">0.73</td>
<td align="center">0.57</td>
<td align="center">0.80</td>
<td align="center">0.62</td>
<td align="center">0.76</td>
<td align="center">0.71</td>
<td align="center">0.68</td>
</tr>
<tr>
<td align="center">FFNN</td>
<td align="center">0.75</td>
<td align="center">0.89</td>
<td align="center">0.86</td>
<td align="center">0.80</td>
<td align="center">0.80</td>
<td align="center">0.84</td>
<td align="center">0.82</td>
<td align="center">0.82</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Similarly, the SVC and LR models displayed comparable performance, achieving an accuracy of 88% and an AUC of 0.87, surpassing the performance of the remaining models. Notably, the DT and AdaBoost models exhibited the lowest accuracy at 64%. We observed that while FFNN outperforms all other algorithms in terms of accuracy, the imbalance in the dataset was better handled by SVC and LR, where the difference in recall between SCC and ADC is the least, showing that both classes have a similar number of misclassifications and accurate classifications. These metrics offer a holistic assessment of the model&#x2019;s performance, highlighting its strengths and weaknesses. Such insights are invaluable for refining and advancing classification models in subsequent studies. Additionally, hyperparameters were carefully tuned using a grid search approach in our model training process, except for FFNN. They were optimized for each model to achieve the best performance on the test set (<xref ref-type="table" rid="T3">Table 3</xref>).</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Hyperparameters settings for selected models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">Hyperparameter</th>
<th align="center">Search space</th>
<th align="center">Best value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="4" align="center">AdaBoost</td>
<td align="center">max_depth</td>
<td align="center">[2, 11]</td>
<td align="center">6</td>
</tr>
<tr>
<td align="center">min_samples_leaf</td>
<td align="center">[5, 10]</td>
<td align="center">10</td>
</tr>
<tr>
<td align="center">learning_rate</td>
<td align="center">[0.01, 0.1]</td>
<td align="center">0.1</td>
</tr>
<tr>
<td align="center">n_estimators</td>
<td align="center">[10, 50, 250, 1,000]</td>
<td align="center">50</td>
</tr>
<tr>
<td rowspan="3" align="center">Decision Tree (DT)</td>
<td align="center">max_features</td>
<td align="center">[&#x2018;auto&#x2019;, &#x2018;sqrt&#x2019;, &#x2018;log2&#x27;]</td>
<td align="center">auto</td>
</tr>
<tr>
<td align="center">ccp_alpha</td>
<td align="center">[0.1, 0.01, 0.001]</td>
<td align="center">0.01</td>
</tr>
<tr>
<td align="center">criterion</td>
<td align="center">[&#x2018;gini&#x2019;, &#x2018;entropy&#x27;]</td>
<td align="center">gini</td>
</tr>
<tr>
<td rowspan="2" align="center">Random Forest (RF)</td>
<td align="center">max_depth</td>
<td align="center">[10, 15]</td>
<td align="center">11</td>
</tr>
<tr>
<td align="center">max_features</td>
<td align="center">[0, 14]</td>
<td align="center">4</td>
</tr>
<tr>
<td rowspan="3" align="center">Logistic Regression (LR)</td>
<td align="center">C</td>
<td align="center">[0.1, 1, 10, 100]</td>
<td align="center">0.1</td>
</tr>
<tr>
<td align="center">penalty</td>
<td align="center">[&#x2018;l1&#x27;, &#x2018;l2&#x27;]</td>
<td align="center">l1</td>
</tr>
<tr>
<td align="center">solver</td>
<td align="center">[&#x2018;newton-cg&#x2019;, &#x2018;lbfgs&#x2019;, &#x2018;liblinear&#x27;]</td>
<td align="center">liblinear</td>
</tr>
<tr>
<td rowspan="3" align="center">Support Vector Classifier (SVC)</td>
<td align="center">C</td>
<td align="center">[0.1, 1, 10, 100]</td>
<td align="center">0.1</td>
</tr>
<tr>
<td align="center">kernel</td>
<td align="center">[&#x2018;rbf&#x2019;, &#x2018;linear&#x2019;]</td>
<td align="center">linear</td>
</tr>
<tr>
<td align="center">gamma</td>
<td align="center">[&#x2018;scale&#x2019;, &#x2018;auto&#x27;]</td>
<td align="center">scale</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>For a comparative analysis (refer to <xref ref-type="table" rid="T2">Table 2</xref>) involving transfer learning, we employed pre-trained InceptionV3 and ResNet50 models for feature extraction. The results showed that our proposed architecture outperformed other models, utilizing ResNet101 for feature extraction. The accuracy of our proposed model was 0.94, surpassing the best classification accuracy of 0.82 achieved by the other two models, thereby establishing the suitability of ResNet101 for the classification of esophageal cancer into Adenocarcinoma and Squamous Cell Carcinoma from histopathology images.</p>
</sec>
</sec>
<sec id="s4">
<title>Discussion and conclusion</title>
<p>Manual histopathological diagnosis of esophageal cancer subtypes poses challenges, emphasizing the need for a sophisticated and automated classification system. Our study adopts a tissue-level diagnostic approach leveraging deep learning and machine learning techniques to construct a reliable model, aiming to alleviate the limitations associated with manual diagnosis, providing a more efficient and objective solution.</p>
<p>We precisely curated the dataset TCGA-ESCA, ensuring consistency and quality while addressing potential variations in size, color intensities, and equipment usage. The preprocessing phase involved strategic techniques such as tiling, down-sampling, and edge detection to manage computational challenges and enhance the model&#x2019;s efficiency. These methods facilitated the extraction of informative patches from high-resolution whole-slide images (WSI) for further analysis. Moreover, a data normalization technique was adopted, where inherent color variations in histopathology images are addressed using the Reinhard Algorithm. This normalization process proves crucial in reducing variability and enhancing the model&#x2019;s overall efficacy during training.</p>
<p>Our study emphasizes tissue-level classification rather than patch-level analysis. While patch-level annotations (<xref ref-type="bibr" rid="B21">Hou et al., 2016</xref>; <xref ref-type="bibr" rid="B35">Mi et al., 2021</xref>) have gained popularity for cancer sub-type detection in digital pathology, relying solely on them has notable drawbacks. A primary concern is the substantial manual annotation effort required for this approach, involving the careful marking and annotation of individual patches within the WSIs, making the process time-consuming and labour-intensive. However, depending solely on patch-level analysis may result in overlooking crucial contextual information within the slide. By focusing exclusively on isolated patches, there is a risk of missing important features and spatial relationships between regions in the slide. This limitation can lead to inaccurate or incomplete detection, as the analysis may fail to capture the full extent of the disease and its characteristics. Moreover, a patch-level analysis may be susceptible to sampling bias (<xref ref-type="bibr" rid="B18">H&#xe4;gele et al., 2020</xref>), as the selected patches may not adequately represent the entire slide, potentially causing the omission of critical regions of interest crucial for accurate cancer subtype identification.</p>
<p>Furthermore, the challenges of intratumoral heterogeneity pose a significant obstacle for patch-level cancer subtype detection. Cancer subtypes can exhibit spatial variability within a single tumor, with distinct regions displaying different cellular characteristics and molecular profiles. By relying solely on patch-level analysis, there is a risk of obtaining inconsistent or ambiguous results, as the selected patches may not fully capture the heterogeneity present within the tumor. This limitation can impact the reliability and accuracy of the cancer subtype detection, particularly when attempting to classify tumors with diverse intratumoral characteristics. We assessed the method&#x2019;s effectiveness in detecting esophageal subtype carcinoma from H&#x26;E WSIs. We found that ML can accurately classify cancer subtypes in EC from H&#x26;E WSIs. Pathologists, who have a laborious, time-consuming, and easily misinterpreted diagnostic process, could benefit significantly from automated cancer subtype detection by having less work to do.</p>
<p>Recognizing that patch-level cancer subtype detection can be integrated with additional contextual information from WSI, such as slide-level annotations, can help overcome the limitations associated with patch-level analysis. By incorporating a broader perspective and considering the overall tissue architecture and spatial relationships within the slide, the accuracy and reliability of cancer subtype detection can be improved. Further research and development efforts are necessary to address these limitations and refine the performance of patch-level cancer subtype detection methods in the context of a digital pathology-based cancer diagnosis. Addressing data scarcity in tasks linked to histopathology is also crucial to maximizing the effectiveness of deep learning systems. High-quality and massive amounts of disease data with detailed tile annotations will be required to accelerate model building. DL models, are particularly suitable for large-scale data analysis (<xref ref-type="bibr" rid="B25">Jan et al., 2019</xref>), depending on the amount of data provided, making it challenging to apply them to real-world circumstances. Unfortunately, having enough data for DL models in most real-world circumstances is not feasible, especially in medical science (<xref ref-type="bibr" rid="B62">Zewdie et al., 2021</xref>). As an alternative, transfer learning has shown promising results for computer vision problems where only a few training samples are available (refer to <xref ref-type="table" rid="T4">Table 4</xref>). A feature extractor trained on various pathological datasets may produce better outcomes than our cancer sub-type-specific model.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Comparison of studies with proposed architecture.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Study</th>
<th align="center">Organ</th>
<th align="center">Approach</th>
<th align="center">Classifier</th>
<th align="center">Dataset</th>
<th align="center">Patients</th>
<th align="center">Results</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">
<xref ref-type="bibr" rid="B57">Wagner and Cosgrove (2023)</xref>
</td>
<td align="center">Uterus</td>
<td align="center">Image level annotation</td>
<td align="center">CNN</td>
<td align="center">TCGA-UCEC</td>
<td align="center">657</td>
<td align="center">0.82 (AUC)</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B63">Zhao et al. (2023)</xref>
</td>
<td align="center">Lung</td>
<td align="center">pixel-level annotation</td>
<td align="center">CNN</td>
<td align="center">Beijing Chest Hospital</td>
<td align="center">523</td>
<td align="center">0.80 (AUC)</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B30">Kumar A and Mubarak (2022)</xref>
</td>
<td align="center">Esophagus</td>
<td align="center">Image level annotation</td>
<td align="center">SVM</td>
<td align="center">Kvasir dataset</td>
<td align="center">1800</td>
<td align="center">0.93 (ACC)</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B59">Wang et al. (2020)</xref>
</td>
<td align="center">Ovarian Cancer</td>
<td align="center">Patch level annotation</td>
<td align="center">Random Forest</td>
<td align="center">Vancouver General Hospital</td>
<td align="center">305</td>
<td align="center">0.87 (ACC)</td>
</tr>
<tr>
<td align="center">
<bold>Proposed Method</bold>
</td>
<td align="center">
<bold>Esophagus</bold>
</td>
<td align="center">
<bold>Image level annotation</bold>
</td>
<td align="center">
<bold>FFNN</bold>
</td>
<td align="center">
<bold>TCGA-ESCA</bold>
</td>
<td align="center">
<bold>59</bold>
</td>
<td align="center">
<bold>0.94 (ACC)</bold>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Utilizing transfer learning with ResNet101 on histopathological imagery, our study achieved superior performance with a Feed Forward Neural Network, boasting 94% accuracy and 0.92 AUC. Support Vector Classifier and Logistic Regression followed closely with an 88% accuracy, outperforming Random Forest Classifier (RFC) at 82%, while Decision Tree (DT) and AdaBoost lagged with 64% accuracy. This approach was centred on examining H&#x26;E stained WSIs, renowned for their capacity to preserve intricate microscopic tissue properties, thereby providing a robust foundation for detailed cancer tissue analysis. Looking ahead, we propose the inclusion of WSIs from additional databases in future investigations. These datasets should ideally share resolutions and characteristics similar to those used in this study to ensure consistency and reliability in comparative analyses. A thorough assessment of these representations and their parameters could offer insightful perspectives on the accuracy and repeatability of diagnostic algorithms, especially considering the distinctive nature of realistic <italic>versus</italic> pathological imagery domains. To sum up, our research proves that ResNet101-based transfer learning outperforms other methods in analyzing histopathological images and presents new opportunities for improving cancer diagnosis techniques. By utilizing the capabilities of sophisticated neural network architectures, there is considerable potential to increase the precision and speed of cancer detection from histological images. In addition, we recognize the importance of addressing the interpretability of the proposed model and plan to incorporate explainable AI techniques as part of our future research.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/Supplementary material, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>SA: Data curation, Formal Analysis, Investigation, Validation, Writing&#x2013;original draft, Writing&#x2013;review and editing. ABA: Data curation, Formal Analysis, Investigation, Validation, Writing&#x2013;original draft. TM: Resources, Writing&#x2013;review and editing. AB: Writing&#x2013;review and editing. AA-S: Writing&#x2013;review and editing. MK: Writing&#x2013;review and editing. AAs: Conceptualization, Supervision, Writing&#x2013;review and editing, Resources. MM: Conceptualization, Funding acquisition, Supervision, Writing&#x2013;review and editing, Resources. MB: Supervision, Writing&#x2013;original draft, Writing&#x2013;review and editing, Conceptualization, Resources.</p>
</sec>
<sec sec-type="funding-information" id="s7">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This study was funded, in part, by a Research Grant (Grant number: ID No. 2022-16465) from the Indian Council of Medical Research (ICMR) Govt. of India, New Delhi and a Core Research Grant (<ext-link ext-link-type="uri" xlink:href="https://serbonline.in/SERB/ProposalInfoNew">CRG/2021/003805</ext-link>) from Science and Engineering Research Board (SERB), Govt. of India, New Delhi to MM. Promotion of University Research and Scientific Excellence (PURSE) (SR/PURSE/2022/121) grant from the Department of Science and Technology, Govt. of India, New Delhi to the Islamic University of Science and Technology (IUST), Awantipora.</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>Author MK was employed by DigiBiomics Inc.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
<p>The author(s) declared that they were an editorial board member of Frontiers, at the time of submission. This had no impact on the peer review process and the final decision.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abbas</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Krasna</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Overview of esophageal cancer</article-title>. <source>Ann. Cardiothorac. Surg.</source> <volume>6</volume> (<issue>2</issue>), <fpage>131</fpage>&#x2013;<lpage>136</lpage>. <pub-id pub-id-type="doi">10.21037/acs.2017.03.03</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Agarap</surname>
<given-names>A. F.</given-names>
</name>
</person-group> (<year>2018</year>). <source>Deep Learn. using Rectified Linear Units (ReLU)</source> <volume>2</volume> (<issue>1</issue>), <fpage>2</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.48550/arXiv.1803.08375</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Al-Abbadi</surname>
<given-names>M. A.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Basics of cytology</article-title>. <source>Avicenna J. Med.</source> <volume>01</volume> (<issue>01</issue>), <fpage>18</fpage>&#x2013;<lpage>28</lpage>. <pub-id pub-id-type="doi">10.4103/2231-0770.83719</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Allison</surname>
<given-names>K. H.</given-names>
</name>
<name>
<surname>Reisch</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Carney</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Weaver</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>Schnitt</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>O&#x27;Malley</surname>
<given-names>F. P.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Understanding diagnostic variability in breast pathology: lessons learned from an expert consensus review panel</article-title>. <source>Histopathology</source> <volume>65</volume> (<issue>2</issue>), <fpage>240</fpage>&#x2013;<lpage>251</lpage>. <pub-id pub-id-type="doi">10.1111/his.12387</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Bebis</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Georgiopoulos</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>1994</year>). <source>Feed-forward neural networks: why network size is so important</source>. <publisher-name>IEEE Potentials</publisher-name>, <fpage>27</fpage>&#x2013;<lpage>31</lpage>. <comment>Available: <ext-link ext-link-type="uri" xlink:href="http://ieeexplore.ieee.org/xpls/abs_all.jsp?arnumber=329294">http://ieeexplore.ieee.org/xpls/abs_all.jsp?arnumber&#x3d;329294</ext-link>.</comment>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname>
<given-names>L. E. O.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Random forests</article-title>. <source>Mach. Learn.</source>, <fpage>542</fpage>&#x2013;<lpage>545</lpage>. <pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Busuttil</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2003</year>). &#x201c;<article-title>Support vector machines</article-title>,&#x201d; in <conf-name>1st Computer Science Annual Workshop (CSAW&#x2019;03)</conf-name>, <fpage>34</fpage>&#x2013;<lpage>39</lpage>.</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Canny</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>1986</year>). <article-title>A computational approach to edge detection</article-title>. <source>IEEE Trans. Pattern Anal. Mach. Intell.</source> <volume>8</volume> (<issue>6</issue>), <fpage>679</fpage>&#x2013;<lpage>698</lpage>. <pub-id pub-id-type="doi">10.1109/TPAMI.1986.4767851</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>M. Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Williamson</surname>
<given-names>D. F. K.</given-names>
</name>
<name>
<surname>Rodig</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Lindeman</surname>
<given-names>N. I.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Pathomic fusion: an integrated framework for fusing histopathology and genomic features for cancer diagnosis and prognosis</article-title>. <source>IEEE Trans. Med. Imaging</source> <volume>41</volume> (<issue>4</issue>), <fpage>757</fpage>&#x2013;<lpage>770</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2020.3021387</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cycles</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>1989</year>). <article-title>Decision trees</article-title>. <source>Cycle</source> <volume>1897</volume>, <fpage>44</fpage>&#x2013;<lpage>45</lpage>. <comment>Figure 1</comment>. <pub-id pub-id-type="doi">10.1007/0-387-25465-X</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Evans</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hero</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Minhas</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wahab</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Dodd</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Sahota</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Standardized clinical annotation of digital histopathology slides at the point of diagnosis</article-title>. <source>Mod. Pathol.</source> <volume>36</volume> (<issue>11</issue>), <fpage>100297</fpage>. <pub-id pub-id-type="doi">10.1016/j.modpat.2023.100297</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Felzenszwalb</surname>
<given-names>P. F.</given-names>
</name>
<name>
<surname>Huttenlocher</surname>
<given-names>D. P.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Efficient graph-based image segmentation</article-title>. <source>Int. J. Comput. Vis.</source> <volume>59</volume> (<issue>2</issue>), <fpage>167</fpage>&#x2013;<lpage>181</lpage>. <pub-id pub-id-type="doi">10.1023/B:VISI.0000022288.19776.77</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Freund</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Schapire</surname>
<given-names>R. E.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>A decision-theoretic generalization of on-line learning and an application to boosting</article-title>. <source>J. Comput. Syst. Sci.</source> <volume>55</volume> (<issue>1</issue>), <fpage>119</fpage>&#x2013;<lpage>139</lpage>. <pub-id pub-id-type="doi">10.1006/jcss.1997.1504</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goh</surname>
<given-names>T. Y.</given-names>
</name>
<name>
<surname>Basah</surname>
<given-names>S. N.</given-names>
</name>
<name>
<surname>Yazid</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Aziz Safar</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Ahmad Saad</surname>
<given-names>F. S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Performance analysis of image thresholding: Otsu technique</article-title>. <source>Measurement</source> <volume>114</volume>, <fpage>298</fpage>&#x2013;<lpage>307</lpage>. <pub-id pub-id-type="doi">10.1016/j.measurement.2017.09.052</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Niu</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Integration of natural and deep artificial cognitive models in medical images: BERT-based NER and relation extraction for electronic medical records</article-title>. <source>Front. Neurosci.</source> <volume>17</volume>, <fpage>1266771</fpage>. <pub-id pub-id-type="doi">10.3389/fnins.2023.1266771</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gurcan</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Boucheron</surname>
<given-names>L. E.</given-names>
</name>
<name>
<surname>Can</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Madabhushi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Rajpoot</surname>
<given-names>N. M.</given-names>
</name>
<name>
<surname>Yener</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Histopathological image analysis: a review</article-title>. <source>IEEE Rev. Biomed. Eng.</source> <volume>2</volume> (<issue>2</issue>), <fpage>147</fpage>&#x2013;<lpage>171</lpage>. <pub-id pub-id-type="doi">10.1109/RBME.2009.2034865</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gutman</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Cobb</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Somanna</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Kurc</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Cancer Digital Slide Archive: an informatics resource to support integrated <italic>in silico</italic> analysis of TCGA pathology data</article-title>. <source>J. Am. Med. Inf. Assoc.</source> <volume>20</volume> (<issue>6</issue>), <fpage>1091</fpage>&#x2013;<lpage>1098</lpage>. <pub-id pub-id-type="doi">10.1136/amiajnl-2012-001469</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>H&#xe4;gele</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Seegerer</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Lapuschkin</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bockmayr</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Samek</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Klauschen</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Resolving challenges in deep learning-based analyses of histopathological images using explanation methods</article-title>. <source>Sci. Rep.</source> <volume>10</volume> (<issue>1</issue>), <fpage>6423</fpage>&#x2013;<lpage>6512</lpage>. <pub-id pub-id-type="doi">10.1038/s41598-020-62724-2</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Deep residual learning for image recognition</article-title>. <source>Proc. IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit.</source> <volume>2016</volume>, <fpage>770</fpage>&#x2013;<lpage>778</lpage>. <pub-id pub-id-type="doi">10.1109/CVPR.2016.90</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Long</surname>
<given-names>L. R.</given-names>
</name>
<name>
<surname>Antani</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Thoma</surname>
<given-names>G. R.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Histology image analysis for carcinoma detection and grading</article-title>. <source>Comput. Methods Programs Biomed.</source> <volume>107</volume> (<issue>3</issue>), <fpage>538</fpage>&#x2013;<lpage>556</lpage>. <pub-id pub-id-type="doi">10.1016/j.cmpb.2011.12.007</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hou</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Samaras</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Kurc</surname>
<given-names>T. M.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Saltz</surname>
<given-names>J. H.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Patch-based convolutional neural network for whole slide tissue image classification</article-title>. <source>Proc. IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit.</source> <volume>2016</volume>, <fpage>2424</fpage>&#x2013;<lpage>2433</lpage>. <pub-id pub-id-type="doi">10.1109/CVPR.2016.266</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Development and validation of a deep learning model to predict survival of patients with esophageal cancer</article-title>. <source>Front. Oncol.</source> <volume>12</volume> (<issue>August</issue>), <fpage>971190</fpage>. <pub-id pub-id-type="doi">10.3389/fonc.2022.971190</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>AN OTSU image segmentation based on fruitfly optimization algorithm</article-title>. <source>Alex. Eng. J.</source> <volume>60</volume> (<issue>1</issue>), <fpage>183</fpage>&#x2013;<lpage>188</lpage>. <pub-id pub-id-type="doi">10.1016/j.aej.2020.06.054</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hussain</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Rahman</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Rahman</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Khaled</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Abdullah-Al Wadud</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hossain Khan</surname>
<given-names>M. A.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>A histogram specification technique for dark image enhancement using a local transformation method</article-title>. <source>IPSJ Trans. Comput. Vis. Appl.</source> <volume>10</volume> (<issue>1</issue>), <fpage>3</fpage>. <pub-id pub-id-type="doi">10.1186/s41074-018-0040-0</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jan</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Farman</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Khan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Imran</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Islam</surname>
<given-names>I. U.</given-names>
</name>
<name>
<surname>Ahmad</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Deep learning in big data Analytics: a comparative study</article-title>. <source>Comput. Electr. Eng.</source> <volume>75</volume>, <fpage>275</fpage>&#x2013;<lpage>287</lpage>. <pub-id pub-id-type="doi">10.1016/j.compeleceng.2017.12.009</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kalton</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Simple random sampling</article-title>. <source>Introd. Surv. Sampl.</source>, <fpage>9</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.4135/9781412984683.n2</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kermany</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Goldbaum</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Valentim</surname>
<given-names>C. C. S.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Baxter</surname>
<given-names>S. L.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Identifying medical diagnoses and treatable diseases by image-based deep learning</article-title>. <source>Cell</source> <volume>172</volume> (<issue>5</issue>), <fpage>1122</fpage>&#x2013;<lpage>1131</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2018.02.010</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kingma</surname>
<given-names>D. P.</given-names>
</name>
<name>
<surname>Ba</surname>
<given-names>J. L.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Adam: a method for stochastic optimization</article-title>. <source>3rd Int. Conf. Learn. Represent. ICLR 2015 - Conf. Track Proc.</source>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.48550/arXiv.1412.6980</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kumar</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Basu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Berglund</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Eschrich</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Schabath</surname>
<given-names>M. B.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Radiomics: the process and the challenges</article-title>. <source>Magn. Reson. Imaging</source> <volume>30</volume> (<issue>9</issue>), <fpage>1234</fpage>&#x2013;<lpage>1248</lpage>. <pub-id pub-id-type="doi">10.1016/j.mri.2012.06.010</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kumar A</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Mubarak</surname>
<given-names>D. M. N.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Classification of early stages of esophageal cancer using transfer learning</article-title>. <source>IRBM</source> <volume>43</volume> (<issue>4</issue>), <fpage>251</fpage>&#x2013;<lpage>258</lpage>. <pub-id pub-id-type="doi">10.1016/j.irbm.2021.10.003</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lakshmanan</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Anand</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jenitha</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Stain removal through color normalization of Haematoxylin and Eosin images: a review</article-title>. <source>J. Phys. Conf. Ser.</source> <volume>1362</volume> (<issue>1</issue>), <fpage>012108</fpage>. <pub-id pub-id-type="doi">10.1088/1742-6596/1362/1/012108</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le</surname>
<given-names>N.-Q.-K.</given-names>
</name>
<name>
<surname>Nguyen</surname>
<given-names>T.-T.-D.</given-names>
</name>
<name>
<surname>Ou</surname>
<given-names>Y.-Y.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Identifying the molecular functions of electron transport proteins using radial basis function networks and biochemical properties</article-title>. <source>J. Mol. Graph. Model.</source> <volume>73</volume>, <fpage>166</fpage>&#x2013;<lpage>178</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmgm.2017.01.003</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le</surname>
<given-names>N.-Q.-K.</given-names>
</name>
<name>
<surname>Ou</surname>
<given-names>Y.-Y.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Incorporating efficient radial basis function networks and significant amino acid pairs for predicting GTP binding sites in transport proteins</article-title>. <source>BMC Bioinforma.</source> <volume>17</volume> (<issue>Suppl. 19</issue>), <fpage>501</fpage>. <pub-id pub-id-type="doi">10.1186/s12859-016-1369-y</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lyon</surname>
<given-names>H. O.</given-names>
</name>
<name>
<surname>De Leenheer</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Horobin</surname>
<given-names>R. W.</given-names>
</name>
<name>
<surname>Lambert</surname>
<given-names>W. E.</given-names>
</name>
<name>
<surname>Schulte</surname>
<given-names>E. K.</given-names>
</name>
<name>
<surname>Van Liedekerke</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>1994</year>). <article-title>Standardization of reagents and methods used in cytological and histological practice with emphasis on dyes, stains and chromogenic reagents</article-title>. <source>Histochem. J.</source> <volume>26</volume> (<issue>7</issue>), <fpage>533</fpage>&#x2013;<lpage>544</lpage>. <pub-id pub-id-type="doi">10.1007/BF00158587</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mi</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Deep learning-based multi-class classification of breast digital pathology images</article-title>. <source>Cancer Manag. Res.</source> <volume>13</volume>, <fpage>4605</fpage>&#x2013;<lpage>4617</lpage>. <pub-id pub-id-type="doi">10.2147/CMAR.S312608</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muller</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Milddleton</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Alizadeh</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>K. C.</given-names>
</name>
<name>
<surname>Hryczyk</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Machine learning-based classification of chronic traumatic brain injury using hybrid diffusion imaging</article-title>. <source>Front. Neurosci.</source> <volume>17</volume>, <fpage>1182509</fpage>. <pub-id pub-id-type="doi">10.3389/fnins.2023.1182509</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mu&#xf1;oz-Aguirre</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ntasis</surname>
<given-names>V. F.</given-names>
</name>
<name>
<surname>Rojas</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Guig&#xf3;</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>PyHIST: a histological image segmentation tool</article-title>. <source>PLoS Comput. Biol.</source> <volume>16</volume> (<issue>10</issue>), <fpage>e1008349</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1008349</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Napier</surname>
<given-names>K. J.</given-names>
</name>
<name>
<surname>Scheerer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Misra</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Esophageal cancer: a review of epidemiology, pathogenesis, staging workup and treatment modalities</article-title>. <source>World J. Gastrointest. Oncol.</source> <volume>6</volume> (<issue>5</issue>), <fpage>112</fpage>&#x2013;<lpage>120</lpage>. <pub-id pub-id-type="doi">10.4251/wjgo.v6.i5.112</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Otsu</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>1979</year>). <article-title>A threshold selection method from gray-level histograms</article-title>. <source>IEEE Trans. Syst. Man. Cybern.</source> <volume>20</volume> (<issue>1</issue>), <fpage>62</fpage>&#x2013;<lpage>66</lpage>. <pub-id pub-id-type="doi">10.1109/TSMC.1979.4310076</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pakzad</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mohammadian-Hafshejani</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Khosravi</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Soltani</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Pakzad</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Mohammadian</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>The incidence and mortality of esophageal cancer and their relationship to development in Asia</article-title>. <source>Ann. Transl. Med.</source> <volume>4</volume> (<issue>2</issue>), <fpage>29</fpage>. <pub-id pub-id-type="doi">10.3978/j.issn.2305-5839.2016.01.11</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paul</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mukherjee</surname>
<given-names>D. P.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Mitosis detection for invasive breast cancer grading in histopathological images</article-title>. <source>IEEE Trans. Image Process.</source> <volume>24</volume> (<issue>11</issue>), <fpage>4041</fpage>&#x2013;<lpage>4054</lpage>. <pub-id pub-id-type="doi">10.1109/TIP.2015.2460455</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peng</surname>
<given-names>C. Y. J.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>K. L.</given-names>
</name>
<name>
<surname>Ingersoll</surname>
<given-names>G. M.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>An introduction to logistic regression analysis and reporting</article-title>. <source>J. Educ. Res.</source> <volume>96</volume> (<issue>1</issue>), <fpage>3</fpage>&#x2013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1080/00220670209598786</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pennathur</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gibson</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Jobe</surname>
<given-names>B. A.</given-names>
</name>
<name>
<surname>Luketich</surname>
<given-names>J. D.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Oesophageal carcinoma</article-title>. <source>Lancet</source> <volume>381</volume> (<issue>9864</issue>), <fpage>400</fpage>&#x2013;<lpage>412</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(12)60643-6</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Rustgi</surname>
<given-names>V. K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Genetic mutation and biological pathway prediction based on whole slide images in breast carcinoma using deep learning</article-title>. <source>npj Precis. Oncol.</source> <volume>5</volume> (<issue>1</issue>), <fpage>87</fpage>. <pub-id pub-id-type="doi">10.1038/s41698-021-00225-9</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reinhard</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ashikhmin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gooch</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Shirley</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Pre</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Reinhard</surname>
</name>
<etal/>
</person-group> (<year>2001</year>). <article-title>Color transfer between images</article-title>. <source>Appl. Percept.</source> <volume>21</volume>, <fpage>34</fpage>&#x2013;<lpage>41</lpage>. <pub-id pub-id-type="doi">10.1109/38.946629</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Roy</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Dutta</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dey</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Dey</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Chakraborty</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ray</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2014</year>). &#x201c;<article-title>Adaptive thresholding: a comparative study</article-title>,&#x201d; in <conf-name>2014 International Conference on Control, Instrumentation, Communication and Computational Technologies (ICCICCT)</conf-name>, <conf-loc>Kanyakumari, India</conf-loc>, <conf-date>10-11 July 2014</conf-date>, <fpage>1182</fpage>&#x2013;<lpage>1186</lpage>. <pub-id pub-id-type="doi">10.1109/ICCICCT.2014.6993140</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roy</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Panda</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jangid</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Modified reinhard algorithm for color normalization of colorectal cancer histopathology images</article-title>. <source>Eur. Signal Process. Conf.</source>, <fpage>1231</fpage>&#x2013;<lpage>1235</lpage>. <pub-id pub-id-type="doi">10.23919/EUSIPCO54536.2021.9616117</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Saxe</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Berlin</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2015</year>). &#x201c;<article-title>Deep neural network based malware detection using two dimensional binary program features</article-title>,&#x201d; in <conf-name>2015 10th International Conference on Malicious and Unwanted Software (MALWARE)</conf-name>, <conf-loc>Fajardo, PR, USA</conf-loc>, <conf-date>20-22 October 2015</conf-date>, <fpage>11</fpage>&#x2013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.1109/MALWARE.2015.7413680</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shimizu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Nakayama</surname>
<given-names>K. I.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Artificial intelligence in oncology</article-title>. <source>Cancer Sci.</source> <volume>111</volume> (<issue>5</issue>), <fpage>1452</fpage>&#x2013;<lpage>1460</lpage>. <pub-id pub-id-type="doi">10.1111/cas.14377</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singh</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Bhandari</surname>
<given-names>A. K.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>I. V.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Fusion-based contextually selected 3D Otsu thresholding for image segmentation</article-title>. <source>Multimed. Tools Appl.</source> <volume>80</volume> (<issue>13</issue>), <fpage>19399</fpage>&#x2013;<lpage>19420</lpage>. <pub-id pub-id-type="doi">10.1007/s11042-021-10706-5</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singh</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Borgohain</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Sarkar</surname>
<given-names>A. K.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sharma</surname>
<given-names>L. D.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Feed-forward deep neural network (FFDNN)-Based deep features for static malware detection</article-title>. <source>Int. J. Intell. Syst.</source> <volume>2023</volume>, <fpage>1</fpage>&#x2013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.1155/2023/9544481</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Srinidhi</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Ciga</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Martel</surname>
<given-names>A. L.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Deep neural network models for computational histopathology: a survey</article-title>. <source>Med. Image Anal.</source> <volume>67</volume> (<issue>1</issue>), <fpage>101813</fpage>&#x2013;<lpage>102148</lpage>. <pub-id pub-id-type="doi">10.1016/j.media.2020.101813</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sung</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ferlay</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Siegel</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Laversanne</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Soerjomataram</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Jemal</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Global cancer statistics 2020: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>. <source>Ca. Cancer J. Clin.</source> <volume>71</volume> (<issue>3</issue>), <fpage>209</fpage>&#x2013;<lpage>249</lpage>. <pub-id pub-id-type="doi">10.3322/caac.21660</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tomaszewski</surname>
<given-names>J. E.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Overview of the role of artificial intelligence in pathology: the computer as a pathology digital assistant</article-title>. <source>Artif. Intell. Deep Learn. Pathol.</source>, <fpage>237</fpage>&#x2013;<lpage>262</lpage>. <pub-id pub-id-type="doi">10.1016/B978-0-323-67538-3.00011-7</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tran</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Kondrashova</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Bradley</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>E. D.</given-names>
</name>
<name>
<surname>Pearson</surname>
<given-names>J. V.</given-names>
</name>
<name>
<surname>Waddell</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Deep learning in cancer diagnosis, prognosis and treatment selection</article-title>. <source>Genome Med.</source> <volume>13</volume> (<issue>1</issue>), <fpage>152</fpage>&#x2013;<lpage>217</lpage>. <pub-id pub-id-type="doi">10.1186/s13073-021-00968-x</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vahadane</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sethi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Albarqouni</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Baust</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Structure-preserving color normalization and sparse stain separation for histological images</article-title>. <source>IEEE Trans. Med. Imaging</source> <volume>35</volume> (<issue>8</issue>), <fpage>1962</fpage>&#x2013;<lpage>1971</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2016.2529665</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wagner</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Cosgrove</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Predicting endometrial cancer molecular classification from histology slides using deep learning (030)</article-title>. <source>Gynecol. Oncol.</source> <volume>176</volume>, <fpage>S23</fpage>. <pub-id pub-id-type="doi">10.1016/j.ygyno.2023.06.495</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Trends in using deep learning algorithms in biomedical prediction systems</article-title>. <source>Front. Neurosci.</source> <volume>17</volume>, <fpage>1256351</fpage>. <pub-id pub-id-type="doi">10.3389/fnins.2023.1256351</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <source>Classification of epithelial ovarian carcinoma whole-slide pathology images using deep transfer learning</source>, <fpage>1</fpage>&#x2013;<lpage>5</lpage>. <comment>Available: <ext-link ext-link-type="uri" xlink:href="http://arxiv.org/abs/2005.10957">http://arxiv.org/abs/2005.10957</ext-link>.</comment>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiao</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Niu</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Leveraging natural cognitive systems in conjunction with ResNet50-BiGRU model and attention mechanism for enhanced medical image analysis and sports injury prediction</article-title>. <source>Front. Neurosci.</source> <volume>17</volume>, <fpage>1273931</fpage>. <pub-id pub-id-type="doi">10.3389/fnins.2023.1273931</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Rao</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Understanding esophageal cancer: the challenges and opportunities for the next decade</article-title>. <source>Front. Oncol.</source> <volume>10</volume> (<issue>September</issue>), <fpage>1727</fpage>&#x2013;<lpage>1813</lpage>. <pub-id pub-id-type="doi">10.3389/fonc.2020.01727</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zewdie</surname>
<given-names>E. T.</given-names>
</name>
<name>
<surname>Tessema</surname>
<given-names>A. W.</given-names>
</name>
<name>
<surname>Simegn</surname>
<given-names>G. L.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Classification of breast cancer types, sub-types and grade from histopathological images using deep learning technique</article-title>. <source>Health Technol.</source> <volume>11</volume> (<issue>6</issue>), <fpage>1277</fpage>&#x2013;<lpage>1290</lpage>. <pub-id pub-id-type="doi">10.1007/s12553-021-00592-0</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Ju</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhen</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Deep learning-based diagnosis of histopathological patterns for invasive non-mucinous lung adenocarcinoma using semantic segmentation</article-title>. <source>BMJ Open</source> <volume>13</volume> (<issue>7</issue>), <fpage>e069181</fpage>. <pub-id pub-id-type="doi">10.1136/bmjopen-2022-069181</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Rahaman</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ai</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>A comprehensive review for breast histopathology image analysis using classical and deep neural networks</article-title>. <source>IEEE Access</source> <volume>8</volume>, <fpage>90931</fpage>&#x2013;<lpage>90956</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2020.2993788</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>