<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychiatry</journal-id>
<journal-title>Frontiers in Psychiatry</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychiatry</abbrev-journal-title>
<issn pub-type="epub">1664-0640</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyt.2024.1395563</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Psychiatry</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Enhancing Alzheimer&#x2019;s disease diagnosis and staging: a multistage CNN framework using MRI</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Ali</surname>
<given-names>Muhammad Umair</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1275589"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Kim</surname>
<given-names>Kwang Su</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Khalid</surname>
<given-names>Majdi</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2673013"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Farrash</surname>
<given-names>Majed</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zafar</surname>
<given-names>Amad</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/570476"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Lee</surname>
<given-names>Seung Won</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2058535"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Artificial Intelligence and Robotics, Sejong University</institution>, <addr-line>Seoul</addr-line>, <country>Republic of Korea</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Scientific Computing, Pukyong National University</institution>, <addr-line>Busan</addr-line>, <country>Republic of Korea</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Interdisciplinary Biology Laboratory (iBLab), Division of Biological Science, Graduate School of Science, Nagoya University</institution>, <addr-line>Nagoya</addr-line>, <country>Japan</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department of Computer Science and Artificial Intelligence, College of Computing, Umm Al-Qura University</institution>, <addr-line>Makkah</addr-line>, <country>Saudi Arabia</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Department of Precision Medicine, Sungkyunkwan University School of Medicine</institution>, <addr-line>Suwon</addr-line>, <country>Republic of Korea</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Gaelle Eve Doucet, Boys Town National Research Hospital, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Karthik R, Vellore Institute of Technology (VIT), India</p>
<p>Jannik Prasuhn, Johns Hopkins University, United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Amad Zafar, <email xlink:href="mailto:amad@sejong.ac.kr">amad@sejong.ac.kr</email>; Seung Won Lee, <email xlink:href="mailto:swleemd@g.skku.edu">swleemd@g.skku.edu</email>
</p>
</fn>
<fn fn-type="equal" id="fn003">
<p>&#x2020;These authors have contributed equally to this work and share first authorship</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>24</day>
<month>06</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1395563</elocation-id>
<history>
<date date-type="received">
<day>04</day>
<month>03</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>07</day>
<month>06</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Ali, Kim, Khalid, Farrash, Zafar and Lee</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Ali, Kim, Khalid, Farrash, Zafar and Lee</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>This study addresses the pervasive and debilitating impact of Alzheimer&#x2019;s disease (AD) on individuals and society, emphasizing the crucial need for timely diagnosis. We present a multistage convolutional neural network (CNN)-based framework for AD detection and sub-classification using brain magnetic resonance imaging (MRI). After preprocessing, a 26-layer CNN model was designed to differentiate between healthy individuals and patients with dementia. After detecting dementia, the 26-layer CNN model was reutilized using the concept of transfer learning to further subclassify dementia into mild, moderate, and very mild dementia. Leveraging the frozen weights of the developed CNN on correlated medical images facilitated the transfer learning process for sub-classifying dementia classes. An online AD dataset was used to verify the performance of the proposed multistage CNN-based framework. The proposed approach yielded a noteworthy accuracy of 98.24% in identifying dementia classes, whereas it achieved 99.70% accuracy in dementia subclassification. Another dataset was used to further validate the proposed framework, resulting in 100% performance. Comparative evaluations against pre-trained models and the current literature were also conducted, highlighting the usefulness and superiority of the proposed framework and presenting it as a robust and effective AD detection and subclassification method.</p>
</abstract>
<kwd-group>
<kwd>Alzheimer&#x2019;s disease</kwd>
<kwd>MRI</kwd>
<kwd>convolutional neural network</kwd>
<kwd>dementia</kwd>
<kwd>neuroimaging</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Research Foundation of Korea<named-content content-type="fundref-id">10.13039/501100003725</named-content>
</contract-sponsor>
<counts>
<fig-count count="8"/>
<table-count count="6"/>
<equation-count count="8"/>
<ref-count count="50"/>
<page-count count="15"/>
<word-count count="5756"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Aging Psychiatry</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Alzheimer&#x2019;s disease (AD) is a progressive neurodegenerative disease that causes irreversible cognitive dysfunction, amnesia, and progressive loss of brain function, eventually resulting in an inability to function independently in daily life (<xref ref-type="bibr" rid="B1">1</xref>). AD is the most prevalent type of dementia and requires a high level of medical attention. Global projections anticipate a significant increase in the number of individuals affected by AD, with an estimated 152 million affected by 2050 compared to the current 47 million. This poses challenges across the economic, medical, and societal domains (<xref ref-type="bibr" rid="B2">2</xref>). Every 3 seconds, one person worldwide is affected by dementia, with AD accounting for 60% of all dementia cases (<xref ref-type="bibr" rid="B3">3</xref>). The phases of dementia associated with AD can be broadly divided into the following categories: i) mild cognitive impairment (MCI), ii) mild dementia, iii) moderate dementia, and iv) severe dementia. MCI, which is often characterized by memory loss with increasing age, can lead to dementia in certain individuals. Individuals with mild dementia occasionally struggle with cognitive deficits that affect their daily activities. The symptoms include disorientation, memory loss, uncertainty, personality changes, and difficulties in performing daily chores. Moderate dementia significantly complicates daily life and requires greater assistance and care. These symptoms are more prominent and resemble those observed in patients with mild dementia. Individuals may require assistance with basic tasks, such as brushing their hair, and experience significant personality changes, including sudden onset of irritation or anxiety. Sleep disturbances are also frequent. Patients with severe dementia experience a marked decline in their condition as symptoms progress. Loss of communication skills may necessitate full-time care. 
The inability to perform basic activities, such as sitting in a chair or holding one&#x2019;s head up, and loss of bladder control are characteristics of this stage.</p>
<p>Currently, there are no viable treatments to cure or slow the progression of AD, and a complete understanding of its pathogenesis remains elusive. MCI is the transitional stage between AD and normal cognitive aging. Individuals with MCI are more likely to develop AD than those with age-matched healthy cognition (<xref ref-type="bibr" rid="B4">4</xref>). Preventive strategies to limit disease progression as well as efficient treatment and care procedures depend on the early detection of AD.</p>
<p>Medical history, physical examination, and further diagnostic tests such as neurological screenings that examine reflexes, coordination, and muscle tone are all common components of AD diagnostic evaluation (<xref ref-type="bibr" rid="B5">5</xref>). Magnetic resonance imaging (MRI), computed tomography (CT), and positron emission tomography (PET) are important imaging techniques for the diagnosis of AD. In particular, fluid-attenuated inversion recovery sequences in MRI are used to suppress the cerebrospinal fluid, allowing for a more thorough evaluation of anatomical structures and examination of gliotic alterations (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B7">7</xref>). The advantages of MRI include improved flexibility, clear tissue contrast, lack of ionizing radiation, and the capacity to provide insightful information regarding the structure of the human brain (<xref ref-type="bibr" rid="B8">8</xref>). Developing an improved computer-aided diagnostic system capable of analyzing MRI images to determine whether individuals have AD or are in good health is crucial.</p>
<p>A wide range of machine-learning methodologies that integrate neuroimaging have improved the accuracy of identifying distinct dementia subtypes (<xref ref-type="bibr" rid="B9">9</xref>). Conventional machine-learning methods such as support vector machine (SVM) (<xref ref-type="bibr" rid="B10">10</xref>), random forest (<xref ref-type="bibr" rid="B11">11</xref>), and linear program boosting algorithms (<xref ref-type="bibr" rid="B12">12</xref>) have been used to detect AD using MRI (<xref ref-type="bibr" rid="B13">13</xref>). Furthermore, variants of SVM and ensembles of classifiers have also been proposed. However, conventional machine-learning approaches frequently require the manual selection of predefined brain areas of interest based on established MRI markers linked to AD. Due to an inadequate understanding of definitive MRI biomarkers for AD, predetermined regions are likely unable to include all the information required to unravel the complexities of AD. In addition to being labor-intensive and time-consuming, manual selection also has the potential for subjective errors. Likewise, when it comes to choosing ensemble methods, managing computational expenses poses a significant challenge.</p>
<p>In contrast, deep-learning networks adopt a more advanced approach, including methods such as convolutional neural networks (CNNs), deep belief networks, recurrent neural networks, long short-term memory, stacked autoencoders, and restricted Boltzmann machines (<xref ref-type="bibr" rid="B14">14</xref>&#x2013;<xref ref-type="bibr" rid="B17">17</xref>). These techniques combine low-level features in the data to automatically create a higher-level, more abstract representation of a learning system (<xref ref-type="bibr" rid="B18">18</xref>). Because of their high image classification accuracy, state-of-the-art deep-learning techniques are preferred over conventional machine-learning methods. In general, CNN and its variants are the most popular deep-learning algorithms due to their better performance in identifying AD. CNN models are widely used in segmentation, object recognition, and classification (<xref ref-type="bibr" rid="B19">19</xref>&#x2013;<xref ref-type="bibr" rid="B21">21</xref>). This popularity can be attributed to several benefits including leveraging the spatial information of neighboring pixels, direct acceptance of image data as input, and efficient reduction of model parameters by utilizing weight-sharing, subsampling, and local receptive fields. A CNN trained using MRI slices can automatically extract features from images, thereby eliminating the requirement for manual feature selection during the learning phase (<xref ref-type="bibr" rid="B22">22</xref>). Furthermore, they also display higher generalization skills when dealing with scans from various sources or scanners.</p>
<p>Several CNN models have recently been proposed as diagnostic tools (<xref ref-type="bibr" rid="B23">23</xref>). Lu et&#xa0;al. (<xref ref-type="bibr" rid="B24">24</xref>) presented a multimodal CNN model using MRI and PET. Their proposed framework yielded an accuracy of 82.4% for patients with MCI who were subsequently diagnosed with AD. The model achieved a classification accuracy of 86.3% for individuals without dementia. In another study (<xref ref-type="bibr" rid="B25">25</xref>), accuracies of 90.05% and 85.55% were achieved for different datasets using CNN-based features and softmax as classifiers for binary classification (normal controls and AD). A pretrained AlexNet CNN model was used to retrieve deep features, and conventional machine-learning methods were used as classifiers (<xref ref-type="bibr" rid="B26">26</xref>). The results showed that the proposed methodology outperformed other handcrafted features with an accuracy of 99.21%. A VGG-16-based CNN model was used to classify the MRI slices (<xref ref-type="bibr" rid="B27">27</xref>). The model achieved a high accuracy of 95.73% for ternary classification problems (early MCI, normal control, and late MCI). Pan et&#xa0;al. (<xref ref-type="bibr" rid="B28">28</xref>) hybridized ensemble learning and CNN models to classify brain MRI for various classification problems. Their models exhibited reasonable classification performance. Murugan et&#xa0;al. (<xref ref-type="bibr" rid="B29">29</xref>) presented the DEMNET model to classify various stages of dementia using MRI. They used the synthetic minority oversampling technique (SMOTE) approach to resolve class imbalance issues. Their model achieved a high accuracy of 95.23% for four classes. Although DEMNET shows high classification performance, the accuracy obtained on an augmented dataset is not considered reliable for real-time applications. Recently, Fathi et&#xa0;al. 
(<xref ref-type="bibr" rid="B30">30</xref>) introduced a weighted probability-based ensemble method to combine six 2D-CNN architectures and obtain a high classification rate of 93.88% for four classes. Furthermore, they compared different ensemble methods and showed that the ensemble methods yielded better results than individual architectures. Kang et&#xa0;al. (<xref ref-type="bibr" rid="B31">31</xref>) proposed a three-round learning strategy based on a 3D deep convolutional generative adversarial network model and obtained an accuracy of 92.8% for two classes.</p>
<p>To improve the prediction performance, numerous studies have recently included attention models. The attention models focus on the most informative image regions. By combining two distinct attention modules (i.e., enhanced non-local attention and coordinate attention), Illakiya et&#xa0;al. (<xref ref-type="bibr" rid="B32">32</xref>) presented an adaptive hybrid attention network to enhance the performance of the DenseNet architecture, resulting in a higher classification accuracy of 98.53%. Similarly, in another study (<xref ref-type="bibr" rid="B33">33</xref>), an integrated model consisting of a depthwise group shuffle, global context network, hybrid multi-focus attention block, and EfficientNet-B0 was developed to improve the prediction performance of MCI classification. Zhang et&#xa0;al. (<xref ref-type="bibr" rid="B34">34</xref>) developed an end-to-end 3D CNN framework based on the ResNet architecture, which employs multi-modality brain images to perform AD diagnostic and MCI prediction tasks by integrating 3D attention processes with multi-layer feature fusion algorithms. They showed that their multimodal model outperformed a single modality in predicting AD and MCI, with superior results of 6.37% and 3.51%, respectively. Some studies have also combined the transformer and attention networks. Hu et&#xa0;al. (<xref ref-type="bibr" rid="B35">35</xref>) designed a classifier model by combining a CNN with a Swin transformer. In addition, they added a shifted-window attention mechanism to the transformer to improve the feature extraction. They achieved an accuracy of 93.5% for the two classes using their proposed model. Illakiya et&#xa0;al. (<xref ref-type="bibr" rid="B36">36</xref>) utilized a Swin transformer, a dimension-centric proximity-aware attention network, and an age deviation factor to improve feature extraction from brain MRI images. 
The proposed network improves the classification results by utilizing a novel feature fusion strategy that incorporates global, local, and proximal characteristics, as well as dimensional dependencies. The literature describes various methods for classifying AD using conventional machine-learning and deep-learning models. However, there are challenges related to the large number of model parameters, training time, and high performance without augmentation in multiclass AD classification.</p>
<p>To address these issues, the primary contributions and steps of this study are outlined below:</p>
<list list-type="bullet">
<list-item>
<p>We hypothesized that leveraging the frozen weights of the developed CNN on correlated medical images facilitates the transfer learning process for sub-classifying dementia classes.</p>
</list-item>
<list-item>
<p>To prove the hypothesis, a lightweight CNN model was developed in stage 1 to detect dementia using MRI images after preprocessing.</p>
</list-item>
<list-item>
<p>In stage 2, a new model was built by reutilizing the frozen weights of the developed model for further classification of dementia into mild, moderate, and very mild dementia using transfer learning.</p>
</list-item>
<list-item>
<p>Various online AD datasets were used to validate the proposed model.</p>
</list-item>
<list-item>
<p>Various pre-trained models were trained using the same parameters and datasets for a fair comparison.</p>
</list-item>
</list>
<p>The results were compared with those reported in the literature.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Proposed framework</title>
<p>The proposed CNN-based framework is depicted in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>. In the proposed framework, dementia detection and sub-classification were divided into two stages (i.e., stage 1 and stage 2). In stage 1, the brain MRI scans were classified into two classes (healthy and dementia) using a proposed 26-layer CNN model (presented in Section 2.4). In stage 2, transfer learning was used to reutilize the frozen weights of the 26-layer CNN model (i.e., developed in stage 1) to fine-tune the new transfer-learned model by replacing the last three layers of the developed CNN for dementia subclassification (mild, moderate, and very mild dementia).</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>CNN-based proposed framework for dementia detection and subclassification.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-g001.tif"/>
</fig>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Datasets</title>
<p>Two different datasets (the Alzheimer&#x2019;s dataset (four classes of images) and ADNI_Extracted_Axial) were used to validate the proposed approach. Both datasets are publicly available (<ext-link ext-link-type="uri" xlink:href="https://www.kaggle.com/datasets/tourist55/alzheimers-dataset-4-class-of-images">https://www.kaggle.com/datasets/tourist55/alzheimers-dataset-4-class-of-images</ext-link> and <ext-link ext-link-type="uri" xlink:href="https://www.kaggle.com/datasets/katalniraj/adni-extracted-axial">https://www.kaggle.com/datasets/katalniraj/adni-extracted-axial</ext-link>; accessed November 13, 2023). The specifications of these datasets are listed in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Details of various online available datasets.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Dataset</th>
<th valign="middle" align="center">Classification</th>
<th valign="middle" align="center">Subclassification</th>
<th valign="middle" align="center">MRI Slices</th>
<th valign="middle" align="center">No. of Samples</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="4" align="left">Alzheimer&#x2019;s<break/>Dataset</td>
<td valign="middle" align="left">Healthy</td>
<td valign="middle" align="left">Lack of Dementia</td>
<td valign="top" align="left">
<inline-graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-i001.tif"/>
</td>
<td valign="middle" align="left">2560</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="left">Dementia</td>
<td valign="middle" align="left">Mild Dementia</td>
<td valign="top" align="left">
<inline-graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-i002.tif"/>
</td>
<td valign="middle" align="left">717</td>
</tr>
<tr>
<td valign="middle" align="left">Moderate Dementia</td>
<td valign="top" align="left">
<inline-graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-i003.tif"/>
</td>
<td valign="middle" align="left">52</td>
</tr>
<tr>
<td valign="middle" align="left">Very Mild Dementia</td>
<td valign="top" align="left">
<inline-graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-i004.tif"/>
</td>
<td valign="middle" align="left">1792</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="left">ADNI_Extracted<break/>_Axial</td>
<td valign="middle" align="left">Healthy</td>
<td valign="middle" align="left">Common Normal</td>
<td valign="top" align="left">
<inline-graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-i005.tif"/>
</td>
<td valign="middle" align="left">1440</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="left">Dementia</td>
<td valign="middle" align="left">Alzheimer&#x2019;s Disease</td>
<td valign="top" align="left">
<inline-graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-i006.tif"/>
</td>
<td valign="middle" align="left">1124</td>
</tr>
<tr>
<td valign="middle" align="left">Mild Cognitive Impairment</td>
<td valign="top" align="left">
<inline-graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-i007.tif"/>
</td>
<td valign="middle" align="left">2590</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Pre-processing</title>
<p>In CNN applications, irrelevant information in an image can adversely affect the subsequent image-processing steps. Preprocessing is imperative to address this issue and ensure the accuracy of subsequent steps in image processing. Therefore, cropping was applied to remove unwanted information, and a zero-center approach was applied for normalization (<xref ref-type="bibr" rid="B37">37</xref>). After preprocessing and normalization of the dataset, the images were input into a developed CNN, which identified the AD-affected area by extracting discriminating features.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Design of CNN for AD Detection</title>
<p>CNNs are a type of deep-learning model developed specifically for analyzing structured grid data, such as images. Their ability to learn hierarchical feature representations autonomously has revolutionized computer vision tasks. CNNs comprise layers that perform convolutional operations to capture local patterns and pooling operations to reduce spatial dimensions. Weight sharing characterizes these networks, allowing them to recognize comparable features across the input space. Convolutional layers are often followed by fully connected layers to achieve a high level of feature integration and classification. CNNs excel at image identification, object detection, and segmentation and demonstrate superior performance across various domains. The ability of CNNs to automatically extract significant characteristics from raw data makes them valuable tools for complicated pattern detection, leading to the development of artificial intelligence.</p>
<p>In this study, a 26-layer CNN model was developed from scratch to detect dementia in stage 1. This architecture comprised five blocks of convolutional layers, batch normalization, ReLU activation functions, and max-pooling layers. Fully connected layers and a softmax output layer were used for the classification. The model uses dropout for regularization, and the final output layer employs cross-entropy loss. Complete information regarding the designed CNN model is presented in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>. The details of the layers are presented in the subsequent sections.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Details of the designed CNN model for AD detection.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Layer No.</th>
<th valign="top" align="center">Type of Layer</th>
<th valign="top" align="center">Properties</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">Image Input</td>
<td valign="top" align="center">227&#xd7;227&#xd7;1 images with &#x2018;zerocenter&#x2019; normalization</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2-D Convolution</td>
<td valign="top" align="center">32 3&#xd7;3&#xd7;1 convolutions with stride [2 2] and padding [0 0 0 0]</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">Batch Normalization</td>
<td valign="top" align="center">Batch normalization with 32 channels</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">ReLU</td>
<td valign="top" align="center">ReLU</td>
</tr>
<tr>
<td valign="top" align="center">5</td>
<td valign="top" align="center">2-D Max Pooling</td>
<td valign="top" align="center">2&#xd7;2 max pooling with stride [2 2] and padding [0 0 0 0]</td>
</tr>
<tr>
<td valign="top" align="center">6</td>
<td valign="top" align="center">2-D Convolution</td>
<td valign="top" align="center">32 3&#xd7;3&#xd7;32 convolutions with stride [1 1] and padding [2 2 2 2]</td>
</tr>
<tr>
<td valign="top" align="center">7</td>
<td valign="top" align="center">Batch Normalization</td>
<td valign="top" align="center">Batch normalization with 32 channels</td>
</tr>
<tr>
<td valign="top" align="center">8</td>
<td valign="top" align="center">ReLU</td>
<td valign="top" align="center">ReLU</td>
</tr>
<tr>
<td valign="top" align="center">9</td>
<td valign="top" align="center">2-D Max Pooling</td>
<td valign="top" align="center">2&#xd7;2 max pooling with stride [2 2] and padding [0 0 0 0]</td>
</tr>
<tr>
<td valign="top" align="center">10</td>
<td valign="top" align="center">Batch Normalization</td>
<td valign="top" align="center">Batch normalization with 32 channels</td>
</tr>
<tr>
<td valign="top" align="center">11</td>
<td valign="top" align="center">2-D Convolution</td>
<td valign="top" align="center">64 3&#xd7;3&#xd7;32 convolutions with stride [1 1] and padding [2 2 2 2]</td>
</tr>
<tr>
<td valign="top" align="center">12</td>
<td valign="top" align="center">ReLU</td>
<td valign="top" align="center">ReLU</td>
</tr>
<tr>
<td valign="top" align="center">13</td>
<td valign="top" align="center">2-D Max Pooling</td>
<td valign="top" align="center">2&#xd7;2 max pooling with stride [2 2] and padding [0 0 0 0]</td>
</tr>
<tr>
<td valign="top" align="center">14</td>
<td valign="top" align="center">2-D Convolution</td>
<td valign="top" align="center">128 3&#xd7;3&#xd7;64 convolutions with stride [1 1] and padding [2 2 2 2]</td>
</tr>
<tr>
<td valign="top" align="center">15</td>
<td valign="top" align="center">Batch Normalization</td>
<td valign="top" align="center">Batch normalization with 128 channels</td>
</tr>
<tr>
<td valign="top" align="center">16</td>
<td valign="top" align="center">ReLU</td>
<td valign="top" align="center">ReLU</td>
</tr>
<tr>
<td valign="top" align="center">17</td>
<td valign="top" align="center">2-D Max Pooling</td>
<td valign="top" align="center">2&#xd7;2 max pooling with stride [2 2] and padding [0 0 0 0]</td>
</tr>
<tr>
<td valign="top" align="center">18</td>
<td valign="top" align="center">2-D Convolution</td>
<td valign="top" align="center">256 3&#xd7;3&#xd7;128 convolutions with stride [1 1] and padding [2 2 2 2]</td>
</tr>
<tr>
<td valign="top" align="center">19</td>
<td valign="top" align="center">Batch Normalization</td>
<td valign="top" align="center">Batch normalization with 256 channels</td>
</tr>
<tr>
<td valign="top" align="center">20</td>
<td valign="top" align="center">ReLU</td>
<td valign="top" align="center">ReLU</td>
</tr>
<tr>
<td valign="top" align="center">21</td>
<td valign="top" align="center">Batch Normalization</td>
<td valign="top" align="center">Batch normalization with 256 channels</td>
</tr>
<tr>
<td valign="top" align="center">22</td>
<td valign="top" align="center">Fully Connected</td>
<td valign="top" align="center">1024 fully connected layer</td>
</tr>
<tr>
<td valign="top" align="center">23</td>
<td valign="top" align="center">Dropout</td>
<td valign="top" align="center">30% dropout</td>
</tr>
<tr>
<td valign="top" align="center">24</td>
<td valign="top" align="center">Fully Connected</td>
<td valign="top" align="center">2 fully connected layer</td>
</tr>
<tr>
<td valign="top" align="center">25</td>
<td valign="top" align="center">Softmax</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="center">26</td>
<td valign="top" align="center">Classification Output</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>CNN, convolutional neural network; AD, Alzheimer&#x2019;s disease; ReLU, rectified linear unit activation.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<sec id="s2_4_1">
<label>2.4.1</label>
<title>Input layer</title>
<p>The input layer of the developed model represents the initial layer and accepts normalized images. This layer sets the input size and normalization strategy for the subsequent processing.</p>
</sec>
<sec id="s2_4_2">
<label>2.4.2</label>
<title>Convolutional layer</title>
<p>Convolutional layers form the foundation of any CNN model and are responsible for the extensive computational work. The input image is passed through this layer to produce a feature map or response by convolving it with weight filters and adding bias values. Subsequently, the feature response is passed through the following layers. Mathematically, convolution involves taking the element-wise product of the filter and a patch of the input and summing up all these products. For an input (<italic>x</italic>), the output (<italic>y</italic>) can be expressed as <xref ref-type="disp-formula" rid="eq1">Equation (1)</xref>.</p>
<disp-formula id="eq1">
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mo>=</mml:mo>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>W</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>W</italic> and <italic>b<sub>i</sub>
</italic> are the filter and bias of each filter, respectively.</p>
</sec>
<sec id="s2_4_3">
<label>2.4.3</label>
<title>Batch normalization</title>
<p>Batch normalization was applied to the output of the convolutional layer. This layer normalizes the activation and enhances convergence and training stability. This introduced learnable parameters for scaling and shifting. <italic>x</italic> is assumed to be the convolutional layer output. Batch normalization normalizes <italic>x</italic> across batch dimensions using <xref ref-type="disp-formula" rid="eq2">Equation (2)</xref> (<xref ref-type="bibr" rid="B38">38</xref>):</p>
<disp-formula id="eq2">
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:msup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>&#x3bc;</italic> is the mean, <italic>&#x3c3;</italic><sup>2</sup> is the variance, and <inline-formula>
<mml:math display="inline" id="im1">
<mml:mi>&#x3b5;</mml:mi>
</mml:math>
</inline-formula> is a small constant used to avoid division by zero. It scales and shifts the normalized output <inline-formula>
<mml:math display="inline" id="im2">
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
<mml:mo>+</mml:mo>
<mml:mi>&#x3b2;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, where <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> are learnable parameters.</p>
</sec>
<sec id="s2_4_4">
<label>2.4.4</label>
<title>Rectified linear unit activation</title>
<p>The rectified linear unit (ReLU) activation function was applied element-wise. ReLUs introduce nonlinearity, which allows the model to capture more complex data patterns. If the input value is positive, the ReLU activation function immediately outputs the value. If not positive, it outputs zero. This can be mathematically expressed as <xref ref-type="disp-formula" rid="eq3">Equation (3)</xref> (<xref ref-type="bibr" rid="B29">29</xref>):</p>
<disp-formula id="eq3">
<label>(3)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mi>max</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
</sec>
<sec id="s2_4_5">
<label>2.4.5</label>
<title>Max pooling</title>
<p>Pooling layers were used between the convolutional layers to reduce the representation in the spatial domain and computation space. Max pooling helps retain essential information while reducing the computational complexity by reducing the spatial dimensions. Max pooling was calculated using <xref ref-type="disp-formula" rid="eq4">Equation (4)</xref> (<xref ref-type="bibr" rid="B29">29</xref>):</p>
<disp-formula id="eq4">
<label>(4)</label>
<mml:math display="block" id="M4">
<mml:mrow>
<mml:mtext>Max&#xa0;Pooling</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mtext>Input&#xa0;</mml:mtext>
<mml:mi>x</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext>Pooling&#xa0;window&#xa0;size</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>stride</mml:mtext>
</mml:mrow>
</mml:mfrac>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
</sec>
<sec id="s2_4_6">
<label>2.4.6</label>
<title>Fully connected layer</title>
<p>The fully connected layer is densely connected. It captures high-level features from convolutional layers and prepares a classification model. Mathematically, this can be expressed as <xref ref-type="disp-formula" rid="eq5">Equation (5)</xref>.</p>
<disp-formula id="eq5">
<label>(5)</label>
<mml:math display="block" id="M5">
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>W</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>
</sec>
<sec id="s2_4_7">
<label>2.4.7</label>
<title>Dropout layer</title>
<p>Dropout prevents overfitting by randomly deactivating neurons during training, enhancing model generalization.</p>
</sec>
<sec id="s2_4_8">
<label>2.4.8</label>
<title>Softmax</title>
<p>Softmax applies an activation function to convert logits into class probabilities. Softmax ensures that the sum of probabilities for all classes is one.</p>
</sec>
<sec id="s2_4_9">
<label>2.4.9</label>
<title>Classification output</title>
<p>It uses cross-entropy loss, specifically &#x2018;crossentropyex&#x2019; in MATLAB, for model training. Cross-entropy measures the dissimilarity between predicted and actual class probabilities as <xref ref-type="disp-formula" rid="eq6">Equation (6)</xref>.</p>
<disp-formula id="eq6">
<label>(6)</label>
<mml:math display="block" id="M6">
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>p</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xb7;</mml:mo>
<mml:mi>log</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>H</italic> denotes the cross-entropy loss, <italic>y<sub>i</sub>
</italic> denotes the predicted probability distribution, and <italic>p<sub>i</sub>
</italic> denotes the true probability distribution.</p>
</sec>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Design of transfer learned CNN for subclassification</title>
<p>Transfer learning, a machine-learning technique, leverages pre-existing models to expedite learning in new tasks. That is, the model developed for a task is reused as the starting point for the model for a second task. This approach is particularly useful when data are scarce. The main concept of transfer learning is to leverage the features learned from tasks with a large amount of available data to improve the performance of tasks with less data. This is based on the idea that tasks share commonalities that can be utilized to improve performance. Assume that a domain is composed of two elements (<xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B40">40</xref>), as shown in <xref ref-type="disp-formula" rid="eq7">Equation (7)</xref>.</p>
<disp-formula id="eq7">
<label>(7)</label>
<mml:math display="block" id="M7">
<mml:mrow>
<mml:msub>
<mml:mi>A</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mi>Y</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>b</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq7">Equation (7)</xref>, <italic>Y</italic> and <italic>prob</italic>(<italic>y</italic>) denote the feature space and marginal probability, respectively. Suppose a task has two components:</p>
<disp-formula id="eq8">
<label>(8)</label>
<mml:math display="block" id="M8">
<mml:mrow>
<mml:msub>
<mml:mi>L</mml:mi>
<mml:mi>r</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq8">Equation (8)</xref>, <italic>X</italic> and <italic>&#x3b1;</italic> symbolize the label space and the objective function, respectively. Here, <inline-formula>
<mml:math display="inline" id="im3">
<mml:mrow>
<mml:msubsup>
<mml:mi>A</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>s</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im4">
<mml:mrow>
<mml:msubsup>
<mml:mi>L</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>s</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> represent the source domain and task, respectively, and <inline-formula>
<mml:math display="inline" id="im5">
<mml:mrow>
<mml:msubsup>
<mml:mi>A</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im6">
<mml:mrow>
<mml:msubsup>
<mml:mi>L</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>t</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> represent the target domain and task, respectively. The goal of transfer learning is to utilize knowledge from the source domain to understand the conditional probability in the target domain.</p>
<p>In stage 2 of this study, transfer learning is applied to the 26-layer CNN model that was developed in the first stage (section 2.4). Reutilizing the frozen weights of the 26-layer CNN model, the model was retrained by replacing the last three layers (i.e., fully connected, softmax, and classification layers) for dementia subclassification (mild, moderate, and very mild dementia). <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref> shows the concept of knowledge sharing from dementia to dementia subclassification.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>The concept of knowledge sharing.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-g002.tif"/>
</fig>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<p>MATLAB 2023a was used to perform all simulations and analyses on a personal computer with the following specifications: Core i7, 12th Generation, 32 GB RAM, NVIDIA GeForce RTX 3050, 1 TB SSD, and 64-bit Windows 11 operating system. The dataset was randomly divided in an 80:20 ratio for model training and testing, respectively. The images used for model testing were not used to train the CNN. The following initial parameters were utilized: 100 epochs, a momentum of 0.9, a mini-batch size of 128, and a learning rate of 0.001. The stochastic gradient descent with momentum (SGDM) solver was utilized to train and test the model.</p>
<p>First, various publicly available pre-trained CNNs, such as ResNet50, Inception-v3, GoogleNet, EfficientNet-b0, and DenseNet-201, were used to categorize the brain MRI dataset. Subsequently, the proposed CNN model was trained to classify the brain MRI scans using the same parameters. <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref> shows a performance comparison of various pre-trained models with the developed 26-layer CNN; and the confusion matrix of all models is presented in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>, which also shows the true positive rate (TPR), false negative rate (FNR), positive predictive value (PPV), and false discovery rate (FDR).</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Performance comparison of various CNN models for Alzheimer&#x2019;s Dataset.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" align="center">Parameters</th>
<th valign="middle" colspan="6" align="center">CNN</th>
</tr>
<tr>
<th valign="middle" align="center">ResNet50</th>
<th valign="middle" align="center">Inception-v3</th>
<th valign="middle" align="center">GoogleNet</th>
<th valign="middle" align="center">EfficientNet-b0</th>
<th valign="middle" align="center">DenseNet-201</th>
<th valign="middle" align="center">Developed<break/>26-layer CNN</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">
<bold>Training Accuracy (%)</bold>
</td>
<td valign="middle" align="center">100</td>
<td valign="middle" align="center">100</td>
<td valign="middle" align="center">100</td>
<td valign="middle" align="center">100</td>
<td valign="middle" align="center">100</td>
<td valign="middle" align="center">100</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>Training Loss</bold>
</td>
<td valign="middle" align="center">1.9 &#xd7;10<sup>-04</sup>
</td>
<td valign="middle" align="center">4.3 &#xd7;10<sup>-04</sup>
</td>
<td valign="middle" align="center">3.6 &#xd7;10<sup>-04</sup>
</td>
<td valign="middle" align="center">2.8 &#xd7;10<sup>-03</sup>
</td>
<td valign="middle" align="center">1.4 &#xd7;10<sup>-04</sup>
</td>
<td valign="middle" align="center">1.8 &#xd7;10<sup>-04</sup>
</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>Validation Accuracy (%)</bold>
</td>
<td valign="middle" align="center">88.95</td>
<td valign="middle" align="center">84.84</td>
<td valign="middle" align="center">92.57</td>
<td valign="middle" align="center">90.32</td>
<td valign="middle" align="center">93.93</td>
<td valign="middle" align="center">97.45</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>Validation Loss</bold>
</td>
<td valign="middle" align="center">0.3938</td>
<td valign="middle" align="center">0.5598</td>
<td valign="middle" align="center">0.3584</td>
<td valign="middle" align="center">0.3030</td>
<td valign="middle" align="center">0.2152</td>
<td valign="middle" align="center">0.07675</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>Training Time</bold>
</td>
<td valign="middle" align="center">299 min<break/>40 s</td>
<td valign="middle" align="center">435 min<break/>47 s</td>
<td valign="middle" align="center">40 min<break/>30 s</td>
<td valign="middle" align="center">329 min<break/>45 s</td>
<td valign="middle" align="center">1062 min<break/>20 s</td>
<td valign="middle" align="center">8 min<break/>53 s</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>CNN, convolutional neural network.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Confusion matrix of various CNN models for Alzheimer&#x2019;s Dataset. <bold>(A)</bold> ResNet50, <bold>(B)</bold> Inception-v3, <bold>(C)</bold> GoogleNet, <bold>(D)</bold> EfficientNet-b0, <bold>(E)</bold> DenseNet-201, and <bold>(F)</bold> Developed 26-layer CNN. MID, mild dementia; MOD, moderate dementia; ND, non-dementia; VMD, very mild dementia; CNN, convolutional neural network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-g003.tif"/>
</fig>
<p>After thoroughly analyzing the results presented in <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref> and <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>, it was found that the developed 26-layer CNN model has the best classification rate, with minimal training time and a high true positive rate for each class compared to all other pre-trained models. The learning curves of the various pre-trained models with the developed multistage 26-layer CNN are presented in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Learning curves of various convolutional neural networks. <bold>(A, C)</bold> show the training accuracy and loss curves, and <bold>(B, D)</bold> depict the validation accuracy and loss curves.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-g004.tif"/>
</fig>
<p>After a comprehensive analysis of the results presented in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>, it was found that DenseNet-201 was 100% trained in fewer epochs than ResNet50, Inception-v3, GoogleNet, EfficientNet-b0, and 26-layer CNN; it took approximately 5 epochs to stabilize the results. DenseNet-201 also demonstrates the highest validation accuracy of 93.93% among all pre-trained models for dementia classification (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>). In contrast, GoogleNet took almost 32 epochs to train the model and also showed a higher validation accuracy (92.57%) than the remaining pre-trained models. The developed 26-layer CNN took almost 47 epochs to reach 100% training accuracy but had the best validation accuracy of 97.45% for dementia classification. Furthermore, the time consumed for the training of the developed 26-layer CNN was only 8 min 53 s for 100 epochs, which was the fastest among all methods. This validates the robustness and high classification performance of the developed CNN model compared to other pre-trained models.</p>
<p>To further enhance the dementia detection rate and subclassification performance, the proposed framework is divided into two stages. The performance of the proposed framework for both stages is presented in <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>. <xref ref-type="fig" rid="f5">
<bold>Figures&#xa0;5A, B</bold>
</xref> show the confusion matrix for dementia detection and sub-classification, respectively.</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>Performance of proposed CNN-based framework for dementia detection and subclassification.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Parameters</th>
<th valign="top" align="center">Developed 26-layer CNN for Binary Classification</th>
<th valign="top" align="center">Developed Transfer Learned 26-layer CNN for Subclassification</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">
<bold>Training Accuracy (%)</bold>
</td>
<td valign="top" align="center">100</td>
<td valign="top" align="center">100</td>
</tr>
<tr>
<td valign="top" align="center">
<bold>Training Loss</bold>
</td>
<td valign="top" align="center">2.2 &#xd7;10<sup>-04</sup>
</td>
<td valign="top" align="center">5.9 &#xd7;10<sup>-04</sup>
</td>
</tr>
<tr>
<td valign="top" align="center">
<bold>Validation Accuracy (%)</bold>
</td>
<td valign="top" align="center">98.24</td>
<td valign="top" align="center">99.70</td>
</tr>
<tr>
<td valign="top" align="center">
<bold>Validation Loss</bold>
</td>
<td valign="top" align="center">0.0553</td>
<td valign="top" align="center">0.0134</td>
</tr>
<tr>
<td valign="top" align="center">
<bold>Training Time</bold>
</td>
<td valign="top" align="center">6 min 42 s</td>
<td valign="top" align="center">3 min 9 s</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>CNN, convolutional neural network.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Confusion matrices using the proposed 2-stage framework. <bold>(A)</bold> Dementia detection and <bold>(B)</bold> dementia subclassification.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-g005.tif"/>
</fig>
<p>After carefully evaluating the result presented in <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>, it was found that the proposed 2-stage approach performs efficiently to differentiate between healthy and dementia persons with a high classification rate of 98.24% with only 6 min 42 s training time. The comprehensive performance of the model is presented in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref> using a confusion matrix. The proposed model only misclassified 9 samples of each class (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>), resulting in a high true positive rate of 98.2% for each class. After that, a new transfer-learned model was used for the subclassification of the dementia class and yielded a high accuracy of 99.7%, with only one sample of mild dementia misclassified, as shown in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>. The learning curves of the dementia detection and subclassification are shown in <xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6A, B</bold>
</xref>, respectively.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Training and loss curves. <bold>(A)</bold> for dementia detection and <bold>(B)</bold> for dementia subclassification. MID, mild dementia; MOD, moderate dementia; VMD, very mild dementia.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-g006.tif"/>
</fig>
<p>To further validate the performance of the proposed 2-stage approach against overfitting, the results of 10-fold cross-validation are presented in <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Confusion matrices using 10-fold cross-validation for the proposed 2-stage framework. <bold>(A)</bold> Dementia detection and <bold>(B)</bold> dementia subclassification. AD, Alzheimer&#x2019;s disease; CI, mild cognitive impairment.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-g007.tif"/>
</fig>
<p>Furthermore, other data were also used to validate the approach&#x2019;s reliability, adaptability, and accuracy. The results of dementia detection and subclassification are presented in <xref ref-type="fig" rid="f8">
<bold>Figures&#xa0;8A, B</bold>
</xref>, respectively.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Confusion matrices using the proposed 2-stage framework for another dataset. <bold>(A)</bold> Dementia detection and <bold>(B)</bold> dementia subclassification. AD, Alzheimer&#x2019;s disease; CI, mild cognitive impairment.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-15-1395563-g008.tif"/>
</fig>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>This study investigated the application of CNNs to identify AD and differentiate between the different stages of dementia by analyzing MRI. Recently, there has been an increase in the use of computer-aided systems for early AD detection, using both machine learning and CNNs. This study contributes to the development of an automated AD detection system for improving the operating efficiency of medical centers.</p>
<p>An ablation study was performed to select the number of layers of the developed CNN. The effect of changing the number of layers (from 22 to 34 layers) is reported in <xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref>. All models attained 100% training accuracy, showing that the deep network models match the training data closely. However, the 26-layer CNN yielded the lowest training loss. Furthermore, the 26-layer CNN model also gave higher validation accuracy and lower validation loss compared to the other models. This shows that the 26-layer model provides better generalization to the unseen validation data. The 26-layer CNN model was chosen because it appears to achieve an optimal balance between model complexity and generalization at this depth. Too few or too many layers may result in suboptimal performance on validation data.</p>
<table-wrap id="T5" position="float">
<label>Table&#xa0;5</label>
<caption>
<p>Results of ablation study for selection of layers.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" align="center">Parameters</th>
<th valign="middle" colspan="4" align="center">Developed CNNs</th>
</tr>
<tr>
<th valign="middle" align="center">22-Layer</th>
<th valign="middle" align="center">26-Layer</th>
<th valign="middle" align="center">30-Layer</th>
<th valign="middle" align="center">34-Layer</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Training Loss</td>
<td valign="middle" align="center">1.7 &#xd7;10<sup>-03</sup>
</td>
<td valign="middle" align="center">1.8 &#xd7;10<sup>-04</sup>
</td>
<td valign="top" align="center">3.5 &#xd7;10<sup>-04</sup>
</td>
<td valign="top" align="center">6.2 &#xd7;10<sup>-04</sup>
</td>
</tr>
<tr>
<td valign="middle" align="left">Training Accuracy (%)</td>
<td valign="middle" align="center">100</td>
<td valign="middle" align="center">100</td>
<td valign="top" align="center">100</td>
<td valign="top" align="center">100</td>
</tr>
<tr>
<td valign="middle" align="left">Validation Loss</td>
<td valign="middle" align="center">0.10741</td>
<td valign="middle" align="center">0.07675</td>
<td valign="top" align="center">0.10735</td>
<td valign="top" align="center">0.17687</td>
</tr>
<tr>
<td valign="middle" align="left">Validation Accuracy (%)</td>
<td valign="middle" align="center">96.87</td>
<td valign="middle" align="center">97.45</td>
<td valign="top" align="center">96.08</td>
<td valign="top" align="center">94.13</td>
</tr>
<tr>
<td valign="middle" align="left">Training Time</td>
<td valign="middle" align="center">7 min 19 s</td>
<td valign="middle" align="center">8 min 53 s</td>
<td valign="top" align="center">9 min 20 s</td>
<td valign="top" align="center">9 min 56 s</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>CNN, convolutional neural network.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The developed 26-layer CNN model achieved an impressive classification accuracy of 97.45% for directly categorizing MRI scans into four classes, demonstrating superior performance with minimal training time compared to several pre-trained CNNs (<xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>). DenseNet-201 yielded better results than the other pre-trained networks. In the validation, the proposed model correctly classified 998 of the 1023 images (see <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3F</bold>
</xref>). The TPR of all classes was higher than 95%, with a very low FDR. All pre-trained models converged faster during the training, indicating that transfer learning facilitates fast convergence in the learning of pre-trained models (see <xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4A, C</bold>
</xref>).</p>
<p>The proposed technique for advancing diagnostic capabilities comprises two key stages. First (i.e., stage 1), a 26-layer CNN model was developed to detect dementia using MRI slices. Next (i.e., stage 2), the weights of the developed model were reutilized to subclassify the dementia class. In the first stage, to detect only dementia, the results showed that the proposed model yielded a high accuracy of 98.24% for binary classification, with a TPR of more than 98% for both classes (see <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>). In the second stage, the developed CNN model was reused using the transfer learning concept for dementia subclassification. The results showed that only one sample out of 512 samples was misclassified, and the model produced a high classification rate of 99.7%, with a very high TPR and low FDR (see <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>). Furthermore, fast convergence was observed as a result of transfer learning (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6B</bold>
</xref>). These results support our hypothesis that the frozen weights of a model trained on correlated images benefit transfer learning and result in high classification performance. To further evaluate the robustness of the model against data leakage, 10-fold cross-validation was also performed. The proposed multistage framework achieved similarly high classification accuracy, further validating the effectiveness of the proposed approach (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>). Another ADNI MRI scan dataset was used to validate the efficacy of the proposed framework. On this dataset, the developed CNN achieved a 100% classification rate for dementia detection and subclassification (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8</bold>
</xref>). <xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref> compares the performance of the proposed multistage framework with that of recent studies.</p>
<table-wrap id="T6" position="float">
<label>Table&#xa0;6</label>
<caption>
<p>Comparison of the proposed multistage CNN-based framework with recent research.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" align="center">Study</th>
<th valign="middle" colspan="2" align="center">Accuracy (%)</th>
</tr>
<tr>
<th valign="middle" align="center">ADNI_Extracted<break/>_Axial dataset</th>
<th valign="middle" align="center">Alzheimer&#x2019;s Dataset</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Wang et&#xa0;al. (<xref ref-type="bibr" rid="B41">41</xref>)</td>
<td valign="middle" align="center">97.52</td>
<td valign="middle" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="middle" align="center">Mohammed et&#xa0;al. (<xref ref-type="bibr" rid="B42">42</xref>)</td>
<td valign="middle" align="center">&#x2013;</td>
<td valign="middle" align="center">94.8</td>
</tr>
<tr>
<td valign="middle" align="center">Acharya et&#xa0;al. (<xref ref-type="bibr" rid="B43">43</xref>)</td>
<td valign="middle" align="center">&#x2013;</td>
<td valign="middle" align="center">95.70</td>
</tr>
<tr>
<td valign="middle" align="center">El-Latif et&#xa0;al. (<xref ref-type="bibr" rid="B44">44</xref>)</td>
<td valign="middle" align="center">&#x2013;</td>
<td valign="middle" align="center">95.93</td>
</tr>
<tr>
<td valign="middle" align="center">Murugan et&#xa0;al. (<xref ref-type="bibr" rid="B29">29</xref>)</td>
<td valign="middle" align="center">&#x2013;</td>
<td valign="middle" align="center">95.23 (augmentation)</td>
</tr>
<tr>
<td valign="middle" align="center">Loddo et&#xa0;al. (<xref ref-type="bibr" rid="B45">45</xref>)</td>
<td valign="middle" align="center">99.22</td>
<td valign="middle" align="center">97.71</td>
</tr>
<tr>
<td valign="middle" align="center">Kaplan et&#xa0;al. (<xref ref-type="bibr" rid="B46">46</xref>)</td>
<td valign="middle" align="center">&#x2013;</td>
<td valign="middle" align="center">99.62 (10-fold) (healthy vs dementia)</td>
</tr>
<tr>
<td valign="middle" align="center">Ching et&#xa0;al. (<xref ref-type="bibr" rid="B47">47</xref>)</td>
<td valign="middle" align="center">98.93</td>
<td valign="middle" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="middle" align="center">Mohammad and Ahmadi (<xref ref-type="bibr" rid="B48">48</xref>)</td>
<td valign="middle" align="center">99</td>
<td valign="middle" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="middle" align="center">Hasan and Wagler (<xref ref-type="bibr" rid="B49">49</xref>)</td>
<td valign="middle" align="center">&#x2013;</td>
<td valign="middle" align="center">99.06</td>
</tr>
<tr>
<td valign="middle" align="center">Shukla et&#xa0;al. (<xref ref-type="bibr" rid="B50">50</xref>)</td>
<td valign="middle" align="center">&#x2013;</td>
<td valign="middle" align="center">99 (for dementia detection)<break/>94 (dementia subclassification)</td>
</tr>
<tr>
<td valign="middle" align="center">El-Latif et&#xa0;al. (<xref ref-type="bibr" rid="B44">44</xref>)</td>
<td valign="middle" align="center">&#x2013;</td>
<td valign="middle" align="center">99.2 (for dementia detection)<break/>95.93 (dementia subclassification)</td>
</tr>
<tr>
<td valign="middle" align="center">Proposed multistage<break/>CNN-based framework</td>
<td valign="middle" align="center">100</td>
<td valign="middle" align="center">98.24 (for dementia detection)<break/>99.70 (dementia subclassification)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>CNN, convolutional neural network.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>A detailed analysis of the results presented in <xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref> indicates that the proposed CNN-based framework achieves the highest classification rate among the compared approaches. These outcomes underscore the efficacy of the proposed model in efficiently and accurately handling the classification task, emphasizing its potential as a robust solution in AD detection and subclassification.</p>
<p>A single-modality dataset was used to evaluate the performance of the proposed network. In the future, multiple-modality datasets may be utilized to improve the classification performance for AD diagnosis. In addition, this study proposes a simple architecture; however, more intuitive architectures, such as transformers or the incorporation of attention networks, may be tested in the future. Confounding variables, which can influence both the independent variable (imaging data in this case) and the dependent variable (presence or absence of AD), should be considered when designing AD studies. These confounding variables can introduce spurious correlations, leading to reduced AD identification accuracy. The key clinical confounding variables to be considered include age, education, vascular health, genetic factors, and lifestyle. For instance, a CNN model trained on a dataset skewed toward older subjects might learn age-related features instead of AD-specific ones, resulting in misdiagnosis of younger AD patients and overdiagnosis in healthy older adults. Other important confounding factors related to imaging data in AD identification arise from data collection, preprocessing, model design, and the evaluation of model performance for variables unseen during training. Image quality can be affected and data inconsistencies introduced by differences in acquisition paradigms, spatial resolution, and magnetic field strength. Furthermore, inadequate preprocessing can result in artifacts, spatial distortions, and data inconsistencies, all of which can affect the accuracy and reliability of the study. Model architecture, hyperparameter tuning, and regularization techniques are also important in reducing confounding effects and maximizing model performance. Finally, the model must be evaluated using a rigorous validation process. 
For example, <italic>k</italic>-fold cross-validation can assist in reducing the impact of data variability and produce more reliable estimates of model performance. Evaluation criteria should also be carefully chosen to take into consideration confounding variables unique to AD identification tasks, such as class imbalance and susceptibility to false positives.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>AD is a common and devastating neurological condition that substantially reduces the quality of life of affected individuals. Its effects extend beyond patients to their families and society. Timely diagnosis is critical to adequately control AD and reduce its socioeconomic consequences. This paper proposes a multistage CNN-based AD detection and subclassification framework. A 26-layer CNN model was developed from scratch using MRI images to detect dementia. The model yielded a high accuracy of 98.24% in dementia detection using an online AD dataset. Subsequently, the developed CNN model was reutilized for the subclassification of dementia classes using transfer learning. This yielded a high accuracy rate of 99.70%, with only one misclassified sample. Moreover, another AD dataset was used to validate the model, and the results showed a classification accuracy of 100%. The proposed framework was also compared with various pre-trained models and the latest literature to demonstrate the effectiveness and superiority of the proposed model.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material. Further inquiries can be directed to the corresponding author/s.</p>
</sec>
<sec id="s7" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>Ethical approval was not required for the study involving humans in accordance with the local legislation and institutional requirements. Written informed consent to participate in this study was not required from the participants or the participants&#x2019; legal guardians/next of kin in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec id="s8" sec-type="author-contributions">
<title>Author contributions</title>
<p>MA: Conceptualization, Methodology, Software, Writing &#x2013; original draft. KK: Conceptualization, Methodology, Software, Writing &#x2013; review &amp; editing. MK: Conceptualization, Formal analysis, Writing &#x2013; review &amp; editing. MF: Formal analysis, Investigation, Writing &#x2013; review &amp; editing. AZ: Formal analysis, Investigation, Validation, Visualization, Writing &#x2013; review &amp; editing. SL: Funding acquisition, Project administration, Resources, Supervision, Writing &#x2013; review &amp; editing.</p>
</sec>
</body>
<back>
<sec id="s9" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This work was supported by a National Research Foundation (NRF) grant funded by the Ministry of Education (MOE), South Korea, through the "Development Research Program" NRF2021R1I1A2059735 (to SL). This work was also supported by a National Research Foundation of Korea (NRF) grant funded by the Korean government (MSIT) (2022R1C1C2003637) (to KK).</p>
</sec>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ulep</surname> <given-names>MG</given-names>
</name>
<name>
<surname>Saraon</surname> <given-names>SK</given-names>
</name>
<name>
<surname>McLea</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Alzheimer disease</article-title>. <source>J Nurse Practitioners</source>. (<year>2018</year>) <volume>14</volume>:<page-range>129&#x2013;35</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.nurpra.2017.10.014</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salvatore</surname> <given-names>C</given-names>
</name>
<name>
<surname>Cerasa</surname> <given-names>A</given-names>
</name>
<name>
<surname>Battista</surname> <given-names>P</given-names>
</name>
<name>
<surname>Gilardi</surname> <given-names>MC</given-names>
</name>
<name>
<surname>Quattrone</surname> <given-names>A</given-names>
</name>
<name>
<surname>Castiglioni</surname> <given-names>I</given-names>
</name>
</person-group>. <article-title>Magnetic resonance imaging biomarkers for the early diagnosis of alzheimer's disease: A machine learning approach</article-title>. <source>Front Neurosci</source>. (<year>2015</year>) <volume>9</volume>:<elocation-id>307</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fnins.2015.00307</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Patterson</surname> <given-names>C</given-names>
</name>
</person-group>. <source>World Alzheimer Report 2018</source>. (<year>2018</year>) (<publisher-loc>London, UK</publisher-loc>: <publisher-name>Alzheimer&#x2019;s Disease International (ADI)</publisher-name>).</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="confproc">
<person-group person-group-type="editor">
<name>
<surname>Liu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W</given-names>
</name>
<name>
<surname>Pujol</surname> <given-names>S</given-names>
</name>
<name>
<surname>Kikinis</surname> <given-names>R</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>D</given-names>
</name>
</person-group> eds. (<year>2014</year>). <article-title>Early diagnosis of alzheimer's disease with deep learning</article-title>, in: <conf-name>2014 IEEE 11th international symposium on biomedical imaging (ISBI)</conf-name>, <publisher-loc>Beijing, China</publisher-loc>: <publisher-name>IEEE</publisher-name>.</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sabbagh</surname> <given-names>MN</given-names>
</name>
<name>
<surname>Lue</surname> <given-names>L-F</given-names>
</name>
<name>
<surname>Fayard</surname> <given-names>D</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Increasing precision of clinical diagnosis of alzheimer's disease using a combined algorithm incorporating clinical and novel biomarker data</article-title>. <source>Neurol Ther</source>. (<year>2017</year>) <volume>6</volume>:<fpage>83</fpage>&#x2013;<lpage>95</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s40120-017-0069-5</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Noor</surname> <given-names>MBT</given-names>
</name>
<name>
<surname>Zenia</surname> <given-names>NZ</given-names>
</name>
<name>
<surname>Kaiser</surname> <given-names>MS</given-names>
</name>
<name>
<surname>Mamun</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Mahmud</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Application of deep learning in detecting neurological disorders from magnetic resonance images: A survey on the detection of alzheimer&#x2019;s disease, parkinson&#x2019;s disease and schizophrenia</article-title>. <source>Brain Inf</source>. (<year>2020</year>) <volume>7</volume>:<elocation-id>11</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s40708-020-00112-2</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baratti</surname> <given-names>C</given-names>
</name>
<name>
<surname>Barkhof</surname> <given-names>F</given-names>
</name>
<name>
<surname>Hoogenraad</surname> <given-names>F</given-names>
</name>
<name>
<surname>Valk</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Partially saturated fluid attenuated inversion recovery (Flair) sequences in multiple sclerosis: comparison with fully relaxed flair and conventional spin-echo</article-title>. <source>Magnetic Resonance Imaging</source>. (<year>1995</year>) <volume>13</volume>:<page-range>513&#x2013;21</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0730-725X(95)00009-6</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moser</surname> <given-names>E</given-names>
</name>
<name>
<surname>Stadlbauer</surname> <given-names>A</given-names>
</name>
<name>
<surname>Windischberger</surname> <given-names>C</given-names>
</name>
<name>
<surname>Quick</surname> <given-names>HH</given-names>
</name>
<name>
<surname>Ladd</surname> <given-names>ME</given-names>
</name>
</person-group>. <article-title>Magnetic resonance imaging methodology</article-title>. <source>Eur J Nucl Med Mol Imaging</source>. (<year>2009</year>) <volume>36</volume>:<fpage>30</fpage>&#x2013;<lpage>41</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00259-008-0938-3</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mateos-P&#xe9;rez</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Dadar</surname> <given-names>M</given-names>
</name>
<name>
<surname>Lacalle-Aurioles</surname> <given-names>M</given-names>
</name>
<name>
<surname>Iturria-Medina</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zeighami</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Evans</surname> <given-names>AC</given-names>
</name>
</person-group>. <article-title>Structural neuroimaging as clinical predictor: A review of machine learning applications</article-title>. <source>NeuroImage: Clin</source>. (<year>2018</year>) <volume>20</volume>:<page-range>506&#x2013;22</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.nicl.2018.08.019</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="confproc">
<person-group person-group-type="editor">
<name>
<surname>Rabeh</surname> <given-names>AB</given-names>
</name>
<name>
<surname>Benzarti</surname> <given-names>F</given-names>
</name>
<name>
<surname>Amiri</surname> <given-names>H</given-names>
</name>
</person-group> eds. (<year>2016</year>). <article-title>Diagnosis of alzheimer diseases in early step using svm (Support vector machine)</article-title>, in: <conf-name>2016 13th International Conference on Computer Graphics, Imaging and Visualization (CGiV)</conf-name>; <conf-date>29 March-1 April 2016</conf-date>. <conf-loc>Beni Mellal, Morocco</conf-loc>.</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tripoliti</surname> <given-names>EE</given-names>
</name>
<name>
<surname>Fotiadis</surname> <given-names>DI</given-names>
</name>
<name>
<surname>Argyropoulou</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>A supervised method to assist the diagnosis and monitor progression of alzheimer's disease using data from an fmri experiment</article-title>. <source>Artif Intell Med</source>. (<year>2011</year>) <volume>53</volume>:<fpage>35</fpage>&#x2013;<lpage>45</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.artmed.2011.05.005</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hinrichs</surname> <given-names>C</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>V</given-names>
</name>
<name>
<surname>Mukherjee</surname> <given-names>L</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>G</given-names>
</name>
<name>
<surname>Chung</surname> <given-names>MK</given-names>
</name>
<name>
<surname>Johnson</surname> <given-names>SC</given-names>
</name>
</person-group>. <article-title>Spatially augmented lpboosting for ad classification with evaluations on the adni dataset</article-title>. <source>NeuroImage</source>. (<year>2009</year>) <volume>48</volume>:<page-range>138&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.neuroimage.2009.05.056</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thayumanasamy</surname> <given-names>I</given-names>
</name>
<name>
<surname>Ramamurthy</surname> <given-names>K</given-names>
</name>
</person-group>. <article-title>Performance analysis of machine learning and deep learning models for classification of alzheimer's disease from brain mri</article-title>. <source>Traitement Du Signal</source>. (<year>2022</year>) <volume>39</volume>:<page-range>1961&#x2013;70</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.18280/ts.390608</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hinton</surname> <given-names>GE</given-names>
</name>
</person-group>. <article-title>Deep belief networks</article-title>. <source>Scholarpedia</source>. (<year>2009</year>) <volume>4</volume>:<fpage>5947</fpage>.</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vincent</surname> <given-names>P</given-names>
</name>
<name>
<surname>Larochelle</surname> <given-names>H</given-names>
</name>
<name>
<surname>Lajoie</surname> <given-names>I</given-names>
</name>
<name>
<surname>Bengio</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Manzagol</surname> <given-names>P-A</given-names>
</name>
<name>
<surname>Bottou</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Stacked denoising autoencoders: learning useful representations in a deep network with a local denoising criterion</article-title>. <source>J Mach Learn Res</source>. (<year>2010</year>) <volume>11</volume>:<fpage>3371</fpage>&#x2013;<lpage>408</lpage>.</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rawat</surname> <given-names>W</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z</given-names>
</name>
</person-group>. <article-title>Deep convolutional neural networks for image classification: A comprehensive review</article-title>. <source>Neural Comput</source>. (<year>2017</year>) <volume>29</volume>:<page-range>2352&#x2013;449</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1162/neco_a_00990</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Illakiya</surname> <given-names>T</given-names>
</name>
<name>
<surname>Karthik</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>Automatic detection of alzheimer's disease using deep learning models and neuro-imaging: current trends and future perspectives</article-title>. <source>Neuroinformatics</source>. (<year>2023</year>) <volume>21</volume>:<page-range>339&#x2013;64</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12021-023-09625-7</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khamparia</surname> <given-names>A</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>KM</given-names>
</name>
</person-group>. <article-title>A systematic review on deep learning architectures and applications</article-title>. <source>Expert Syst</source>. (<year>2019</year>) <volume>36</volume>:<fpage>e12400</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/exsy.12400</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ali</surname> <given-names>MU</given-names>
</name>
<name>
<surname>Kallu</surname> <given-names>KD</given-names>
</name>
<name>
<surname>Masood</surname> <given-names>H</given-names>
</name>
<name>
<surname>Tahir</surname> <given-names>U</given-names>
</name>
<name>
<surname>Gopi</surname> <given-names>CVVM</given-names>
</name>
<name>
<surname>Zafar</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>A cnn-based chest infection diagnostic model: A multistage multiclass isolated and developed transfer learning framework</article-title>. <source>Int J Intelligent Syst</source>. (<year>2023</year>) <volume>2023</volume>:<elocation-id>6850772</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2023/6850772</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alanazi</surname> <given-names>MF</given-names>
</name>
<name>
<surname>Ali</surname> <given-names>MU</given-names>
</name>
<name>
<surname>Hussain</surname> <given-names>SJ</given-names>
</name>
<name>
<surname>Zafar</surname> <given-names>A</given-names>
</name>
<name>
<surname>Mohatram</surname> <given-names>M</given-names>
</name>
<name>
<surname>Irfan</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Brain tumor/mass classification framework using magnetic-resonance-imaging-based isolated and developed transfer deep-learning model</article-title>. <source>Sensors</source>. (<year>2022</year>) <volume>22</volume>:<fpage>372</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/s22010372</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Almalki</surname> <given-names>YE</given-names>
</name>
<name>
<surname>Ali</surname> <given-names>MU</given-names>
</name>
<name>
<surname>Kallu</surname> <given-names>KD</given-names>
</name>
<name>
<surname>Masud</surname> <given-names>M</given-names>
</name>
<name>
<surname>Zafar</surname> <given-names>A</given-names>
</name>
<name>
<surname>Alduraibi</surname> <given-names>SK</given-names>
</name>
<etal/>
</person-group>. <article-title>Isolated convolutional-neural-network-based deep-feature extraction for brain tumor classification using shallow classifier</article-title>. <source>Diagnostics</source>. (<year>2022</year>) <volume>12</volume>:<fpage>1793</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/diagnostics12081793</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname> <given-names>W</given-names>
</name>
<name>
<surname>Tong</surname> <given-names>T</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>D</given-names>
</name>
<name>
<surname>Du</surname> <given-names>X</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Convolutional neural networks-based mri image analysis for the alzheimer&#x2019;s disease prediction from mild cognitive impairment</article-title>. <source>Front Neurosci</source>. (<year>2018</year>) <volume>12</volume>:<elocation-id>777</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fnins.2018.00777</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Thibeau-Sutre</surname> <given-names>E</given-names>
</name>
<name>
<surname>Diaz-Melo</surname> <given-names>M</given-names>
</name>
<name>
<surname>Samper-Gonz&#xe1;lez</surname> <given-names>J</given-names>
</name>
<name>
<surname>Routier</surname> <given-names>A</given-names>
</name>
<name>
<surname>Bottani</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Convolutional neural networks for classification of alzheimer's disease: overview and reproducible evaluation</article-title>. <source>Med Image Anal</source>. (<year>2020</year>) <volume>63</volume>:<fpage>101694</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.media.2020.101694</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname> <given-names>D</given-names>
</name>
<name>
<surname>Popuri</surname> <given-names>K</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>GW</given-names>
</name>
<name>
<surname>Balachandar</surname> <given-names>R</given-names>
</name>
<name>
<surname>Beg</surname> <given-names>MF</given-names>
</name>
<name>
<surname>Weiner</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Multimodal and multiscale deep neural networks for the early diagnosis of alzheimer&#x2019;s disease using structural mr and fdg-pet images</article-title>. <source>Sci Rep</source>. (<year>2018</year>) <volume>8</volume>:<fpage>5697</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-018-22871-z</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahmed</surname> <given-names>S</given-names>
</name>
<name>
<surname>Choi</surname> <given-names>KY</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>BC</given-names>
</name>
<name>
<surname>Kwon</surname> <given-names>GR</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>KH</given-names>
</name>
<etal/>
</person-group>. <article-title>Ensembles of patch-based classifiers for diagnosis of alzheimer diseases</article-title>. <source>IEEE Access</source>. (<year>2019</year>) <volume>7</volume>:<page-range>73373&#x2013;83</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/ACCESS.2019.2920011</pub-id>
</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nawaz</surname> <given-names>H</given-names>
</name>
<name>
<surname>Maqsood</surname> <given-names>M</given-names>
</name>
<name>
<surname>Afzal</surname> <given-names>S</given-names>
</name>
<name>
<surname>Aadil</surname> <given-names>F</given-names>
</name>
<name>
<surname>Mehmood</surname> <given-names>I</given-names>
</name>
<name>
<surname>Rho</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>A deep feature-based real-time system for alzheimer disease stage detection</article-title>. <source>Multimedia Tools Appl</source>. (<year>2021</year>) <volume>80</volume>:<page-range>35789&#x2013;807</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11042-020-09087-y</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jain</surname> <given-names>R</given-names>
</name>
<name>
<surname>Jain</surname> <given-names>N</given-names>
</name>
<name>
<surname>Aggarwal</surname> <given-names>A</given-names>
</name>
<name>
<surname>Hemanth</surname> <given-names>DJ</given-names>
</name>
</person-group>. <article-title>Convolutional neural network based alzheimer&#x2019;s disease classification from magnetic resonance brain images</article-title>. <source>Cogn Syst Res</source>. (<year>2019</year>) <volume>57</volume>:<page-range>147&#x2013;59</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cogsys.2018.12.015</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pan</surname> <given-names>D</given-names>
</name>
<name>
<surname>Zeng</surname> <given-names>A</given-names>
</name>
<name>
<surname>Jia</surname> <given-names>L</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Frizzell</surname> <given-names>T</given-names>
</name>
<name>
<surname>Song</surname> <given-names>X</given-names>
</name>
</person-group>. <article-title>Early detection of alzheimer&#x2019;s disease using magnetic resonance imaging: A novel approach combining convolutional neural networks and ensemble learning</article-title>. <source>Front Neurosci</source>. (<year>2020</year>) <volume>14</volume>:<elocation-id>259</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fnins.2020.00259</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Murugan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Venkatesan</surname> <given-names>C</given-names>
</name>
<name>
<surname>Sumithra</surname> <given-names>MG</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>XZ</given-names>
</name>
<name>
<surname>Elakkiya</surname> <given-names>B</given-names>
</name>
<name>
<surname>Akila</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Demnet: A deep learning model for early diagnosis of alzheimer diseases and dementia from mr images</article-title>. <source>IEEE Access</source>. (<year>2021</year>) <volume>9</volume>:<page-range>90319&#x2013;29</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/ACCESS.2021.3090474</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fathi</surname> <given-names>S</given-names>
</name>
<name>
<surname>Ahmadi</surname> <given-names>A</given-names>
</name>
<name>
<surname>Dehnad</surname> <given-names>A</given-names>
</name>
<name>
<surname>Almasi-Dooghaee</surname> <given-names>M</given-names>
</name>
<name>
<surname>Sadegh</surname> <given-names>M</given-names>
</name>
<collab>Alzheimer&#x2019;s Disease Neuroimaging Initiative</collab>
</person-group>. <article-title>A deep learning-based ensemble method for early diagnosis of alzheimer&#x2019;s disease using mri images</article-title>. <source>Neuroinformatics</source>. (<year>2024</year>) <volume>22</volume>:<fpage>89</fpage>&#x2013;<lpage>105</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12021-023-09646-2</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>L</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>S</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Three-round learning strategy based on 3d deep convolutional gans for alzheimer&#x2019;s disease staging</article-title>. <source>Sci Rep</source>. (<year>2023</year>) <volume>13</volume>:<fpage>5750</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-023-33055-9</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Illakiya</surname> <given-names>T</given-names>
</name>
<name>
<surname>Ramamurthy</surname> <given-names>K</given-names>
</name>
<name>
<surname>Siddharth</surname> <given-names>MV</given-names>
</name>
<name>
<surname>Mishra</surname> <given-names>R</given-names>
</name>
<name>
<surname>Udainiya</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Ahanet: adaptive hybrid attention network for alzheimer&#x2019;s disease classification using brain magnetic resonance imaging</article-title>. <source>Bioengineering</source>. (<year>2023</year>) <volume>10</volume>:<fpage>714</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/bioengineering10060714</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Illakiya</surname> <given-names>T</given-names>
</name>
<name>
<surname>Karthik</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>A deep feature fusion network with global context and cross-dimensional dependencies for classification of mild cognitive impairment from brain mri</article-title>. <source>Image Vision Computing</source>. (<year>2024</year>) <volume>144</volume>:<elocation-id>104967</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.imavis.2024.104967</pub-id>
</citation>
</ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>He</surname> <given-names>X</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Ong</surname> <given-names>CZL</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Teng</surname> <given-names>Q</given-names>
</name>
</person-group>. <article-title>An end-to-end multimodal 3d cnn framework with multi-level features for the prediction of mild cognitive impairment</article-title>. <source>Knowledge-Based Syst</source>. (<year>2023</year>) <volume>281</volume>:<elocation-id>111064</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.knosys.2023.111064</pub-id>
</citation>
</ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Hou</surname> <given-names>W</given-names>
</name>
</person-group>. <article-title>Conv-swinformer: integration of cnn and shift window attention for alzheimer&#x2019;s disease classification</article-title>. <source>Comput Biol Med</source>. (<year>2023</year>) <volume>164</volume>:<elocation-id>107304</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.107304</pub-id>
</citation>
</ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Illakiya</surname> <given-names>T</given-names>
</name>
<name>
<surname>Karthik</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>A dimension centric proximate attention network and swin transformer for age-based classification of mild cognitive impairment from brain mri</article-title>. <source>IEEE Access</source>. (<year>2023</year>) <volume>11</volume>:<page-range>128018&#x2013;31</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/ACCESS.2023.3332122</pub-id>
</citation>
</ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Helaly</surname> <given-names>HA</given-names>
</name>
<name>
<surname>Badawy</surname> <given-names>M</given-names>
</name>
<name>
<surname>Haikal</surname> <given-names>AY</given-names>
</name>
</person-group>. <article-title>Deep learning approach for early detection of alzheimer&#x2019;s disease</article-title>. <source>Cogn Comput</source>. (<year>2022</year>) <volume>14</volume>:<page-range>1711&#x2013;27</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12559-021-09946-2</pub-id>
</citation>
</ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ioffe</surname> <given-names>S</given-names>
</name>
<name>
<surname>Szegedy</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Batch normalization: accelerating deep network training by reducing internal covariate shift</article-title>. <source>Int Conf Mach Learn</source>. (<year>2015</year>) <volume>37</volume>:<fpage>448</fpage>&#x2013;<lpage>56</lpage>.</citation>
</ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fatima</surname> <given-names>M</given-names>
</name>
<name>
<surname>Khan</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Shaheen</surname> <given-names>S</given-names>
</name>
<name>
<surname>Almujally</surname> <given-names>NA</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S-H</given-names>
</name>
</person-group>. <article-title>B2c3netf2: breast cancer classification using an end-to-end deep learning feature fusion and satin bowerbird optimization controlled newton raphson feature selection</article-title>. <source>CAAI Trans Intell Technol</source>. (<year>2023</year>) <volume>8</volume>(<issue>4</issue>):<fpage>1374</fpage>&#x2013;<lpage>90</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1049/cit2.12219</pub-id>
</citation>
</ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zahoor</surname> <given-names>S</given-names>
</name>
<name>
<surname>Shoaib</surname> <given-names>U</given-names>
</name>
<name>
<surname>Lali</surname> <given-names>IU</given-names>
</name>
</person-group>. <article-title>Breast cancer mammograms classification using deep neural network and entropy-controlled whale optimization algorithm</article-title>. <source>Diagnostics</source>. (<year>2022</year>) <volume>12</volume>:<fpage>557</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/diagnostics12020557</pub-id>
</citation>
</ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Xiao</surname> <given-names>T</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>L</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>Ensemble of 3d densely connected convolutional network for diagnosis of mild cognitive impairment and alzheimer&#x2019;s disease</article-title>. <source>Neurocomputing</source>. (<year>2019</year>) <volume>333</volume>:<page-range>145&#x2013;56</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.neucom.2018.12.018</pub-id>
</citation>
</ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mohammed</surname> <given-names>BA</given-names>
</name>
<name>
<surname>Senan</surname> <given-names>EM</given-names>
</name>
<name>
<surname>Rassem</surname> <given-names>TH</given-names>
</name>
<name>
<surname>Makbol</surname> <given-names>NM</given-names>
</name>
<name>
<surname>Alanazi</surname> <given-names>AA</given-names>
</name>
<name>
<surname>Al-Mekhlafi</surname> <given-names>ZG</given-names>
</name>
<etal/>
</person-group>. <article-title>Multi-method analysis of medical records and mri images for early diagnosis of dementia and alzheimer&#x2019;s disease based on deep learning and hybrid methods</article-title>. <source>Electronics</source>. (<year>2021</year>) <volume>10</volume>:<fpage>2860</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/electronics10222860</pub-id>
</citation>
</ref>
<ref id="B43">
<label>43</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Acharya</surname> <given-names>H</given-names>
</name>
<name>
<surname>Mehta</surname> <given-names>R</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>DK</given-names>
</name>
</person-group>. (<year>2021</year>). <article-title>Alzheimer disease classification using transfer learning</article-title>, in: <conf-name>2021 5th International Conference on Computing Methodologies and Communication (ICCMC)</conf-name>; <conf-date>8-10 April 2021</conf-date>. <publisher-loc>Erode, India</publisher-loc>.</citation>
</ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>El-Latif</surname> <given-names>AAA</given-names>
</name>
<name>
<surname>Chelloug</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Alabdulhafith</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hammad</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Accurate detection of alzheimer&#x2019;s disease using lightweight deep learning model on mri data</article-title>. <source>Diagnostics</source>. (<year>2023</year>) <volume>13</volume>:<elocation-id>1216</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/diagnostics13071216</pub-id>
</citation>
</ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Loddo</surname> <given-names>A</given-names>
</name>
<name>
<surname>Buttau</surname> <given-names>S</given-names>
</name>
<name>
<surname>Di Ruberto</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Deep learning based pipelines for alzheimer&#x2019;s disease diagnosis: A comparative study and a novel deep-ensemble method</article-title>. <source>Comput Biol Med</source>. (<year>2022</year>) <volume>141</volume>:<elocation-id>105032</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compbiomed.2021.105032</pub-id>
</citation>
</ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kaplan</surname> <given-names>E</given-names>
</name>
<name>
<surname>Dogan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Tuncer</surname> <given-names>T</given-names>
</name>
<name>
<surname>Baygin</surname> <given-names>M</given-names>
</name>
<name>
<surname>Altunisik</surname> <given-names>E</given-names>
</name>
</person-group>. <article-title>Feed-forward lpqnet based automatic alzheimer&#x2019;s disease detection model</article-title>. <source>Comput Biol Med</source>. (<year>2021</year>) <volume>137</volume>:<elocation-id>104828</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compbiomed.2021.104828</pub-id>
</citation>
</ref>
<ref id="B47">
<label>47</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ching</surname> <given-names>WP</given-names>
</name>
<name>
<surname>Abdullah</surname> <given-names>SS</given-names>
</name>
<name>
<surname>Shapiai</surname> <given-names>MI</given-names>
</name>
<name>
<surname>Islam</surname> <given-names>AM</given-names>
</name>
</person-group>. <article-title>Transfer learning for alzheimer&#x2019;s disease diagnosis using efficientnet-B0 convolutional neural network</article-title>. <source>J Adv Res Appl Sci Eng Technol</source>. (<year>2024</year>) <volume>34</volume>:<page-range>181&#x2013;91</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.37934/araset.34.3.181191</pub-id>
</citation>
</ref>
<ref id="B48">
<label>48</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mohammad</surname> <given-names>F</given-names>
</name>
<name>
<surname>Al Ahmadi</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Alzheimer&#x2019;s disease prediction using deep feature extraction and optimization</article-title>. <source>Mathematics</source>. (<year>2023</year>) <volume>11</volume>:<fpage>3712</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/math11173712</pub-id>
</citation>
</ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hasan</surname> <given-names>ME</given-names>
</name>
<name>
<surname>Wagler</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>New convolutional neural network and graph convolutional network-based architecture for AI applications in alzheimer&#x2019;s disease and dementia-stage classification</article-title>. <source>AI</source>. (<year>2024</year>) <volume>5</volume>:<page-range>342&#x2013;63</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ai5010017</pub-id>
</citation>
</ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shukla</surname> <given-names>A</given-names>
</name>
<name>
<surname>Tiwari</surname> <given-names>R</given-names>
</name>
<name>
<surname>Tiwari</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Alz-convnets for classification of alzheimer disease using transfer learning approach</article-title>. <source>SN Comput Sci</source>. (<year>2023</year>) <volume>4</volume>:<fpage>404</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s42979-023-01853-7</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>