<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Aging Neurosci.</journal-id>
<journal-title>Frontiers in Aging Neuroscience</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Aging Neurosci.</abbrev-journal-title>
<issn pub-type="epub">1663-4365</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fnagi.2025.1510192</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Neuroscience</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Identification of Parkinson&#x2019;s disease using MRI and genetic data from the PPMI cohort: an improved machine learning fusion approach</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Yang</surname> <given-names>Yifeng</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2555084/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Hu</surname> <given-names>Liangyun</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Chen</surname> <given-names>Yang</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Gu</surname> <given-names>Weidong</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Lin</surname> <given-names>Guangwu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/367141/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Xie</surname> <given-names>YuanZhong</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Nie</surname> <given-names>Shengdong</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c003"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1855318/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Medical Imaging, Huadong Hospital, Fudan University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Center for Functional Neurosurgery, RuiJin Hospital, Shanghai Jiao Tong University School of Medicine</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>School of Health Science and Engineering, University of Shanghai for Science and Technology</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Anesthesiology, Huadong Hospital, Fudan University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>Medical Imaging Center, Taian Central Hospital</institution>, <addr-line>Shandong</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Shi-Nan Wu, Eye Center, Xiamen University, China</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Anupa A. Vijayakumari, Cleveland Clinic, United States</p><p>Qinghe Zhang, University of South China, China</p></fn>
<corresp id="c001">&#x002A;Correspondence: Guangwu Lin, <email>lingw01000@163.com</email></corresp>
<corresp id="c002">YuanZhong Xie, <email>xie01088@126.com</email></corresp>
<corresp id="c003">Shengdong Nie, <email>nsd4647@163.com</email></corresp>
<fn fn-type="equal" id="fn002"><p><sup>&#x2020;</sup>These authors share first authorship</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>04</day>
<month>02</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>17</volume>
<elocation-id>1510192</elocation-id>
<history>
<date date-type="received">
<day>12</day>
<month>10</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>01</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Yang, Hu, Chen, Gu, Lin, Xie and Nie.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Yang, Hu, Chen, Gu, Lin, Xie and Nie</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec>
<title>Objective</title>
<p>This study aim to leverage advanced machine learning techniques to develop and validate novel MRI imaging features and single nucleotide polymorphism (SNP) gene data fusion methodologies to enhance the early identification and diagnosis of Parkinson&#x2019;s disease (PD).</p>
</sec>
<sec>
<title>Methods</title>
<p>We leveraged a comprehensive dataset from the Parkinson&#x2019;s Progression Markers Initiative (PPMI), which includes high-resolution neuroimaging data, genetic single-nucleotide polymorphism (SNP) profiles, and detailed clinical information from individuals with early-stage PD and healthy controls. Two multi-modal fusion strategies were used: feature-level fusion, where we employed a hybrid feature selection algorithm combining Fisher discriminant analysis, an ensemble Lasso (EnLasso) method, and partial least squares (PLS) regression to identify and integrate the most informative features from neuroimaging and genetic data; and decision-level fusion, where we developed an adaptive ensemble stacking (AE_Stacking) model to synergistically integrate the predictions from multiple base classifiers trained on individual modalities.</p>
</sec>
<sec>
<title>Results</title>
<p>The AE_Stacking model achieving the highest average balanced accuracy of 95.36% and an area under the receiver operating characteristic curve (AUC) of 0.974, significantly outperforming feature-level fusion and single-modal models (<italic>p</italic> &#x003C; 0.05). Furthermore, by analyzing the features selected across multiple iterations of our models, we identified stable brain region features [lh 6r (FD) and rh 46 (GI)] and key genetic markers (rs356181 and rs2736990 SNPs within the SNCA gene region; rs213202 SNP within the VPS52 gene region), highlighting their potential as reliable early diagnostic indicators for the disease.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>The AE_Stacking model, trained on MRI and genetic data, demonstrates potential in distinguishing individuals with PD. Our findings enhance understanding of the disease and advance us toward the goal of precision medicine for neurodegenerative disorder.</p>
</sec>
</abstract>
<kwd-group>
<kwd>Parkinson&#x2019;s disease</kwd>
<kwd>imaging genomics</kwd>
<kwd>stable feature selection</kwd>
<kwd>multi-modal fusion</kwd>
<kwd>machine learning</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="5"/>
<equation-count count="8"/>
<ref-count count="55"/>
<page-count count="16"/>
<word-count count="9839"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Parkinson&#x2019;s Disease and Aging-related Movement Disorders</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="S1" sec-type="intro">
<title>1 Introduction</title>
<p>Parkinson&#x2019;s disease (PD) is marked by the degeneration of dopamine-producing neurons in the substantia nigra, and the accumulation of alpha-synuclein protein in the midbrain. While PD is predominantly sporadic, genetic factors are increasingly recognized in its development. Numerous studies highlight the importance of genetics, identifying genes such as SNCA, LRRK2, PINK1, and GBA, which are linked to both dominant and recessive forms of inherited PD (<xref ref-type="bibr" rid="B6">Blauwendraat et al., 2020</xref>; <xref ref-type="bibr" rid="B12">Fernandez-Santiago and Sharma, 2022</xref>; <xref ref-type="bibr" rid="B41">Tranchant, 2019</xref>). These genes play crucial roles in maintaining cellular health, and disruptions can lead to neurodegeneration, affecting symptoms, onset age, and disease progression (<xref ref-type="bibr" rid="B1">Alfradique-Dunham et al., 2021</xref>; <xref ref-type="bibr" rid="B8">Chu et al., 2009</xref>; <xref ref-type="bibr" rid="B9">Davis et al., 2016</xref>; <xref ref-type="bibr" rid="B17">Iwaki et al., 2019</xref>). Thus, monitoring gene expression changes is vital for early diagnosis and prediction of PD.</p>
<p>The fusion of genetic and imaging data has emerged as a promising approach to understanding the interplay between genetic predispositions and brain structure in PD. Recent studies have highlighted that combining genetic and neuroimaging markers can significantly enhance predictive and diagnostic accuracy for PD (<xref ref-type="bibr" rid="B19">Kim et al., 2017</xref>; <xref ref-type="bibr" rid="B43">van Nuenen et al., 2009</xref>; <xref ref-type="bibr" rid="B50">Won et al., 2019</xref>; <xref ref-type="bibr" rid="B49">Won et al., 2020</xref>). For example, Kim et al. utilized a linear regression model incorporating single nucleotide polymorphism (SNP) genetic features and structural connectivity data to predict clinical scores on the Movement Disorder Society-Unified Parkinson&#x2019;s Disease Rating Scale (MDS-UPDRS). Their model demonstrated superior predictive performance, with a correlation coefficient (between model prediction outcomes and actual MDS-UPDRS score) of 0.788 (<xref ref-type="bibr" rid="B19">Kim et al., 2017</xref>). Won et al. employed the Lasso algorithm to select key features from structural connectivity and SNP genetic data, constructing a linear regression model to predict Geriatric Depression Scale (GDS) scores. This model exhibited a meaningful correlation (<italic>r</italic> = 0.749) between predicted and actual GDS scores (<xref ref-type="bibr" rid="B50">Won et al., 2019</xref>). Building on these findings, the same team applied sparse typical correlation analysis to integrate imaging genetic features, achieving a correlation of <italic>r</italic> = 0.5486 between predicted and actual ages at PD onset (<xref ref-type="bibr" rid="B49">Won et al., 2020</xref>). These studied underscores the feasibility of predicting disease onset by fusing multi-modal data.</p>
<p>For individual PD diagnosis, Xia et al. developed a clustered evolutionary random neural network model to analyze fused functional magnetic resonance imaging (fMRI) and SNP data. This model achieved an impressive accuracy of 88.57% in identifying PD patients and uncovered additional PD-related genes and brain regions (<xref ref-type="bibr" rid="B4">Bi et al., 2021a</xref>). Lei et al. proposed a joint learning framework based on MRI features using a multi-branch octave convolutional neural network (FMOCNN) to diagnose PD in gene-related cohorts. The accuracy of this method in identifying individuals with genetic cohort PD (GenPD) and genetic mutation but not PD cohort (GenUn) was 84.91% (<xref ref-type="bibr" rid="B21">Lei et al., 2022</xref>). The fusion of multimodal information from images and genes leverages complementary data, providing a more comprehensive characterization of the pathological mechanisms of PD. This integrated approach offers a new perspective for the diagnosis and prediction of PD.</p>
<p>Machine learning (ML) techniques offer a robust method for processing large and complex genome-wide SNP datasets (<xref ref-type="bibr" rid="B25">Makarious et al., 2022</xref>; <xref ref-type="bibr" rid="B39">Szymczak et al., 2009</xref>). However, analyzing genomic data poses significant challenges due to its high-dimensional nature, where the number of features usually far exceeds the number of samples. This high-dimensionality engenders a plethora of redundant information, which would lead to multicollinearity among the high-dimensional genetic variables, complicating model training. This complexity can lead to multicollinearity among key variables, complicating model training. Limited sample sizes further increase the risk of overfitting, even with regularization methods (<xref ref-type="bibr" rid="B30">Pudjihartono et al., 2022</xref>). Overcoming the challenges of &#x201C;curse of dimensionality&#x201D; is essential for developing accurate predictive models from genomic data.</p>
<p>Our aim is to improve early PD identification by leveraging features from high-dimensional imaging and genetic data. This involves addressing differences between genetic and imaging data to enable advanced multimodal integration. Firstly, we preprocess MRI and SNP gene data separately and extract relevant features. We then developed two multimodal data fusion methods, feature-level and decision-level fusion, to fuse them. For feature-level fusion, we employ a combined feature selection method called Fisher-EnLasso-PLS, which enables collaborative analysis of multimodal data, effectively reducing data complexity while more accurately capturing key features associated with the disease. For decision-level fusion, we develop an AE_Stacking model to enhance the integration of image and genetic features. This approach maintains the multidimensional and complex nature of diseases. By integrating multiple data sources and models, it could enhance prediction accuracy and robustness, minimizing potential error from relying on a single data source or single model.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>2 Materials and methods</title>
<sec id="S2.SS1">
<title>2.1 Participants</title>
<p>The data in this study accessed from the Parkinson&#x2019;s Progression Markers Initiative (PPMI) database,<sup><xref ref-type="fn" rid="footnote1">1</xref></sup> a multicenter database that includes neuroimaging, gene data such as single-nucleotide polymorphisms (SNP) and relevant clinical information of various PD individuals and matched healthy controls. Inclusion criteria for individuals of the early PD cohort were baseline participants diagnosed with PD for two years or less, whose DAT scans indicated a dopaminergic deficit, and who had not commenced any medication. For the health controls (HC), they had never been diagnosed with any major neurological disorder and had no first-degree relatives with idiopathic PD.</p>
<sec id="S2.SS1.SSS1">
<title>2.1.1 Clinical neuropsychological assessments</title>
<p>Patients with PD were assessed using the Unified Parkinson&#x2019;s Disease Rating Scale (UPDRS) part III examination scale (range 0&#x2013;108), and Hoehn &#x0026; Yahr scale (H&#x0026;Y) stage I &#x0026; II. For each subject, several available clinical neuropsychological evaluation scales were also used: the University of Pennsylvania Smell Identification Test (UPSIT), Geriatric Depression Scale (GDS), Montreal Cognitive Assessment (MOCA), and Scales for Outcomes in Parkinson&#x2019;s Disease&#x2014;Autonomic Dysfunction (SCOPA-AUT).</p>
</sec>
<sec id="S2.SS1.SSS2">
<title>2.1.2 SNP data acquisition</title>
<p>Subjects&#x2019; genotyping SNP information was collected on the NeuroX genotyping chip (<xref ref-type="bibr" rid="B14">Ghani et al., 2015</xref>; <xref ref-type="bibr" rid="B28">Nalls et al., 2015</xref>). The NeuroX array is an Illumina Infinium iSelect HD Custom Genotyping array containing 267,607 Illumina standard contains exonic variants and an additional 24,706 custom variants designed for neurological disease studies. The content of the NeuroX is available on the PPMI site.<sup><xref ref-type="fn" rid="footnote2">2</xref></sup></p>
</sec>
<sec id="S2.SS1.SSS3">
<title>2.1.3 MRI acquisition</title>
<p>For data consistency, only 3T MRI scanner (SIEMENS MAGNETOM Trio scanner) with high-resolution MPRAGE T1 sequence was chosen with the following parameters: repetition time (TR) = 2300.0 ms, echo time (TE) = 3.0 ms, Inversion time (TI) = 900.0 ms, flip angle = 9.0 degree, and slicing thickness = 1.0 mm. Participants with missing images or incomplete scans were excluded from the study. A total of 209 subjects (135 PD patients and 74 HC) were final downloaded.</p>
</sec>
</sec>
<sec id="S2.SS2">
<title>2.2 Data preprocessing</title>
<sec id="S2.SS2.SSS1">
<title>2.2.1 SNP data selection, cleaning, and quality control</title>
<p>In this paper, genotyping data were collected from the PPMI dataset for a total of 619 subjects, each containing 267,607 SNP loci. Quality control of SNP data was performed using Plink v1.09 software and referring to the ENIGMA protocol (<xref ref-type="bibr" rid="B31">Purcell et al., 2007</xref>; <xref ref-type="bibr" rid="B40">Thompson et al., 2022</xref>). The quality control of SNP data included sample quality control and SNP locus quality control, as follows:</p>
<p>Sample quality control: (1) sample detection rate detection; (2) sex check; (3) sibling pair identification; (4) population stratification;</p>
<p>Quality control: (1) minor allele frequency (MAF) &#x003C; 1%; (2) genotype call rate &#x003C; 95%; (3) Hardy-Weinberg equilibrium (HWE) test <italic>p</italic> &#x003C; 10-6.</p>
<p>SNP loci that did not meet the criteria were excluded. After rigorous quality control, a total of 532 subjects (367 PD patients and 165 HC) were retained, each of which contained 48,414 high-quality SNP locus information for use in subsequent experiments.</p>
</sec>
<sec id="S2.SS2.SSS2">
<title>2.2.2 MRI data processing and feature extraction</title>
<p>A computational anatomy toolbox (CAT 12.7-r1727)<sup><xref ref-type="fn" rid="footnote3">3</xref></sup> based on statistical parametric mapping software (SPM 12)<sup><xref ref-type="fn" rid="footnote4">4</xref></sup> was used to preprocess the data, including voxel-based morphometry (VBM) and surface-based morphometry (SBM) analysis (<xref ref-type="supplementary-material" rid="TS1">Supplementary Figure S1</xref>). As a supplement to the VBM, the SBM allows the calculation of multiple GM tissue features at varying scales (<xref ref-type="bibr" rid="B11">Farokhian et al., 2017</xref>; <xref ref-type="bibr" rid="B35">Seiger et al., 2018</xref>). The standardized structural processing pipeline includes head motion correction, MR field inhomogeneity correction, brain extraction, automated segmentation of GM, WM, and cerebrospinal fluid (CSF) (WMH corrected), topological defect correction, cortical surface reconstruction, and tessellation of the boundary between the WM and cortical GM. Cortical morphological parameters including cortical thickness (CT), surface area (SA), fractal dimension (FD) and gyrification index (GI) were calculated to quantify the local microstructural changes of brain GM structure (<xref ref-type="bibr" rid="B24">Luders et al., 2006</xref>; <xref ref-type="bibr" rid="B34">Sandu et al., 2014</xref>; <xref ref-type="bibr" rid="B46">Wang et al., 2021</xref>). Next, the template-based matching method was applied to define regions of interest (ROIs) and to extract multiple structural morphological parameters from ROIs. For this study, spatially matching the GMV map with Brainnetome atlas could determine the volume of the 246 subregions (<xref ref-type="bibr" rid="B10">Fan et al., 2016</xref>). Cortical areas were defined by the high-resolution Human Connectome Project multimodal parcellation (HCP-MMP1.0) (<xref ref-type="bibr" rid="B15">Glasser et al., 2016</xref>). Mean cortical thickness, surface area, thickness, fractal dimension and gyrification index were extracted from 360 cortical parcels in the HCP-MPP1.0. Finally, MRI data from 128 PD patients and 71 HC participants were retained after image quality control. There were total 1686 (246 + 360 &#x00D7; 4) extracted feature dimensions for each participant.</p>
</sec>
<sec id="S2.SS2.SSS3">
<title>2.2.3 SNP and MRI data merging</title>
<p>Samples with SNP genotype data were combined with samples with MRI imaging data. The final sample with data from both modalities consisted of 167 cases, including 113 early PD patients and 54 HC healthy controls (<xref ref-type="fig" rid="F1">Figure 1</xref>). All data collection was approved by the relevant institutions, and participants signed a written informed consent.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Schematic overview of data screening. For T1 WI-MRI, a total of 209 subjects were downloaded from the PPMI database, including 135 individuals with Parkinson&#x2019;s disease (PD) and 74 health controls (HC). The images underwent preprocessing steps including segmentation and normalization, and were final registered to the MNI standard brain space. Following image quality control procedures, 7 PD subjects and 3 HC were excluded due to poor registration results. Ultimately, 128 PD and 71 HC subjects were retained for region of interest (ROI) definition and multidimensional MRI feature extraction. For genetic data, 619 subjects were downloaded from the PPMI database, including 383 PD and 178 HC, with 58 subjects&#x2019; phenotypes were missing. Firstly, based on the multi-dimensional scaling (MDS) protocol, 16 PD and 13 HC were excluded due to anomalies in the phenotype data. Subsequently, quality control was performed on the SNP sites, resulting in the exclusion of 219,193 SNPs that did not meet the quality criteria. Finally, a total of 167 subjects had both modalities of data, consisting of 113 PD patients and 54 HC, with each subject contributing 1,686 MRI features and 48,414 high-quality SNP data.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-17-1510192-g001.tif"/>
</fig>
</sec>
</sec>
<sec id="S2.SS3">
<title>2.3 Feature selection</title>
<p>A novel hybrid feature selection method (Fisher-EnLasso-PLS), which integrates Fisher discriminant analysis, lasso-based integrated stable feature selection algorithm and partial least squares (PLS) algorithm, was designed to optimize the feature selection process in high-dimensional imaging genetics data through phased refined feature screening strategy. Fisher discriminant analysis initially selects features that enhance class distinction, the Lasso-based algorithm selects robust features via sparsity, and the PLS algorithm captures the relationships between features and the response variable. By combining these techniques, this hybrid feature selection method could not only reduces dimensionality but also extracts essential information while minimizing the risk of model overfitting. The method is detailed below:</p>
<p>Firstly, Fisher discriminant analysis is employed to initially filter out irrelevant features. This method is efficient and computationally simple, demonstrating strong performance in high-dimensional gene feature selection (<xref ref-type="bibr" rid="B37">Sun et al., 2019</xref>; <xref ref-type="bibr" rid="B55">Zhang et al., 2021</xref>). A higher Fisher score indicates a feature&#x2019;s capacity to differentiate between PD and HC samples.</p>
<p>Following this initial filtration, the number of candidate features is reduced to a more manageable level. However, it is important to note that Fisher&#x2019;s method primarily emphasizes feature correlation and does not account for redundancy or interaction among features. To address this limitation, the ensemble Lasso (EnLasso) algorithm is applied next. EnLasso leverages data perturbation and ensemble learning to synthesize results from multiple training subsets, thus enhancing the accuracy and robustness of feature selection (<xref ref-type="bibr" rid="B45">Wang et al., 2022</xref>). Specifically, using stratified tenfold cross-validation, 90% of the training samples are selected and subsequently balanced through the SVM-SMOTE resampling method, which alleviates inaccuracies in feature selection stemming from class imbalances. The SVM-SMOTE method integrates the principles of SVM with synthetic data generation techniques; it leverages SVM to identify the boundary samples of the training set&#x2014;support vectors&#x2014;and performs adaptive interpolation within the kernel space on these support vectors to generate new samples, which has good performance in non-linear and high-dimensional data scenarios. The Lasso algorithm is then applied to these subsets, with training sample perturbations enhancing the stability of feature selection results. This process is repeated 10 times to produce M candidate feature subsets<italic>S</italic><sub><italic>i</italic></sub> (1 &#x2264; <italic>i</italic> &#x2264; <italic>M</italic>). An ensemble strategy then amalgamates these subsets by comprehensively assessing both feature occurrence frequency (<italic>FS</italic><sub><italic>q</italic></sub>) and assigned weights (<italic>FS</italic><sub><italic>w</italic></sub>), resulting in an importance score (IS) for each feature, calculated using the following formula:</p>
<disp-formula id="S2.E1">
<label>(1)</label>
<mml:math id="M1">
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:msub>
<mml:mi>S</mml:mi>
<mml:mi>q</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>f</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>M</mml:mi>
</mml:mfrac>
<mml:munderover>
<mml:mo largeop="true" movablelimits="false" symmetric="true">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>M</mml:mi>
</mml:munderover>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mi>f</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>S</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula><mml:math id="INEQ3"><mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mo>&#x2062;</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>D</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mo>{</mml:mo><mml:mi>f</mml:mi><mml:mo>:</mml:mo><mml:mrow><mml:msubsup><mml:mi mathvariant="normal">&#x03C9;</mml:mi><mml:mi>f</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>i</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:msubsup><mml:mo>&#x2260;</mml:mo><mml:mn>0</mml:mn></mml:mrow><mml:mo>}</mml:mo></mml:mrow></mml:mrow></mml:math></inline-formula> was defined as all the selected features performed by the feature selection algorithm on the <italic>th i</italic> sampled training subset <italic>D</italic><sub><italic>i</italic></sub>. When the feature was selected, it was assigned 1, otherwise it was 0. <italic>FS</italic><sub><italic>q</italic></sub> metric quantifies the consistency with which a feature is selected across multiple iterations of the feature selection algorithm when applied to various training subsets. The higher the <italic>FS</italic><sub><italic>q</italic></sub>, the stronger the stability of the feature itself.</p>
<disp-formula id="S2.E2">
<label>(2)</label>
<mml:math id="M2">
<mml:mrow>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:msub>
<mml:mi>S</mml:mi>
<mml:mi>w</mml:mi>
</mml:msub>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>f</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>M</mml:mi>
</mml:mfrac>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:munderover>
<mml:mo largeop="true" movablelimits="false" symmetric="true">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>M</mml:mi>
</mml:munderover>
<mml:msubsup>
<mml:mi mathvariant="normal">&#x03C9;</mml:mi>
<mml:mi>f</mml:mi>
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:msubsup>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Where <inline-formula><mml:math id="INEQ5"><mml:msubsup><mml:mi mathvariant="normal">&#x03C9;</mml:mi><mml:mi>f</mml:mi><mml:msub><mml:mi>D</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:msubsup></mml:math></inline-formula> represented the weight assigned to the feature <italic>f</italic> when performing the feature selection algorithm on the <italic>th i</italic> sampled training subset <italic>D</italic><sub><italic>i</italic></sub>. <italic>FS</italic><sub><italic>w</italic></sub> reflectes the feature&#x2019;s contribution to accurately identifying the target variable. Features with higher weights are more influential in distinguishing between classes, thereby enhancing the model&#x2019;s classification performance.</p>
<disp-formula id="S2.E3">
<label>(3)</label>
<mml:math id="M3">
<mml:mrow>
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>S</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>f</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mn>2</mml:mn>
</mml:mfrac>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:msub>
<mml:mi>S</mml:mi>
<mml:mi>q</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:msub>
<mml:mi>S</mml:mi>
<mml:mi>w</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>By integrating <italic>FS</italic><sub><italic>q</italic></sub> and <italic>FS</italic><sub><italic>w</italic></sub>, we calculated the IS, which is a composite measure that encapsulates both the frequency of feature occurrence and the weights assigned to them. The IS ensures that the selected features are not only consistently chosen across different iterations but also have a substantialcontribuation on the model&#x2019;s predictive capabilities. By sorting the features in descending order based on their IS values, a new ranked list of features is generated, from which the top-k features are selected using a forward search strategy.</p>
<p>In the final stage, to account for feature interaction, the PLS algorithm was employed for further dimensionality reduction, extracting principal components most pertinent to PD. Unlike PCA, which is an unsupervised method that considers only the characteristic variable data, PLS maximizes covariance between independent and dependent variables. It combines principal component analysis, correlation analysis, and regression not only addresses feature interactions to eliminate correlations among the data but also incorporates label vectors, effectively preserving key information related to the target task (<xref ref-type="bibr" rid="B22">Li et al., 2008</xref>).</p>
</sec>
<sec id="S2.SS4">
<title>2.4 Feature fusion</title>
<p>There are two kinds of feature fusion methods: feature level and decision level.</p>
<sec id="S2.SS4.SSS1">
<title>2.4.1 Feature level fusion</title>
<p>Feature-level multimodal fusion combines features from different modalities into a new matrix for joint feature selection and model training. This study merged genetic and MRI image features into a 50,100-dimensional matrix. To facilitate feature selection from this high-dimensional sparse data, we devised two optimization strategies, shown in <xref ref-type="fig" rid="F2">Figure 2</xref>.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Framework of the fusion method of SNPs and MRI features based on feature level.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-17-1510192-g002.tif"/>
</fig>
<list list-type="simple">
<list-item>
<label>1.</label>
<p>Fusion1</p>
</list-item>
</list>
<p>The first strategy employs the Fisher-EnLasso-PLS algorithm, as detailed in the <italic>Feature Selection</italic> section, for joint feature selection on the fusion matrix. Subsequently, model training is conducted to develop a multimodal fusion classification model, referred to as Fusion1.</p>
<list list-type="simple">
<list-item>
<label>1.</label>
<p>Fusion2</p>
</list-item>
</list>
<p>Given the inherent differences between genetic and MRI modalities in characterizing Parkinson&#x2019;s disease (PD), feature variable groups exist within the multimodal feature matrix. Traditional Lasso, which relies on l1 regularization, focuses solely on penalizing individual feature variables and overlooks group effects, thus limiting its efficacy in multimodal joint feature selection. To address this limitation, we replaced the Lasso method in Fusion1 with the Sparse Group Lasso (sgLasso) algorithm. This method incorporates both l1 and l2 constraints, addressing inter-group and intra-group sparsity, thus refining the joint feature matrix and isolating a higher quality feature subset (<xref ref-type="bibr" rid="B36">Simon et al., 2013</xref>).</p>
<disp-formula id="S2.E4">
<label>(4)</label>
<mml:math id="M4">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi mathvariant="normal">&#x03B2;</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>g</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>L</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>a</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>s</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>o</mml:mi>
</mml:mrow>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:munder>
<mml:mrow>
<mml:mi>arg</mml:mi>
<mml:mo movablelimits="false">&#x2061;</mml:mo>
<mml:mi>min</mml:mi>
</mml:mrow>
<mml:mi mathvariant="normal">&#x03B2;</mml:mi>
</mml:munder>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mn>2</mml:mn>
</mml:mfrac>
<mml:mo>&#x2062;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mo>-</mml:mo>
<mml:mrow>
<mml:munderover>
<mml:mo largeop="true" movablelimits="false" symmetric="true">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>L</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2062;</mml:mo>
<mml:msup>
<mml:mi mathvariant="normal">&#x03B2;</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mrow>
</mml:mrow>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="normal">&#x03BB;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:munderover>
<mml:mo largeop="true" movablelimits="false" symmetric="true">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>L</mml:mi>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:msup>
<mml:mi mathvariant="normal">&#x03B2;</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="normal">&#x03BB;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#x2062;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="normal">&#x03B2;</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Among them, parameter <italic>&#x03BB;</italic><sub>1</sub> is used to adjust the inter-group sparsity, and parameter <italic>&#x03BB;</italic><sub>2</sub> is used to adjust the intra-group sparsity.</p>
<p>The sgLasso method was incorporated into the hybrid feature selection process named Fisher-EnsgLasso-PLS, and forming a new feature fusion strategy referred to as Fusion2.</p>
</sec>
<sec id="S2.SS4.SSS2">
<title>2.4.2 Decision level fusion</title>
<p>The decision-level multimodal fusion method trains each modality separately to create N base classification models, then use ensemble learning to combine their predictions for a final result. The Stacking ensemble approach, ground in the principle of &#x201C;collective intelligence&#x201D; (<xref ref-type="bibr" rid="B27">Naimi and Balzer, 2018</xref>), merges outputs from diverse models using a meta-learner, enhancing classification accuracy and robustness beyond individual models. However, the choice of primary base classifiers is often subjective and not automated. We introduced an Adaptive-Selection-Enhanced Stacking ensemble learning framework (AE_Stacking), depicted in <xref ref-type="fig" rid="F3">Figure 3</xref>. This framework adaptively selects<italic>M</italic> (<italic>M</italic> &#x2264; <italic>N</italic>)top-performing models from <italic>N</italic>base models and assigns weights based on their initial performance (see the GitHub repository).<sup><xref ref-type="fn" rid="footnote5">5</xref></sup> This enhances model diversity and representation, boosting overall integration performance. The implementation process is as follows:</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>Framework of adaptive-selection-enhanced stacking ensemble learning (AE_Stacking).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-17-1510192-g003.tif"/>
</fig>
<sec id="S2.SS4.SSS2.Px1">
<title>2.4.2.1 Step 1: data division</title>
<p>The training data is denoted as <italic>T<sub>r</sub></italic>, and the test data as <italic>T<sub>e</sub></italic>. Training set samples are divided into K subsets <italic>T</italic><sub><italic>r</italic></sub>{<italic>T</italic><sub><italic>r</italic>1</sub>,<italic>T</italic><sub><italic>r</italic>2</sub>,&#x2026;,<italic>T</italic><sub><italic>rk</italic></sub>} via K-fold cross-validation. The first-layer base classifiers are represented as <italic>C</italic><sub><italic>layer</italic>1</sub> {<italic>C</italic><sub>1</sub>, <italic>C</italic><sub>2</sub>,&#x2026;, <italic>C</italic><sub><italic>N</italic></sub>}, and the second-layer meta-learner model as <italic>Clayer</italic> 2;</p>
</sec>
<sec id="S2.SS4.SSS2.Px2">
<title>2.4.2.2 Step 2: training first-layer base classifiers</title>
<p>Each base classifier <italic>Ci</italic> is trained using K-1 folds, making predictions on the remaining fold to obtain predicted probability values for each model.</p>
</sec>
<sec id="S2.SS4.SSS2.Px3">
<title>2.4.2.3 Step 3: adaptive selection and boosting</title>
<p>The balanced accuracy <inline-formula><mml:math id="INEQ9"><mml:mrow><mml:mi>B</mml:mi><mml:mo>&#x2062;</mml:mo><mml:mi>a</mml:mi><mml:mo>&#x2062;</mml:mo><mml:mi>c</mml:mi><mml:mo>&#x2062;</mml:mo><mml:msubsup><mml:mi>c</mml:mi><mml:mi>k</mml:mi><mml:mi>i</mml:mi></mml:msubsup></mml:mrow></mml:math></inline-formula> for each base classifier is calculated on K-fold training samples. Base models with <italic>Bacc</italic> exceeding a predefined threshold &#x03C4; are selected as the first-layer base learners.</p>
<disp-formula id="S2.E5">
<label>(5)</label>
<mml:math id="M5">
<mml:mrow>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>a</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>c</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>c</mml:mi>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mn>2</mml:mn>
</mml:mfrac>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
<mml:mo>+</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="S2.E6">
<label>(6)</label>
<mml:math id="M6">
<mml:mrow>
<mml:msub>
<mml:mover accent='true'>
<mml:mi>C</mml:mi>
<mml:mo>&#x2322;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mtable>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mtext>&#x00A0;</mml:mtext>
<mml:mi>B</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>c</mml:mi>
<mml:msup>
<mml:mi>c</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mo>&#x003E;</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:mfrac>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mstyle displaystyle='true'>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>N</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>K</mml:mi>
</mml:mfrac>
<mml:mstyle displaystyle='true'>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>K</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>c</mml:mi>
<mml:msubsup>
<mml:mi>c</mml:mi>
<mml:mi>k</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:mstyle>
<mml:mtext>&#x2009;</mml:mtext>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>j</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>t</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>o</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>h</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>w</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>e</mml:mi>
<mml:mtext>&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;&#x00A0;</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where TP, TN, FP, and FN correspond to true positives, true negatives, false positives, and false negatives, respectively.</p>
<p>The prediction probability scores of the selected<italic>M</italic> base models on the training samples <italic>T</italic><sub><italic>rk</italic></sub> are concatenated to obtain initial prediction results <italic>P</italic>{<italic>p</italic><sup>1</sup>,<italic>p</italic><sup>2</sup>,&#x2026;,<italic>p<sup>M</sup></italic>}. Additionally, weights &#x03BB;<italic><sup>i</sup></italic>for the selected base learner are computed according to their <inline-formula><mml:math id="INEQ12"><mml:mrow><mml:mi>B</mml:mi><mml:mo>&#x2062;</mml:mo><mml:mi>a</mml:mi><mml:mo>&#x2062;</mml:mo><mml:mi>c</mml:mi><mml:mo>&#x2062;</mml:mo><mml:msubsup><mml:mi>c</mml:mi><mml:mi>k</mml:mi><mml:mi>i</mml:mi></mml:msubsup></mml:mrow></mml:math></inline-formula>:</p>
<disp-formula id="S2.E7">
<label>(7)</label>
<mml:math id="M7">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="normal">&#x03BC;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>M</mml:mi>
</mml:mfrac>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:munderover>
<mml:mo largeop="true" movablelimits="false" symmetric="true">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>M</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>a</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>c</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:msubsup>
<mml:mi>c</mml:mi>
<mml:mi>k</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="S2.E8">
<label>(8)</label>
<mml:math id="M8">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="normal">&#x03BB;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo>-</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>M</mml:mi>
</mml:mfrac>
<mml:mo>&#x2022;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>-</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msup>
<mml:mi mathvariant="normal">&#x03BC;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msup>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mfrac>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The weight parameter &#x03BB;<italic><sup>i</sup></italic> fine-tunes each base learner, enhancing integration performance.</p>
</sec>
<sec id="S2.SS4.SSS2.Px4">
<title>2.4.2.4 Step 4: meta-learner training and prediction</title>
<p>The weighted initial predictions from Step 3 (<italic>P</italic>{<italic>p</italic><sup>1</sup>,<italic>p</italic><sup>2</sup>,&#x2026;,<italic>p<sup>M</sup></italic>}) serve as inputs for training the second-layer learner. Each base learner makes K predictions on the test set <italic>T<sub>e</sub></italic> during the first-layer.</p>
<p>The initial prediction result for each base learner (<italic>Q</italic>{<italic>q</italic><sup>1</sup>,<italic>q</italic><sup>2</sup>,&#x2026;,<italic>q<sup>M</sup></italic>}) is obtained by weighted averaging the K test results, which is then multiplied by &#x03BB;<italic><sup>i</sup></italic> to form the new test set for the meta-learner model. The meta-learner&#x2019;s performance on this new test set determines the final results.</p>
</sec>
</sec>
</sec>
<sec id="S2.SS5">
<title>2.5 Modeling and evaluation</title>
<p>In this study, we employed eight well-established ML classification algorithms: Logistic regression (LR), Support Vector Machine (SVM), multilayer perceptron (MLP), Adaptive Boosting (AdaBoost), Random forest (RF), Gradient boosting decision tree (GBDT), Extreme gradient boosting (XGBoost) and Light gradient boosting machine (LightGBM). These algorithms were utilized to develop binary classification models for differentiating between PD and HC, followed by a comparative analysis of their performance.</p>
<sec id="S2.SS5.SSS1">
<title>2.5.1 Modeling</title>
<p>To evaluate the efficacy of multimodal fusion of SNPs and MRI data in enhancing PD classification performance, we implemented two distinct strategies:</p>
<sec id="S2.SS5.SSS1.Px1">
<title>2.5.1.1 Strategy 1: feature-level multimodal fusion classification</title>
<p>We compared the classification performance of three different input models&#x2014;MRI, SNP, and their combination&#x2014;using eight classifiers. For the fusion of MRI and SNP features, we evaluated Fusion1 and Fusion2 method. Hyperparameter optimization ranges for each classifier are in <xref ref-type="supplementary-material" rid="TS1">Supplementary Table S1</xref>, with tuning done via nested five-fold cross-validation and grid search.</p>
</sec>
</sec>
<sec id="S2.SS5.SSS2">
<title>2.5.1.2 Strategy 2: decision-level multimodal fusion classification</title>
<p>In this strategy, the aforementioned eight classifiers served as candidate base classifiers within our proposed AE_Stacking framework. This framework automatically selects the optimal base classifier for ensemble combination and feature enhancement. A simple logistic regression model was employed as the meta-learner to mitigate the risk of overfitting. To demonstrate the superiority of decision-level multimodal fusion of imaging and genetic features, we conducted several comparative experiments: (1) comparison against single-modality single-classifier performance; (2) comparison with single-modality multi-classifier performance, where the ensemble model&#x2019;s input consisted solely of single-modality features, assessing performance solely based on multi-classifier fusion; and (3) comparison with the feature-level fusion model.</p>
</sec>
<sec id="S2.SS5.SSS3">
<title>2.5.2 Evaluation</title>
<p>The dataset was hierarchically divided into training, validation, and testing sets at a ratio of 8:1:1. To ensure fairness and address the limitations of sample size, the data was randomly shuffled, and the above steps were repeated ten times, resulting in ten distinct sets of training, validation, and test sets. The training set was used for model training, the validation set for optimal feature subset determination and hyperparameter tuning, and the test set for recording the balanced accuracy (Bacc), sensitivity (Sen), specificity (Spe), G-mean, F1-score, and AUC values as classification performance metrics. The mean and standard deviation (mean &#x00B1; SD) of the results from ten runs were reported for performance comparison between models.</p>
</sec>
</sec>
<sec id="S2.SS6">
<title>2.6 Statistical analysis</title>
<p>SPSS (IBM SPSS 26.0, SPSS Inc.) software was used for statistical analyses. For the comparison of demographic variables, the chi-square test (&#x03C7;<sup>2</sup>-test) was used to assess the differences in sex and t test was performed for comparisons of age. The Mann&#x2013;Whitney U test was used to compare non-normally distributed data. All statistical tests were two-tailed, and <italic>p</italic> &#x003C; 0.05 was considered significant.</p>
</sec>
</sec>
<sec id="S3" sec-type="results">
<title>3 Results</title>
<sec id="S3.SS1">
<title>3.1 Clinical information</title>
<p>The demographic, clinical, and neuropsychological characteristics of 113 patients with PD and 54 HC are summarized in <xref ref-type="table" rid="T1">Table 1</xref>. The groups exhibited no significant differences in age, sex, or education level (<italic>p</italic> &#x003E; 0.05). Significant differences in clinical non-motor symptoms were observed in the MDS-UPDRS-III, UPSIT, and SCOPA-AUT scales (<italic>p</italic> &#x003C; 0.0001) across all PD and HC participants.</p>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Demographics, clinical and neuropsychological characteristics of study participants.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="left" style="color:#ffffff;background-color: #7f8080;"></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>PD (<italic>n</italic> = 113)</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>HC (<italic>n</italic> = 54)</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold><italic>p</italic>-value</bold></td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Sex (male/female)</td>
<td valign="top" align="center">66/47</td>
<td valign="top" align="center">33/21</td>
<td valign="top" align="center">0.626</td>
</tr>
<tr>
<td valign="top" align="left">Age (years)</td>
<td valign="top" align="center">61.02 &#x00B1; 8.74</td>
<td valign="top" align="center">62.23 &#x00B1; 8.05</td>
<td valign="top" align="center">0.345</td>
</tr>
<tr>
<td valign="top" align="left">Education level (years)</td>
<td valign="top" align="center">15.41 &#x00B1; 3.02</td>
<td valign="top" align="center">15.37 &#x00B1; 2.97</td>
<td valign="top" align="center">0.859</td>
</tr>
<tr>
<td valign="top" align="left">Hoehn &#x0026; Yahr</td>
<td valign="top" align="center">1.61 &#x00B1; 0.49</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">MDS-UPDRS-III</td>
<td valign="top" align="center">21.04 &#x00B1; 9.00</td>
<td valign="top" align="center">0.50 &#x00B1; 1.27</td>
<td valign="top" align="center">&#x003C;0.001<xref ref-type="table-fn" rid="t1fns1">&#x002A;&#x002A;</xref></td>
</tr>
<tr>
<td valign="top" align="left">UPSIT</td>
<td valign="top" align="center">22.13 &#x00B1; 8.61</td>
<td valign="top" align="center">33.30 &#x00B1; 4.71</td>
<td valign="top" align="center">&#x003C;0.001<xref ref-type="table-fn" rid="t1fns1">&#x002A;&#x002A;</xref></td>
</tr>
<tr>
<td valign="top" align="left">GDS</td>
<td valign="top" align="center">4.60 &#x00B1; 1.78</td>
<td valign="top" align="center">4.77 &#x00B1; 1.82</td>
<td valign="top" align="center">0.479</td>
</tr>
<tr>
<td valign="top" align="left">MoCA</td>
<td valign="top" align="center">27.71 &#x00B1; 2.02</td>
<td valign="top" align="center">28.24 &#x00B1; 1.09</td>
<td valign="top" align="center">0.304</td>
</tr>
<tr>
<td valign="top" align="left">SCOPA-AUT</td>
<td valign="top" align="center">9.62 &#x00B1; 6.67</td>
<td valign="top" align="center">6.24 &#x00B1; 4.58</td>
<td valign="top" align="center">&#x003C;0.001<xref ref-type="table-fn" rid="t1fns1">&#x002A;&#x002A;</xref></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn><p>Data are presented as means (standard deviation). PD, Parkinson&#x2019;s disease; HC, health control; MDS-UPDRS-III, Part three of the Unified Parkinson Disease Rating Scale; UPSIT, University of Pennsylvania Smell Identification Test; MoCA, Montreal Cognitive Assessment; GDS, the Geriatric Depression Scaled; SCOPA-AUT, the Scales for Outcomes in PD Autonomic; &#x03C7;<sup>2</sup>-test was performed for comparisons of sex; <italic>t</italic> test was performed for comparisons of age; Mann-Whitney U test was applied to compare non-normal distribution data;</p></fn>
<fn id="t1fns1"><p>&#x002A;&#x002A;<italic>p</italic> &#x003C; 0.001; &#x002A;<italic>p</italic> &#x003C; 0.05.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="S3.SS2">
<title>3.2 Classification performance of SNP</title>
<p>This study first evaluated the classification performance for PD using single-modality SNP genotype data, and validated the efficacy of the Fisher-EnLasso-PLS feature selection method through ablation studies. The integration of genetic and imaging data risks reducing sample size and introducing bias. To address this, experiments were conducted on a dataset comprising 532 subjects (367 PD patients and 165 healthy controls). A linear kernel SVM with L1 regularization was trained, validated, and tested on the selected features. <xref ref-type="table" rid="T2">Table 2</xref> presents the average classification performance and the optimal number of features derived from ten experimental runs per method.</p>
<table-wrap position="float" id="T2">
<label>TABLE 2</label>
<caption><p>Ablation comparison experiments.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="left" style="color:#ffffff;background-color: #7f8080;"><bold>Feature selection method</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>Average number of features</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>Bacc</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>G-mean</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>F1</bold></td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Fisher</td>
<td valign="top" align="center">313</td>
<td valign="top" align="center">86.55 &#x00B1; 6.62</td>
<td valign="top" align="center">85.95 &#x00B1; 6.99</td>
<td valign="top" align="center">82.79 &#x00B1; 8.11</td>
</tr>
<tr>
<td valign="top" align="left">Fisher-EnLasso</td>
<td valign="top" align="center">259</td>
<td valign="top" align="center">87.53 &#x00B1; 6.11</td>
<td valign="top" align="center">87.07 &#x00B1; 6.22</td>
<td valign="top" align="center">83.84 &#x00B1; 7.02</td>
</tr>
<tr>
<td valign="top" align="left">Fisher-PCA</td>
<td valign="top" align="center">46</td>
<td valign="top" align="center">89.63 &#x00B1; 5.44</td>
<td valign="top" align="center">89.45 &#x00B1; 4.85</td>
<td valign="top" align="center">85.83 &#x00B1; 7.49</td>
</tr>
<tr>
<td valign="top" align="left">Fisher-PLS</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">90.05 &#x00B1; 4.76</td>
<td valign="top" align="center">90.00 &#x00B1; 5.45</td>
<td valign="top" align="center">85.18 &#x00B1; 6.78</td>
</tr>
<tr>
<td valign="top" align="left">Fisher-EnLasso-PCA</td>
<td valign="top" align="center">27</td>
<td valign="top" align="center">91.61 &#x00B1; 3.40</td>
<td valign="top" align="center">91.41 &#x00B1; 3.60</td>
<td valign="top" align="center">89.04 &#x00B1; 3.98</td>
</tr>
<tr>
<td valign="top" align="left">Fisher-EnLasso-PLS</td>
<td valign="top" align="center">9</td>
<td valign="top" align="center">94.54 &#x00B1; 2.17</td>
<td valign="top" align="center">94.50 &#x00B1; 2.20</td>
<td valign="top" align="center">92.36 &#x00B1; 2.40</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The Fisher-EnLasso-PLS hybrid feature selection method demonstrated superior performance, achieving the highest accuracy with fewer features. It attained an average balanced accuracy (Bacc) of 94.54%. The EnLasso stage, following Fisher selection, effectively eliminated redundancies and reduced dimensionality, while EnLasso alone only marginally improved performance, increasing average Bacc by 0.98% compared to the Fisher-only method.</p>
<p>In comparisons between Fisher-PCA and Fisher-PLS, the classification performance was inferior to the Fisher-EnLasso-PCA and Fisher-EnLasso-PLS techniques, underscoring the EnLasso algorithm&#x2019;s efficacy in removing unnecessary complex features. Moreover, PLS proved more effective than PCA in dimensionality reduction. The Fisher-EnLasso-PLS algorithm, utilizing cascaded PLS, achieved a 2.93% higher average accuracy than Fisher-EnLasso-PCA with cascaded PCA, along with a narrower standard deviation. To illustrate performance differences, PCA and PLS were used to reduce the feature space to two dimensions after Fisher-EnLasso selection, visualizing data distribution and SVM (linear kernel, l1 = 0.01) decision boundaries in the initial experiment. <xref ref-type="fig" rid="F4">Figure 4</xref> shows that PLS-extracted principal components more effectively distinguished between positive and negative samples than PCA.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Visualization of the data (training set) distribution after Fisher-EnLasso feature selection. <bold>(A)</bold> The visualization result using the PCA algorithm. <bold>(B)</bold> The visualization result using the PLS algorithm; decision dividers are plotted based on the SVM model. &#x201C;0&#x201D; indicates PD patient samples; &#x201C;1&#x201D; denotes HC control samples.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-17-1510192-g004.tif"/>
</fig>
</sec>
<sec id="S3.SS3">
<title>3.3 Classification performance of SNP and MRI fusion</title>
<sec id="S3.SS3.SSS1">
<title>3.3.1 Feature-level fusion classification outcomes</title>
<p>The effectiveness of classification using feature-level integration of SNP and MRI data is detailed in <xref ref-type="table" rid="T3">Table 3</xref>. Key findings include: (i) Single SNP features consistently exhibited superior classification capability compared to MRI imaging features; (ii) The Fusion2 method generally achieved higher accuracy than Fusion1, surpassing the best performance of individual modalities. For instance, Fusion2&#x2019;s accuracy, combining image and genetic data, exceeded the top-performing MLP model by 8.49% for MRI features and by 1.8% for SNP features; (iii) Multimodal fusion did not universally outperform unimodal approaches. Specifically, the SNP-based model outperformed multimodal fusion when using RF, AdaBoost, and GBDT classifiers, potentially due to suboptimal &#x201C;learning&#x201D; of MRI features, which could introduce noise and diminish classifier performance.</p>
<table-wrap position="float" id="T3">
<label>TABLE 3</label>
<caption><p>Classification performance based on multi-modal fusion features and single-modal features.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="left" style="color:#ffffff;background-color: #7f8080;"><bold>Classifier</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>MRI</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>SNP</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>Fusion1</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>Fusion2</bold></td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">LR</td>
<td valign="top" align="center">78.72 &#x00B1; 8.71</td>
<td valign="top" align="center">87.15 &#x00B1; 5.51</td>
<td valign="top" align="center">85.84 &#x00B1; 5.11</td>
<td valign="top" align="center">87.72 &#x00B1; 4.39</td>
</tr>
<tr>
<td valign="top" align="left">SVM</td>
<td valign="top" align="center">80.68 &#x00B1; 11.36</td>
<td valign="top" align="center">85.51 &#x00B1; 9.33</td>
<td valign="top" align="center">84.93 &#x00B1; 8.89</td>
<td valign="top" align="center">89.13 &#x00B1; 7.56</td>
</tr>
<tr>
<td valign="top" align="left">RF</td>
<td valign="top" align="center">70.64 &#x00B1; 11.63</td>
<td valign="top" align="center">87.00 &#x00B1; 8.86</td>
<td valign="top" align="center">78.77 &#x00B1; 10.68</td>
<td valign="top" align="center">72.92 &#x00B1; 9.77</td>
</tr>
<tr>
<td valign="top" align="left">MLP</td>
<td valign="top" align="center">83.60 &#x00B1; 7.04</td>
<td valign="top" align="center">90.29 &#x00B1; 6.48</td>
<td valign="top" align="center">89.64 &#x00B1; 5.57</td>
<td valign="top" align="center">92.09 &#x00B1; 3.91</td>
</tr>
<tr>
<td valign="top" align="left">AdaBoost</td>
<td valign="top" align="center">74.19 &#x00B1; 9.59</td>
<td valign="top" align="center">85.67 &#x00B1; 9.67</td>
<td valign="top" align="center">73.43 &#x00B1; 8.37</td>
<td valign="top" align="center">76.40 &#x00B1; 7.09</td>
</tr>
<tr>
<td valign="top" align="left">GBDT</td>
<td valign="top" align="center">72.08 &#x00B1; 7.01</td>
<td valign="top" align="center">84.29 &#x00B1; 8.41</td>
<td valign="top" align="center">73.93 &#x00B1; 8.50</td>
<td valign="top" align="center">76.57 &#x00B1; 8.21</td>
</tr>
<tr>
<td valign="top" align="left">XGBoost</td>
<td valign="top" align="center">81.31 &#x00B1; 10.79</td>
<td valign="top" align="center">87.27 &#x00B1; 6.82</td>
<td valign="top" align="center">85.18 &#x00B1; 6.76</td>
<td valign="top" align="center">88.73 &#x00B1; 5.79</td>
</tr>
<tr>
<td valign="top" align="left">LightGBM</td>
<td valign="top" align="center">78.04 &#x00B1; 10.77</td>
<td valign="top" align="center">84.48 &#x00B1; 5.41</td>
<td valign="top" align="center">83.54 &#x00B1; 8.48</td>
<td valign="top" align="center">85.57 &#x00B1; 4.54</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn><p>The values in bold represent the best mean accuracy achieved in each feature fusion model.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="S3.SS3.SSS2">
<title>3.3.2 Decision-level fusion classification results</title>
<p>To demonstrate the effectiveness of decision-level fusion with the AE_Stacking technique for integrating image and genetic features, ablation studies were conducted. This method was benchmarked against the best single-modal model with one classifier, single-modal models with multiple classifiers, and feature-level fusion models. As shown in <xref ref-type="table" rid="T3">Table 3</xref>, MLP emerged as the top performer for both unimodal and feature-level fusion, serving as the primary benchmark. We also tested the single-modal multi-classifier approach by inputting each modality&#x2019;s features into AE_Stacking and adjusting the multi-classifier configuration. Additionally, we evaluated a model trained on a multimodal feature matrix with feature-level fusion as input to AE_Stacking. The data in <xref ref-type="table" rid="T4">Table 4</xref> revealed that the AE_Stacking decision-level fusion achieved the highest average balanced accuracy, sensitivity, G-mean, and F1 scores-95.36, 94.36, 95.30, and 93.41%, respectively, surpassing feature-level fusion (<italic>p</italic> &#x003C; 0.05). Moreover, AE_Stacking models with integrated multi-classifiers consistently delivered improved classification outcomes, characterized by a high mean and a reduced standard deviation (<italic>p</italic> &#x003C; 0.05), when compared to single classifier models, irrespective of whether unimodal or feature-level multimodal fusion was utilized. This underscores both the efficacy and stability of the proposed strategy.</p>
<table-wrap position="float" id="T4">
<label>TABLE 4</label>
<caption><p>Classification performance based on decision-level fusion.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="left" style="color:#ffffff;background-color: #7f8080;"></td>
<td valign="top" align="center" colspan="2" style="color:#ffffff;background-color: #7f8080;"><bold>MRI</bold></td>
<td valign="top" align="center" colspan="2" style="color:#ffffff;background-color: #7f8080;"><bold>SNP</bold></td>
<td valign="top" align="center" colspan="2" style="color:#ffffff;background-color: #7f8080;"><bold>Fusion2</bold></td>
<td valign="top" align="center" colspan="2" style="color:#ffffff;background-color: #7f8080;"><bold>MRI+SNP</bold></td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" style="color:#ffffff;background-color: #7f8080;"></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>MLP</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>AE_Stacking</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>MLP</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>AE_Stacking</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>MLP</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>AE_Stacking</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>MLP</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>AE_Stacking</bold></td>
</tr>
<tr>
<td valign="top" align="left">Bacc</td>
<td valign="top" align="center">83.88 &#x00B1; 9.30</td>
<td valign="top" align="center">85.27 &#x00B1; 5.66</td>
<td valign="top" align="center">90.29 &#x00B1; 6.48</td>
<td valign="top" align="center">91.09 &#x00B1; 6.15</td>
<td valign="top" align="center">92.09 &#x00B1; 5.80</td>
<td valign="top" align="center">93.27 &#x00B1; 5.57</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">95.36 &#x00B1; 4.77</td>
</tr>
<tr>
<td valign="top" align="left">Sen</td>
<td valign="top" align="center">78.67 &#x00B1; 20.50</td>
<td valign="top" align="center">76.00 &#x00B1; 14.97</td>
<td valign="top" align="center">84.36 &#x00B1; 13.73</td>
<td valign="top" align="center">84.00 &#x00B1; 13.63</td>
<td valign="top" align="center">86.00 &#x00B1; 12.72</td>
<td valign="top" align="center">92.00 &#x00B1; 9.80</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">94.36 &#x00B1; 7.37</td>
</tr>
<tr>
<td valign="top" align="left">Spe</td>
<td valign="top" align="center">89.09 &#x00B1; 10.60</td>
<td valign="top" align="center">94.55 &#x00B1; 9.92</td>
<td valign="top" align="center">97.35 &#x00B1; 3.50</td>
<td valign="top" align="center">96.36 &#x00B1; 6.80</td>
<td valign="top" align="center">98.18 &#x00B1; 3.64</td>
<td valign="top" align="center">94.55 &#x00B1; 7.27</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">96.36 &#x00B1; 3.40</td>
</tr>
<tr>
<td valign="top" align="left">G-mean</td>
<td valign="top" align="center">82.19 &#x00B1; 12.91</td>
<td valign="top" align="center">84.48 &#x00B1; 7.15</td>
<td valign="top" align="center">90.29 &#x00B1; 7.95</td>
<td valign="top" align="center">89.71 &#x00B1; 7.41</td>
<td valign="top" align="center">91.55 &#x00B1; 6.14</td>
<td valign="top" align="center">93.03 &#x00B1; 5.95</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">95.30 &#x00B1; 4.45</td>
</tr>
<tr>
<td valign="top" align="left">F1</td>
<td valign="top" align="center">77.05 &#x00B1; 6.18</td>
<td valign="top" align="center">80.45 &#x00B1; 4.45</td>
<td valign="top" align="center">88.23 &#x00B1; 9.36</td>
<td valign="top" align="center">87.43 &#x00B1; 8.64</td>
<td valign="top" align="center">90.14 &#x00B1; 8.30</td>
<td valign="top" align="center">90.44 &#x00B1; 6.37</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">93.41 &#x00B1; 4.81</td>
</tr>
</tbody>
</table></table-wrap>
<p><xref ref-type="fig" rid="F5">Figure 5</xref> presents the ROC curves and AUC metrics for each model, with 95% confidence intervals indicated in parentheses. The AE_Stacking-based multimodal fusion model notably achieved the highest AUC of 0.974, with a 95% confidence interval spanning from 0.93 to 1.00.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>ROC curves for each model.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-17-1510192-g005.tif"/>
</fig>
</sec>
</sec>
<sec id="S3.SS4">
<title>3.4 Cerebral regions and genetic markers associated with PD</title>
<p>The weights of each feature in ten experiments were averaged and then ranked in descending order to determine their relative contributions for PD. For MRI image features, we identified the top 10 ranked brain regions in each method. Due to the high dimensionality of the genetic data, we reported the top 30 ranked SNP loci. <xref ref-type="fig" rid="F6">Figure 6</xref> illustrates the Venn diagrams of brain regions and genes identified as the best features by unimodal and multimodal methods.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>Venn diagram of optimal features. <bold>(A)</bold> the optimal MRI image feature. &#x201C;lh&#x201D; represented regions located in the left cerebral cortex, while &#x201C;rh&#x201D; represented regions located in the right cerebral cortex. The characters in parentheses indicated the feature parameter index for each brain region. For detailed information on brain anatomy and definitions of brain regions, it could refer to websites <ext-link ext-link-type="uri" xlink:href="http://www.brainnetome.org/">http://www.brainnetome.org/</ext-link> and <ext-link ext-link-type="uri" xlink:href="http://www.humanconnectome.org/">http://www.humanconnectome.org/</ext-link>; <bold>(B)</bold> the optimal SNPs gene features.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-17-1510192-g006.tif"/>
</fig>
<p>Among MRI features, the FD feature corresponding to the 6r brain region in the left cerebral cortex [lh 6r (FD)], the GI feature corresponding to the 46 brain region on the right [rh 46 (GI)], and the right posterior inferotemporal region [rh PIT (GI)] consistently appeared in the top 10 features across all three sets of experiments. This indicates that they are the most stable imaging features with strong discriminative power for PD in MRI modality. The location of the these three regions in the brain were shown in <xref ref-type="supplementary-material" rid="TS1">Supplementary Figure S2</xref>. Compared to the HC group, the lh 6r (FD) feature showed a significant increase in the PD group, while the rh 46 (GI) and rh PIT (GI) features exhibited significant atrophy (<xref ref-type="fig" rid="F7">Figures 7A&#x2013;C</xref>).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption><p>Distribution plot of inter-group differences in the optimal stable features. <bold>(A&#x2013;C)</bold> The optimal MRI image feature. Compared to the HC group, the lh 6r(FD) feature showed a significant increase in the PD group, while the rh 46(GI) and rh PIT(GI) features both exhibited significant atrophy; <bold>(D&#x2013;P)</bold> the optimal SNPs features. All of these SNPs showed statistically significant differences between the PD group and the HC group.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-17-1510192-g007.tif"/>
</fig>
<p>For SNP loci, we referenced the international 1,000 genomes project (1,000 genomes) for gene annotation of the stable SNP loci ranked in the top 30 and reviewed relevant literature. As shown in <xref ref-type="table" rid="T5">Table 5</xref>, the SNPs with high discriminatory power were mainly located in the SNCA gene, the coding region of the VPS52 gene, and the SLC14A1 gene, all of which have been confirmed to be associated with PD. These SNPs demonstrated statistically significant differences between the PD and HC groups (<xref ref-type="fig" rid="F7">Figures 7D&#x2013;P</xref>).</p>
<table-wrap position="float" id="T5">
<label>TABLE 5</label>
<caption><p>TOP30 SNPs and corresponding gene annotations.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="left" style="color:#ffffff;background-color: #7f8080;"><bold>SNPs</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>Rs code</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>Chromosome location</bold></td>
<td valign="top" align="center" style="color:#ffffff;background-color: #7f8080;"><bold>Genes</bold></td>
<td valign="top" align="left" style="color:#ffffff;background-color: #7f8080;"><bold>Literature coverage</bold></td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">NeuroX_rs356181</td>
<td valign="top" align="center">rs356181</td>
<td valign="top" align="center">chr4: 90626111</td>
<td valign="top" align="center">SNCA</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B6">Blauwendraat et al. (2020)</xref>, <xref ref-type="bibr" rid="B18">Jia et al. (2022)</xref>, and <xref ref-type="bibr" rid="B33">Sampedro et al. (2018)</xref></td>
</tr>
<tr>
<td valign="top" align="left">exm2271486</td>
<td valign="top" align="center">rs7939948</td>
<td valign="top" align="center">chr11:36311014</td>
<td valign="top" align="center">COMMD9</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">exm2252875</td>
<td valign="top" align="center">rs1131636</td>
<td valign="top" align="center">chr17:1801189</td>
<td valign="top" align="center">RPA1</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B53">Yuan et al. (2020)</xref></td>
</tr>
<tr>
<td valign="top" align="left">exm19101</td>
<td valign="top" align="center">rs486557</td>
<td valign="top" align="center">chr1:15616139</td>
<td valign="top" align="center">FHAD1</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">exm2266280</td>
<td valign="top" align="center">rs1588787</td>
<td valign="top" align="center">chr6:163354979</td>
<td valign="top" align="center">PACRG</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B23">Liu et al. (2021)</xref></td>
</tr>
<tr>
<td valign="top" align="left">exm2264280</td>
<td valign="top" align="center">rs7015855</td>
<td valign="top" align="center">chr8:13660787</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">exm2266447</td>
<td valign="top" align="center">rs12704649</td>
<td valign="top" align="center">chr7:92674917</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">exm-rs213202</td>
<td valign="top" align="center">rs213202</td>
<td valign="top" align="center">chr6:33232055</td>
<td valign="top" align="center">VPS52</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B47">Wei et al. (2023)</xref></td>
</tr>
<tr>
<td valign="top" align="left">exm-rs213204</td>
<td valign="top" align="center">rs213204</td>
<td valign="top" align="center">chr6:33241076</td>
<td valign="top" align="center">VPS52</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B47">Wei et al. (2023)</xref></td>
</tr>
<tr>
<td valign="top" align="left">exm-rs2736990</td>
<td valign="top" align="center">rs2736990</td>
<td valign="top" align="center">chr4:90678541</td>
<td valign="top" align="center">SNCA</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B6">Blauwendraat et al. (2020)</xref>; <xref ref-type="bibr" rid="B18">Jia et al. (2022)</xref>, and <xref ref-type="bibr" rid="B33">Sampedro et al. (2018)</xref></td>
</tr>
<tr>
<td valign="top" align="left">NeuroX_rs7238033</td>
<td valign="top" align="center">rs7238033</td>
<td valign="top" align="center">chr18:43316966</td>
<td valign="top" align="center">SLC14A1</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B32">Recabarren and Alarcon (2017)</xref></td>
</tr>
<tr>
<td valign="top" align="left">exm1124271</td>
<td valign="top" align="center">rs57740714</td>
<td valign="top" align="center">chr14:94912896</td>
<td valign="top" align="center">SERPINA11</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">NeuroX_dbSNP_rs35534739</td>
<td valign="top" align="center">rs113343065</td>
<td valign="top" align="center">chr6:32583490</td>
<td valign="top" align="center">HLA-DQA1</td>
<td valign="top" align="left"><xref ref-type="bibr" rid="B48">Wissemann et al. (2013)</xref> and <xref ref-type="bibr" rid="B51">Yu et al. (2021)</xref></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn><p>&#x201C;&#x2013;&#x201D; indicates that no related genes and related literature reports were found.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
</sec>
<sec id="S4" sec-type="discussion">
<title>4 Discussion</title>
<p>The purpose of this study is to establish a multi-modal fusion learning model that enhances the diagnostic capabilities for PD by integrating MRI image data and genetic information. Our findings indicate that the decision-level fusion model (AE_Stacking) achieved the highest accuracy (95.36%) and AUC (0.974) in identifying PD, significantly outperforming models based solely on imaging or genetic data. Furthermore, the decision-level fusion model demonstrated superior performance compared to feature-level fusion models. By analyzing the latent features extracted by the model, we identified risk factors highly correlated with the disease, providing new insights into PD diagnosis.</p>
<p>Numerous studies have utilized ML or deep learning algorithms to investigate the value of various data modalities in PD diagnosis, such as clinical assessment scales (<xref ref-type="bibr" rid="B2">Ara&#x00FA;jo et al., 2023</xref>; <xref ref-type="bibr" rid="B44">Vitorio et al., 2023</xref>), electroencephalographic monitoring (<xref ref-type="bibr" rid="B29">Nour et al., 2023</xref>; <xref ref-type="bibr" rid="B38">Suuronen et al., 2023</xref>), cerebrospinal fluid biomarker detection (<xref ref-type="bibr" rid="B16">H&#x00F6;glinger et al., 2024</xref>; <xref ref-type="bibr" rid="B42">Tsukita et al., 2023</xref>), neuroimaging, and genetic testing. However, clinical assessment scales are often subjective, lacking adequate sensitivity and specificity; cerebrospinal fluid collection is invasive; and electroencephalographic monitoring is heavily influenced by individual variability, struggling to reflect changes in deeper brain regions. Consequently, these methods face considerable challenges in early PD screening. Imaging genomics represents an emerging field in data science. Neuroimaging genomics enable the integrated analysis of brain imaging and genomic data, providing new insights into brain phenotypes, genetic, and molecular characteristics and their influence on both normal and disordered brain functions and behaviors. For example, the G/A polymorphism may cause more extensive brain white matter damage in PD (<xref ref-type="bibr" rid="B52">Yu et al., 2022</xref>). Early-onset Parkinson&#x2019;s disease with atypical molecular imaging abnormalities in a patient carrying the de novo PRKCG mutation (<xref ref-type="bibr" rid="B7">Chen et al., 2022</xref>). Key genetic signatures of large-scale PD pathology have contributed to focal neuronal vulnerability to disease progression (<xref ref-type="bibr" rid="B3">Basaia et al., 2022</xref>). Therefore, exploring the underlying causes of PD from the source can provide more reliable and accurate foundations for PD diagnosis.</p>
<p>Effectively mining the associative information between imaging and genetic data poses a considerable challenge. Unlike the work of <xref ref-type="bibr" rid="B4">Bi et al. (2021a</xref>,<xref ref-type="bibr" rid="B5">b</xref>), they used correlations of gene and brain functional information from fMRI as model inputs. Although high accuracy rates (88.57%) were achieved, solely relying on fused features risked obscuring unique modality-specific information, potentially diminishing the model&#x2019;s overall performance by not fully leveraging the distinct contributions of each data type. To overcome these limitations, we developed and compared two fusion methods: feature-level and decision-level fusion. As shown in <xref ref-type="table" rid="T4">Table 4</xref> and <xref ref-type="fig" rid="F5">Figure 5</xref>, compared with the feature-level fusion method, the model using the designed AE_Stacking ensemble learning method for decision-level fusion achieved the highest classification accuracy (95.36%) and AUC value [0.974 (95%CI: 0.93&#x2013;1.00]. In the feature-level fusion approach, the direct concatenation of SNP features with MRI features fails to facilitate meaningful interaction between disparate modal features. This limitation hinders the model&#x2019;s ability to learn disease-related features from the fusion data. Conversely, the decision-level fusion strategy is similar to multi-task learning. By treating the two modal features as independent inputs, the model can perceive the learning process of each modality as a distinct task. Consequently, this fusion strategy effectively leverages both the commonalities and differences among various modalities to integrate the features of each modality comprehensively. The main advantage of using the AE_Stacking decision-level fusion strategy is the integration of the results of multiple strong classification base models. This method not only considers the independent contribution of each single modality feature to PD diagnosis, but also achieves complementary advantages of multiple base models through a &#x201C;strong combination&#x201D; approach, so the overall model has higher PD recognition performance. In addition, compared with the general Stacking integration technology, the designed AE_Stacking integration learning method can automatically select models with better classification performance from the candidate classifiers as strong base classifiers, thereby enhancing the diversity of base classifiers. Then increase the weight of the base learner with high classification performance, and reduce the weight of the base learner with relatively low classification performance, so that the meta-learner can pay more attention to the base learners with stronger performance. Compared with direct input, the AE_Stacking method improves performance by automatically selecting the best performing base learners, thereby increasing diversity and allowing the meta-learner to focus on more powerful models, and therefore enhancing integration performance. Future research could be integrated with more multimodal data to develop comprehensive predictive models.</p>
<p>Finally, by statistically analyzing the features selected for high frequency in each single-modal as well as two multimodal feature fusions process, we identified a subset of stable brain region features that consistently belonged to the distinguished circle of the top 10 features across the entirety of our experimental datasets. The FD attribute pertaining to the left cerebral cortex&#x2019;s 6r region [lh 6r (FD)] and the GI attribute linked to the right hemisphere&#x2019;s 46 region [rh 46 (GI)] demonstrated remarkable stability, suggesting their potential as robust imaging biomarkers for PD. Interestingly, the most discriminative features in our model were based on advanced measurements of cortical geometry&#x2014;specifically FD and GI&#x2014;rather than traditional metrics like GMV, CT, and SA. This suggests that cortical surface geometry measurements may provide more sensitive biomarkers for PD diagnosis. This observation suggests that measurements of cortical surface geometry may offer more sensitive biomarkers for the diagnosis of PD. The heightened discriminative power of FD and GI could be attributed to their intrinsic sensitivity to the nuanced changes in cortical structure that are often subtle or overlooked by traditional volumetric methods. Specifically, fractal dimension captures the complexity and intricacy of the cortical folding patterns, while the gyrification index quantifies the degree of cortical folding, providing insights into the brain&#x2019;s structural integrity and potential deviations caused by pathological processes. In addition, the changes observed in these cortical features are also reflect the combined effects of GM, WM, and the overall dynamics of cortical connectivity. Together, these elements provide a microscopic view of the structural alterations in the brains of individuals with PD.</p>
<p>Our genetic probe into SNP data unveiled that the most discriminative loci were predominantly situated within three genes: SNCA, with SNPs rs356181 and rs2736990; VPS52, with SNPs rs213202 and rs213204; and SLC14A1, with SNP rs7238033. The SNCA gene, in particular, has been recognized as an autosomal dominant culprit in PD (<xref ref-type="bibr" rid="B18">Jia et al., 2022</xref>). The rs356181 variant within the SNCA locus has been found to regulate the influence of cerebrospinal fluid-related biomarkers on cortical atrophy and is associated with diminished cognitive function in PD patients (<xref ref-type="bibr" rid="B33">Sampedro et al., 2018</xref>). The PACRG gene has been reported to be a bidirectional promoter shared with the Parkin/Park2 gene (<xref ref-type="bibr" rid="B23">Liu et al., 2021</xref>). The SLC14A1 gene exhibits altered expression in PD-affected individuals and is conjectured to be instrumental in the regulation of A&#x03B2; production and apoptosis, potentially contributing to the pathological hallmarks of Alzheimer&#x2019;s disease, PD, and muscular dystrophy (<xref ref-type="bibr" rid="B32">Recabarren and Alarcon, 2017</xref>). Genetic variation can affect the corresponding cell function, thereby changing the normal brain phenotype. Therefore, combining genes with brain imaging will help understand the abnormalities of brain structure and function and the role of gene expression risk factors in the progression of PD (<xref ref-type="bibr" rid="B13">Garc&#x00ED;a-Mar&#x00ED;n et al., 2023</xref>; <xref ref-type="bibr" rid="B54">Zang et al., 2023</xref>). In the future, clinical symptoms should be further combined to explore the association between genotype, brain phenotype and clinical phenotype through joint analysis of fusion imaging genes. In addition, the combination of machine learning or deep learning technology is expected to predict PD risk and possible clinical manifestations at the individual level. The identification of these stable imaging biomarkers and genetic loci holds significant promise for personalized treatment strategies.</p>
<p>While our methodology enhances PD diagnostic efficacy, it is essential to acknowledge its limitations. The PLS method, used for dimensionality reduction, may restrict analysis and interpretation of important fusion features. Moreover, our study&#x2019;s focus was specifically on the integration of genetic and MRI data for PD identification. While this approach has provided valuable insights, it also presents a limitation in terms of the breadth of data types considered. Future research should aim to expand the scope by incorporating additional imaging modalities, such as positron emission tomography (PET) or functional MRI (fMRI), which could offer different perspectives on the neurobiological changes associated with PD. In addition, genetic factors exhibit variation across different ethnic cultures. Ethnic heterogeneity is a further key determinant, influencing disparities in epidemiology, clinical manifestations and mortality. Therefore, it becomes necessary to take into account ethnic-cultural factors and more clinical manifestations to develop models that are both specific and sensitive to the unique genetic profiles present in diverse population. Finally, a growing number of genetic studies have demonstrated that there are disparities in the genetic mechanisms across different PD syndromes as well as in the severity of the disease (<xref ref-type="bibr" rid="B20">Koziorowski et al., 2021</xref>; <xref ref-type="bibr" rid="B26">Mart&#x00ED;nez Carrasco et al., 2023</xref>). This suggests that in the future, the multimodal fusion strategy of imaging and genetic data can also be applied to the differential diagnosis of PD and the evaluation and prediction of disease severity, thereby enhancing the accuracy and reliability of diagnosis and enabling the development of more refined and effective healthcare solutions.</p>
</sec>
<sec id="S5" sec-type="conclusion">
<title>5 Conclusion</title>
<p>In conclusion, the AE_Stacking model, trained with MRI and genetic data, demonstrates promising diagnostic values in detection of PD. By integrating multimodal data, the model has the potential to reveal complex patterns of disease progression. As the clinical sample size expands and data quality improves, this method is expected to be applied to more complex clinical tasks, such as staging disease progression, identifying high-risk populations, and supporting the differential diagnosis of related neurological disorders. Additionally, these consistent neuroimaging features and specific genetic variants identified highlight their potential as early diagnostic indicators for PD, while would also proffer new insights for personalized clinical interventions. Future research should focus on biological evaluations to demonstrate relevant neurobiological signals or markers and clarify the psychological or behavioral structures linked to specific brain pathways or regions, thereby strengthening the model&#x2019;s reliability.</p>
</sec>
</body>
<back>
<sec id="S6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/<xref ref-type="supplementary-material" rid="TS1">Supplementary material</xref>.</p>
</sec>
<sec id="S7" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by the Parkinson&#x2019;s Progression Markers Initiative (PPMI) database was used in this study. For up-to-date information on the study, visit [PPMI website] (<ext-link ext-link-type="uri" xlink:href="https://www.ppmi-info.org/">https://www.ppmi-info.org/</ext-link>). PPMI&#x2014;a public-private partnership&#x2014;is funded by the Michael J. Fox Foundation for Parkinson&#x2019;s Research and funding partners. The study protocol and informed consent forms are available upon request from the PPMI website. All participants provided informed consent in accordance with the ethical standards of the institutional and/or national research committee and with the 1964 Helsinki declaration and its later amendments or comparable ethical standards. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="S8" sec-type="author-contributions">
<title>Author contributions</title>
<p>YY: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Software, Validation, Visualization, Writing &#x2013; original draft. LH: Conceptualization, Investigation, Methodology, Validation, Writing &#x2013; review &#x0026; editing. YC: Data curation, Software, Supervision, Visualization, Writing &#x2013; review &#x0026; editing. WG: Funding acquisition, Supervision, Writing &#x2013; review &#x0026; editing. GL: Funding acquisition, Supervision, Writing &#x2013; review &#x0026; editing. YX: Supervision, Writing &#x2013; review &#x0026; editing. SN: Conceptualization, Supervision, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec id="S9" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This study has received funding by grant from the Clinical Research and Cultivation Project of Shanghai ShenKang Hospital Development Center (SHDC2022CRT025) and the Joint Research Development Project between Shenkang and United Imaging on Clinical Research and Translation (SKLY2022CRT402), Science and Technology Commission of Shanghai Municipality (23Y11907700), and the National Natural Science Foundation of China (82271286).</p>
</sec>
<sec id="S10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="S11">
<title>Generative AI statement</title>
<p>The authors declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec id="S12" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="S13" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fnagi.2025.1510192/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fnagi.2025.1510192/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.docx" id="TS1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="http://www.ppmi-info.org/dat">www.ppmi-info.org/dat</ext-link></p></fn>
<fn id="footnote2">
<label>2</label>
<p><ext-link ext-link-type="uri" xlink:href="https://ida.loni.usc.edu/pages/access/geneticData.jsp">https://ida.loni.usc.edu/pages/access/geneticData.jsp</ext-link></p></fn>
<fn id="footnote3">
<label>3</label>
<p><ext-link ext-link-type="uri" xlink:href="http://dbm.neuro.uni-jena.de/cat/">http://dbm.neuro.uni-jena.de/cat/</ext-link></p></fn>
<fn id="footnote4">
<label>4</label>
<p><ext-link ext-link-type="uri" xlink:href="https://www.fil.ion.ucl.ac.uk/spm/">https://www.fil.ion.ucl.ac.uk/spm/</ext-link></p></fn>
<fn id="footnote5">
<label>5</label>
<p><ext-link ext-link-type="uri" xlink:href="https://github.com/yyflib/Multimodal-ensemble-learning">https://github.com/yyflib/Multimodal-ensemble-learning</ext-link></p></fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alfradique-Dunham</surname> <given-names>I.</given-names></name> <name><surname>Al-Ouran</surname> <given-names>R.</given-names></name> <name><surname>von Coelln</surname> <given-names>R.</given-names></name> <name><surname>Blauwendraat</surname> <given-names>C.</given-names></name> <name><surname>Hill</surname> <given-names>E.</given-names></name> <name><surname>Luo</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Genome-Wide association study meta-analysis for Parkinson disease motor subtypes.</article-title> <source><italic>Neurol. Genet.</italic></source> <volume>7</volume>:<issue>e557</issue>.</citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ara&#x00FA;jo</surname> <given-names>H.</given-names></name> <name><surname>Smaili</surname> <given-names>S.</given-names></name> <name><surname>Morris</surname> <given-names>R.</given-names></name> <name><surname>Graham</surname> <given-names>L.</given-names></name> <name><surname>Das</surname> <given-names>J.</given-names></name> <name><surname>McDonald</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2023</year>). <article-title>Combination of clinical and gait measures to classify fallers and non-fallers in Parkinson&#x2019;s disease.</article-title> <source><italic>Sensors (Basel)</italic></source> <volume>23</volume>:<issue>4651</issue>.</citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Basaia</surname> <given-names>S.</given-names></name> <name><surname>Agosta</surname> <given-names>F.</given-names></name> <name><surname>Diez</surname> <given-names>I.</given-names></name> <name><surname>Bueichek</surname> <given-names>E.</given-names></name> <name><surname>Uquillas</surname> <given-names>F.</given-names></name> <name><surname>Delgado-Alvarado</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2022</year>). <article-title>Neurogenetic traits outline vulnerability to cortical disruption in Parkinson&#x2019;s disease.</article-title> <source><italic>Neuroimage Clin.</italic></source> <volume>33</volume>:<issue>102941</issue>. <pub-id pub-id-type="doi">10.1016/j.nicl.2022.102941</pub-id> <pub-id pub-id-type="pmid">35091253</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bi</surname> <given-names>X.</given-names></name> <name><surname>Hu</surname> <given-names>X.</given-names></name> <name><surname>Xie</surname> <given-names>Y.</given-names></name> <name><surname>Wu</surname> <given-names>H.</given-names></name></person-group> (<year>2021a</year>). <article-title>A novel CERNNE approach for predicting Parkinson&#x2019;s disease-associated genes and brain regions based on multimodal imaging genetics data.</article-title> <source><italic>Med. Image Anal.</italic></source> <volume>67</volume>:<issue>101830</issue>. <pub-id pub-id-type="doi">10.1016/j.media.2020.101830</pub-id> <pub-id pub-id-type="pmid">33096519</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bi</surname> <given-names>X.</given-names></name> <name><surname>Xing</surname> <given-names>Z.</given-names></name> <name><surname>Xu</surname> <given-names>R.</given-names></name> <name><surname>Hu</surname> <given-names>X.</given-names></name></person-group> (<year>2021b</year>). <article-title>An efficient WRF framework for discovering risk genes and abnormal brain regions in Parkinson&#x2019;s disease based on imaging genetics data.</article-title> <source><italic>J. Comput. Sci. Technol.</italic></source> <volume>36</volume> <fpage>361</fpage>&#x2013;<lpage>374</lpage>.</citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Blauwendraat</surname> <given-names>C.</given-names></name> <name><surname>Nalls</surname> <given-names>M. A.</given-names></name> <name><surname>Singleton</surname> <given-names>A. B.</given-names></name></person-group> (<year>2020</year>). <article-title>The genetic architecture of Parkinson&#x2019;s disease.</article-title> <source><italic>Lancet Neurol.</italic></source> <volume>19</volume> <fpage>170</fpage>&#x2013;<lpage>178</lpage>.</citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>P.</given-names></name> <name><surname>Cen</surname> <given-names>Z.</given-names></name> <name><surname>Liao</surname> <given-names>Y.</given-names></name> <name><surname>Lin</surname> <given-names>Z.</given-names></name> <name><surname>Luo</surname> <given-names>W.</given-names></name></person-group> (<year>2022</year>). <article-title>Early-onset Parkinson&#x2019;s disease with atypical molecular imaging abnormalities in a patient carrying the de novo PRKCG mutation.</article-title> <source><italic>Parkinsonism Relat. Disord.</italic></source> <volume>95</volume> <fpage>100</fpage>&#x2013;<lpage>102</lpage>. <pub-id pub-id-type="doi">10.1016/j.parkreldis.2022.01.020</pub-id> <pub-id pub-id-type="pmid">35091391</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chu</surname> <given-names>Y.</given-names></name> <name><surname>Dodiya</surname> <given-names>H.</given-names></name> <name><surname>Aebischer</surname> <given-names>P.</given-names></name> <name><surname>Olanow</surname> <given-names>C.</given-names></name> <name><surname>Kordower</surname> <given-names>J.</given-names></name></person-group> (<year>2009</year>). <article-title>Alterations in lysosomal and proteasomal markers in Parkinson&#x2019;s disease: Relationship to alpha-synuclein inclusions.</article-title> <source><italic>Neurobiol. Dis.</italic></source> <volume>35</volume> <fpage>385</fpage>&#x2013;<lpage>398</lpage>. <pub-id pub-id-type="doi">10.1016/j.nbd.2009.05.023</pub-id> <pub-id pub-id-type="pmid">19505575</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Davis</surname> <given-names>A.</given-names></name> <name><surname>Andruska</surname> <given-names>K.</given-names></name> <name><surname>Benitez</surname> <given-names>B.</given-names></name> <name><surname>Racette</surname> <given-names>B.</given-names></name> <name><surname>Perlmutter</surname> <given-names>J.</given-names></name> <name><surname>Cruchaga</surname> <given-names>C.</given-names></name></person-group> (<year>2016</year>). <article-title>Variants in GBA, SNCA, and MAPT influence Parkinson disease risk, age at onset, and progression.</article-title> <source><italic>Neurobiol. Aging</italic></source> <volume>37</volume>:<issue>e209.e1</issue>. <pub-id pub-id-type="doi">10.1016/j.neurobiolaging.2015.09.014</pub-id> <pub-id pub-id-type="pmid">26601739</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fan</surname> <given-names>L.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Zhuo</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>The human brainnetome atlas: A new brain atlas based on connectional architecture.</article-title> <source><italic>Cereb. Cortex</italic></source> <volume>26</volume> <fpage>3508</fpage>&#x2013;<lpage>3526</lpage>. <pub-id pub-id-type="doi">10.1093/cercor/bhw157</pub-id> <pub-id pub-id-type="pmid">27230218</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Farokhian</surname> <given-names>F.</given-names></name> <name><surname>Beheshti</surname> <given-names>I.</given-names></name> <name><surname>Sone</surname> <given-names>D.</given-names></name> <name><surname>Matsuda</surname> <given-names>H.</given-names></name></person-group> (<year>2017</year>). <article-title>Comparing CAT12 and VBM8 for detecting brain morphological abnormalities in temporal lobe epilepsy.</article-title> <source><italic>Front. Neurol.</italic></source> <volume>8</volume>:<issue>428</issue>. <pub-id pub-id-type="doi">10.3389/fneur.2017.00428</pub-id> <pub-id pub-id-type="pmid">28883807</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fernandez-Santiago</surname> <given-names>R.</given-names></name> <name><surname>Sharma</surname> <given-names>M.</given-names></name></person-group> (<year>2022</year>). <article-title>What have we learned from genome-wide association studies (GWAS) in Parkinson disease?</article-title> <source><italic>Ageing Res. Rev.</italic></source> <volume>79</volume>:<issue>101648</issue>.</citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Garc&#x00ED;a-Mar&#x00ED;n</surname> <given-names>L. M.</given-names></name> <name><surname>Reyes-P&#x00E9;rez</surname> <given-names>P.</given-names></name> <name><surname>Diaz-Torres</surname> <given-names>S.</given-names></name> <name><surname>Medina-Rivera</surname> <given-names>A.</given-names></name> <name><surname>Martin</surname> <given-names>N. G.</given-names></name> <name><surname>Mitchell</surname> <given-names>B. L.</given-names></name><etal/></person-group> (<year>2023</year>). <article-title>Shared molecular genetic factors influence subcortical brain morphometry and Parkinson&#x2019;s disease risk.</article-title> <source><italic>NPJ Parkinsons Dis.</italic></source> <volume>9</volume>:<issue>73</issue>. <pub-id pub-id-type="doi">10.1038/s41531-023-00515-y</pub-id> <pub-id pub-id-type="pmid">37164954</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ghani</surname> <given-names>M.</given-names></name> <name><surname>Lang</surname> <given-names>A. E.</given-names></name> <name><surname>Zinman</surname> <given-names>L.</given-names></name> <name><surname>Nacmias</surname> <given-names>B.</given-names></name> <name><surname>Sorbi</surname> <given-names>S.</given-names></name> <name><surname>Bessi</surname> <given-names>V.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Mutation analysis of patients with neurodegenerative disorders using NeuroX array.</article-title> <source><italic>Neurobiol. Aging</italic></source> <volume>36</volume> <fpage>545.e9</fpage>&#x2013;<lpage>14</lpage>.</citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Glasser</surname> <given-names>M. F.</given-names></name> <name><surname>Coalson</surname> <given-names>T. S.</given-names></name> <name><surname>Robinson</surname> <given-names>E. C.</given-names></name> <name><surname>Hacker</surname> <given-names>C.</given-names></name> <name><surname>Harwell</surname> <given-names>J.</given-names></name> <name><surname>Yacoub</surname> <given-names>E.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>A multi-modal parcellation of human cerebral cortex.</article-title> <source><italic>Nature</italic></source> <volume>536</volume> <fpage>171</fpage>&#x2013;<lpage>178</lpage>.</citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>H&#x00F6;glinger</surname> <given-names>G.</given-names></name> <name><surname>Adler</surname> <given-names>C.</given-names></name> <name><surname>Berg</surname> <given-names>D.</given-names></name> <name><surname>Klein</surname> <given-names>C.</given-names></name> <name><surname>Outeiro</surname> <given-names>T.</given-names></name> <name><surname>Poewe</surname> <given-names>W.</given-names></name><etal/></person-group> (<year>2024</year>). <article-title>A biological classification of Parkinson&#x2019;s disease: The SynNeurGe research diagnostic criteria.</article-title> <source><italic>Lancet Neurol.</italic></source> <volume>23</volume> <fpage>191</fpage>&#x2013;<lpage>204</lpage>.</citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iwaki</surname> <given-names>H.</given-names></name> <name><surname>Blauwendraat</surname> <given-names>C.</given-names></name> <name><surname>Leonard</surname> <given-names>H.</given-names></name> <name><surname>Liu</surname> <given-names>G.</given-names></name> <name><surname>Maple-Gr&#x00F8;dem</surname> <given-names>J.</given-names></name> <name><surname>Corvol</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Genetic risk of Parkinson disease and progression: An analysis of 13 longitudinal cohorts.</article-title> <source><italic>Neurol. Genet.</italic></source> <volume>5</volume>:<issue>e348</issue>.</citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jia</surname> <given-names>F.</given-names></name> <name><surname>Fellner</surname> <given-names>A.</given-names></name> <name><surname>Kumar</surname> <given-names>K. R.</given-names></name></person-group> (<year>2022</year>). <article-title>Monogenic Parkinson&#x2019;s disease: Genotype, phenotype, pathophysiology, and genetic testing.</article-title> <source><italic>Genes</italic></source> <volume>13</volume>:<issue>471</issue>.</citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>M.</given-names></name> <name><surname>Kim</surname> <given-names>J.</given-names></name> <name><surname>Lee</surname> <given-names>S.</given-names></name> <name><surname>Park</surname> <given-names>H.</given-names></name></person-group> (<year>2017</year>). <article-title>Imaging genetics approach to Parkinson&#x2019;s disease and its correlation with clinical score.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>7</volume>:<issue>46700</issue>.</citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koziorowski</surname> <given-names>D.</given-names></name> <name><surname>Figura</surname> <given-names>M.</given-names></name> <name><surname>Milanowski</surname> <given-names>&#x0141;M.</given-names></name> <name><surname>Szlufik</surname> <given-names>S.</given-names></name> <name><surname>Alster</surname> <given-names>P.</given-names></name> <name><surname>Madetko</surname> <given-names>N.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Mechanisms of neurodegeneration in various forms of Parkinsonism-similarities and differences.</article-title> <source><italic>Cells</italic></source> <volume>10</volume>:<issue>656</issue>. <pub-id pub-id-type="doi">10.3390/cells10030656</pub-id> <pub-id pub-id-type="pmid">33809527</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lei</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Huang</surname> <given-names>Z.</given-names></name> <name><surname>Liu</surname> <given-names>C.</given-names></name> <name><surname>Zhou</surname> <given-names>F.</given-names></name><etal/></person-group> (<year>2022</year>). <article-title>Gene-related Parkinson&#x2019;s disease diagnosis via feature-based multi-branch octave convolution network.</article-title> <source><italic>Comput. Biol. Med.</italic></source> <volume>148</volume>:<issue>105859</issue>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2022.105859</pub-id> <pub-id pub-id-type="pmid">35930956</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>G.</given-names></name> <name><surname>Bu</surname> <given-names>H.</given-names></name> <name><surname>Yang</surname> <given-names>M. Q.</given-names></name> <name><surname>Zeng</surname> <given-names>X.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name></person-group> (<year>2008</year>). <article-title>Selecting subsets of newly extracted features from PCA and PLS in microarray data analysis.</article-title> <source><italic>BMC Genomics</italic></source> <volume>9</volume>:<issue>S24</issue>. <pub-id pub-id-type="doi">10.1186/1471-2164-9-S2-S24</pub-id> <pub-id pub-id-type="pmid">18831790</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>T.</given-names></name> <name><surname>Zhao</surname> <given-names>H.</given-names></name> <name><surname>Jian</surname> <given-names>S.</given-names></name> <name><surname>Gong</surname> <given-names>S.</given-names></name> <name><surname>Li</surname> <given-names>S.</given-names></name> <name><surname>Ma</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Functional expression, purification and identification of interaction partners of PACRG.</article-title> <source><italic>Molecules</italic></source> <volume>26</volume>:<issue>2308</issue>. <pub-id pub-id-type="doi">10.3390/molecules26082308</pub-id> <pub-id pub-id-type="pmid">33923444</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luders</surname> <given-names>E.</given-names></name> <name><surname>Thompson</surname> <given-names>P. M.</given-names></name> <name><surname>Narr</surname> <given-names>K.</given-names></name> <name><surname>Toga</surname> <given-names>A.</given-names></name> <name><surname>Gaser</surname> <given-names>C. A.</given-names></name></person-group> (<year>2006</year>). <article-title>curvature-based approach to estimate local gyrification on the cortical surface.</article-title> <source><italic>Neuroimage</italic></source> <volume>29</volume> <fpage>1224</fpage>&#x2013;<lpage>1230</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroimage.2005.08.049</pub-id> <pub-id pub-id-type="pmid">16223589</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Makarious</surname> <given-names>M. B.</given-names></name> <name><surname>Leonard</surname> <given-names>H. L.</given-names></name> <name><surname>Vitale</surname> <given-names>D.</given-names></name> <name><surname>Iwaki</surname> <given-names>H.</given-names></name> <name><surname>Sargent</surname> <given-names>L.</given-names></name> <name><surname>Dadu</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2022</year>). <article-title>Multi-modality machine learning predicting Parkinson&#x2019;s disease.</article-title> <source><italic>npj Parkinson&#x2019;s Dis.</italic></source> <volume>8</volume>:<issue>35</issue>.</citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mart&#x00ED;nez Carrasco</surname> <given-names>A.</given-names></name> <name><surname>Real</surname> <given-names>R.</given-names></name> <name><surname>Lawton</surname> <given-names>M.</given-names></name> <name><surname>Hertfelder Reynolds</surname> <given-names>R.</given-names></name> <name><surname>Tan</surname> <given-names>M.</given-names></name> <name><surname>Wu</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2023</year>). <article-title>Genome-wide analysis of motor progression in parkinson disease.</article-title> <source><italic>Neurol. Genet.</italic></source> <volume>9</volume>:<issue>e200092</issue>.</citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Naimi</surname> <given-names>A. I.</given-names></name> <name><surname>Balzer</surname> <given-names>L. B.</given-names></name></person-group> (<year>2018</year>). <article-title>Stacked generalization: An introduction to super learning.</article-title> <source><italic>Eur. J. Epidemiol.</italic></source> <volume>33</volume> <fpage>459</fpage>&#x2013;<lpage>464</lpage>. <pub-id pub-id-type="doi">10.1007/s10654-018-0390-z</pub-id> <pub-id pub-id-type="pmid">29637384</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nalls</surname> <given-names>M. A.</given-names></name> <name><surname>Bras</surname> <given-names>J.</given-names></name> <name><surname>Hernandez</surname> <given-names>D. G.</given-names></name> <name><surname>Keller</surname> <given-names>M.</given-names></name> <name><surname>Majounie</surname> <given-names>E.</given-names></name> <name><surname>Renton</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>NeuroX, a fast and efficient genotyping platform for investigation of neurodegenerative diseases.</article-title> <source><italic>Neurobiol. Aging</italic></source> <volume>36</volume> <fpage>1605.e7</fpage>&#x2013;<lpage>12</lpage>.</citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nour</surname> <given-names>M.</given-names></name> <name><surname>Senturk</surname> <given-names>U.</given-names></name> <name><surname>Polat</surname> <given-names>K.</given-names></name></person-group> (<year>2023</year>). <article-title>Diagnosis and classification of Parkinson&#x2019;s disease using ensemble learning and 1D-PDCovNN.</article-title> <source><italic>Comput. Biol. Med.</italic></source> <volume>161</volume>:<issue>107031</issue>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.107031</pub-id> <pub-id pub-id-type="pmid">37211002</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pudjihartono</surname> <given-names>N.</given-names></name> <name><surname>Fadason</surname> <given-names>T.</given-names></name> <name><surname>Kempa-Liehr</surname> <given-names>A. W.</given-names></name> <name><surname>O&#x2019;Sullivan</surname> <given-names>J. A.</given-names></name></person-group> (<year>2022</year>). <article-title>review of feature selection methods for machine learning-based disease risk prediction.</article-title> <source><italic>Front. Bioinformatics</italic></source> <volume>29</volume>:<issue>27312</issue>. <pub-id pub-id-type="doi">10.3389/fbinf.2022.927312</pub-id> <pub-id pub-id-type="pmid">36304293</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Purcell</surname> <given-names>S.</given-names></name> <name><surname>Neale</surname> <given-names>B.</given-names></name> <name><surname>Todd-Brown</surname> <given-names>K.</given-names></name> <name><surname>Thomas</surname> <given-names>L.</given-names></name> <name><surname>Ferreira</surname> <given-names>M.</given-names></name> <name><surname>Bender</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>PLINK: A tool set for whole-genome association and population-based linkage analyses.</article-title> <source><italic>Am. J Hum. Genet.</italic></source> <volume>81</volume> <fpage>559</fpage>&#x2013;<lpage>575</lpage>.</citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Recabarren</surname> <given-names>D.</given-names></name> <name><surname>Alarcon</surname> <given-names>M.</given-names></name></person-group> (<year>2017</year>). <article-title>Gene networks in neurodegenerative disorders.</article-title> <source><italic>Life Sci.</italic></source> <volume>183</volume> <fpage>83</fpage>&#x2013;<lpage>97</lpage>.</citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sampedro</surname> <given-names>F.</given-names></name> <name><surname>Mar&#x00ED;n-Lahoz</surname> <given-names>J.</given-names></name> <name><surname>Mart&#x00ED;nez-Horta</surname> <given-names>S.</given-names></name> <name><surname>Pagonabarraga</surname> <given-names>J.</given-names></name> <name><surname>Kulisevsky</surname> <given-names>J.</given-names></name></person-group> (<year>2018</year>). <article-title>Cortical thinning associated with age and CSF biomarkers in early Parkinson&#x2019;s disease is modified by the SNCA rs356181 polymorphism.</article-title> <source><italic>Neurodegener. Dis.</italic></source> <volume>18</volume> <fpage>233</fpage>&#x2013;<lpage>238</lpage>. <pub-id pub-id-type="doi">10.1159/000493103</pub-id> <pub-id pub-id-type="pmid">30336481</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sandu</surname> <given-names>A.</given-names></name> <name><surname>Staff</surname> <given-names>R. T.</given-names></name> <name><surname>Mcneil</surname> <given-names>C. J.</given-names></name> <name><surname>Mustafa</surname> <given-names>N.</given-names></name> <name><surname>Ahearn</surname> <given-names>T.</given-names></name> <name><surname>Whalley</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Structural brain complexity and cognitive decline in late life&#x2014;a longitudinal study in the Aberdeen 1936 Birth Cohort.</article-title> <source><italic>Neuroimage</italic></source> <volume>100</volume> <fpage>558</fpage>&#x2013;<lpage>563</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroimage.2014.06.054</pub-id> <pub-id pub-id-type="pmid">24993896</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Seiger</surname> <given-names>R.</given-names></name> <name><surname>Ganger</surname> <given-names>S.</given-names></name> <name><surname>Kranz</surname> <given-names>G. S.</given-names></name> <name><surname>Hahn</surname> <given-names>A.</given-names></name> <name><surname>Lanzenberger</surname> <given-names>R.</given-names></name></person-group> (<year>2018</year>). <article-title>cortical thickness estimations of FreeSurfer and the CAT12 toolbox in patients with Alzheimer&#x2019;s disease and healthy controls.</article-title> <source><italic>J. Neuroimaging</italic></source> <volume>28</volume> <fpage>515</fpage>&#x2013;<lpage>523</lpage>.</citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Simon</surname> <given-names>N.</given-names></name> <name><surname>Friedman</surname> <given-names>J.</given-names></name> <name><surname>Hastie</surname> <given-names>T.</given-names></name> <name><surname>Tibshirani</surname> <given-names>R. A.</given-names></name></person-group> (<year>2013</year>). <article-title>Sparse-group lasso.</article-title> <source><italic>J. Comput. Graph. Stat.</italic></source> <volume>22</volume> <fpage>231</fpage>&#x2013;<lpage>245</lpage>.</citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>L.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Qian</surname> <given-names>Y.</given-names></name> <name><surname>Xu</surname> <given-names>C.</given-names></name> <name><surname>Zhang</surname> <given-names>G.</given-names></name> <name><surname>Tian</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Joint neighborhood entropy-based gene selection method with fisher score for tumor classification.</article-title> <source><italic>Appl. Intell.</italic></source> <volume>49</volume> <fpage>1245</fpage>&#x2013;<lpage>1259</lpage>.</citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Suuronen</surname> <given-names>I.</given-names></name> <name><surname>Airola</surname> <given-names>A.</given-names></name> <name><surname>Pahikkala</surname> <given-names>T.</given-names></name> <name><surname>Murtojarvi</surname> <given-names>M.</given-names></name> <name><surname>Kaasinen</surname> <given-names>V.</given-names></name> <name><surname>Railo</surname> <given-names>H.</given-names></name></person-group> (<year>2023</year>). <article-title>Budget-based classification of Parkinson&#x2019;s disease from resting state EEG.</article-title> <source><italic>IEEE J. Biomed. Health Inform.</italic></source> <volume>27</volume> <fpage>3740</fpage>&#x2013;<lpage>3747</lpage>. <pub-id pub-id-type="doi">10.1109/JBHI.2023.3235040</pub-id> <pub-id pub-id-type="pmid">37018586</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Szymczak</surname> <given-names>S.</given-names></name> <name><surname>Biernacka</surname> <given-names>J. M.</given-names></name> <name><surname>Cordell</surname> <given-names>H. J.</given-names></name> <name><surname>Gonz&#x00E1;lez-Recio</surname> <given-names>O.</given-names></name> <name><surname>K&#x00F6;nig</surname> <given-names>I.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Machine learning in genome-wide association studies.</article-title> <source><italic>Genet. Epidemiol.</italic></source> <volume>33</volume> <fpage>S51</fpage>&#x2013;<lpage>S57</lpage>.</citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thompson</surname> <given-names>P.</given-names></name> <name><surname>Jahanshad</surname> <given-names>N.</given-names></name> <name><surname>Schmaal</surname> <given-names>L.</given-names></name> <name><surname>Turner</surname> <given-names>J.</given-names></name> <name><surname>Winkler</surname> <given-names>A.</given-names></name> <name><surname>Thomopoulos</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2022</year>). <article-title>The enhancing NeuroImaging genetics through meta-analysis consortium: 10 Years of global collaborations in human brain mapping.</article-title> <source><italic>Hum. Brain Mapp.</italic></source> <volume>43</volume> <fpage>15</fpage>&#x2013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.1002/hbm.25672</pub-id> <pub-id pub-id-type="pmid">34612558</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tranchant</surname> <given-names>C.</given-names></name></person-group> (<year>2019</year>). <article-title>Introduction and classical environmental risk factors for Parkinson.</article-title> <source><italic>Rev. Neurol.</italic></source> <volume>175</volume> <fpage>650</fpage>&#x2013;<lpage>651</lpage>. <pub-id pub-id-type="doi">10.1016/j.neurol.2019.04.006</pub-id> <pub-id pub-id-type="pmid">31227125</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tsukita</surname> <given-names>K.</given-names></name> <name><surname>Sakamaki-Tsukita</surname> <given-names>H.</given-names></name> <name><surname>Kaiser</surname> <given-names>S.</given-names></name> <name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Messa</surname> <given-names>M.</given-names></name> <name><surname>Serrano-Fernandez</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2023</year>). <article-title>High-Throughput CSF proteomics and machine learning to identify proteomic signatures for Parkinson disease development and progression.</article-title> <source><italic>Neurology</italic></source> <volume>101</volume> <fpage>e1434</fpage>&#x2013;<lpage>e1447</lpage>. <pub-id pub-id-type="doi">10.1212/WNL.0000000000207725</pub-id> <pub-id pub-id-type="pmid">37586882</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>van Nuenen</surname> <given-names>B.</given-names></name> <name><surname>van Eimeren</surname> <given-names>T.</given-names></name> <name><surname>van der Vegt</surname> <given-names>J.</given-names></name> <name><surname>Buhmann</surname> <given-names>C.</given-names></name> <name><surname>Klein</surname> <given-names>C.</given-names></name> <name><surname>Bloem</surname> <given-names>B.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Mapping preclinical compensation in Parkinson&#x2019;s disease: An imaging genomics approach.</article-title> <source><italic>Mov. Disord.</italic></source> <volume>24</volume> <fpage>S703</fpage>&#x2013;<lpage>S710</lpage>. <pub-id pub-id-type="doi">10.1002/mds.22635</pub-id> <pub-id pub-id-type="pmid">19877238</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vitorio</surname> <given-names>R.</given-names></name> <name><surname>Mancini</surname> <given-names>M.</given-names></name> <name><surname>Carlson-Kuhta</surname> <given-names>P.</given-names></name> <name><surname>Horak</surname> <given-names>F.</given-names></name> <name><surname>Shah</surname> <given-names>V.</given-names></name></person-group> (<year>2023</year>). <article-title>Should we use both clinical and mobility measures to identify fallers in Parkinson&#x2019;s disease?</article-title> <source><italic>Parkinsonism Relat. Disord.</italic></source> <volume>106</volume>:<issue>105235</issue>.</citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>A.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>G.</given-names></name></person-group> (<year>2022</year>). <article-title>Ensemble feature selection for stable biomarker identification and cancer classification from microarray expression data.</article-title> <source><italic>Comput. Biol. Med.</italic></source> <volume>142</volume>:<issue>105208</issue>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2021.105208</pub-id> <pub-id pub-id-type="pmid">35016102</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>E.</given-names></name> <name><surname>Jia</surname> <given-names>Y.</given-names></name> <name><surname>Ya</surname> <given-names>Y.</given-names></name> <name><surname>Xu</surname> <given-names>J.</given-names></name> <name><surname>Mao</surname> <given-names>C.</given-names></name> <name><surname>Luo</surname> <given-names>W.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Patterns of Sulcal depth and cortical thickness in Parkinson&#x2019;s disease.</article-title> <source><italic>Brain Imaging Behav.</italic></source> <volume>15</volume> <fpage>2340</fpage>&#x2013;<lpage>2346</lpage>.</citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wei</surname> <given-names>Y.</given-names></name> <name><surname>Bai</surname> <given-names>L.</given-names></name> <name><surname>Bai</surname> <given-names>J.</given-names></name></person-group> (<year>2023</year>). <article-title>The function of Golgi apparatus in LRRK2-associated Parkinson&#x2019;s disease.</article-title> <source><italic>Front. Mol. Neurosci.</italic></source> <volume>16</volume>:<issue>1097633</issue>. <pub-id pub-id-type="doi">10.3389/fnmol.2023.1097633</pub-id> <pub-id pub-id-type="pmid">36896008</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wissemann</surname> <given-names>W. T.</given-names></name> <name><surname>Hill-Burns</surname> <given-names>E. M.</given-names></name> <name><surname>Zabetian</surname> <given-names>C. P.</given-names></name> <name><surname>Factor</surname> <given-names>S.</given-names></name> <name><surname>Patsopoulos</surname> <given-names>N.</given-names></name> <name><surname>Hoglund</surname> <given-names>B.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Association of Parkinson disease with structural and regulatory variants in the HLA region.</article-title> <source><italic>Am. J. Hum. Genet.</italic></source> <volume>93</volume> <fpage>984</fpage>&#x2013;<lpage>993</lpage>.</citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Won</surname> <given-names>J. H.</given-names></name> <name><surname>Kim</surname> <given-names>M.</given-names></name> <name><surname>Youn</surname> <given-names>J.</given-names></name> <name><surname>Park</surname> <given-names>H.</given-names></name></person-group> (<year>2020</year>). <article-title>Prediction of age at onset in parkinson&#x2019;s disease using objective specific neuroimaging genetics based on a sparse canonical correlation analysis.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>10</volume>:<issue>11662</issue>. <pub-id pub-id-type="doi">10.1038/s41598-020-68301-x</pub-id> <pub-id pub-id-type="pmid">32669683</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Won</surname> <given-names>J.</given-names></name> <name><surname>Kim</surname> <given-names>M.</given-names></name> <name><surname>Park</surname> <given-names>B.</given-names></name> <name><surname>Youn</surname> <given-names>J.</given-names></name> <name><surname>Park</surname> <given-names>H.</given-names></name></person-group> (<year>2019</year>). <article-title>Effectiveness of imaging genetics analysis to explain degree of depression in Parkinson&#x2019;s disease.</article-title> <source><italic>PLoS One</italic></source> <volume>14</volume>:<issue>e0211699</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0211699</pub-id> <pub-id pub-id-type="pmid">30742647</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>E.</given-names></name> <name><surname>Ambati</surname> <given-names>A.</given-names></name> <name><surname>Andersen</surname> <given-names>M. S.</given-names></name> <name><surname>Krohn</surname> <given-names>L.</given-names></name> <name><surname>Estiar</surname> <given-names>M.</given-names></name> <name><surname>Saini</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Fine mapping of the HLA locus in Parkinson&#x2019;s disease in Europeans.</article-title> <source><italic>npj Parkinson&#x2019;s Dis.</italic></source> <volume>7</volume>:<issue>84</issue>.</citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Cai</surname> <given-names>G.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Hong</surname> <given-names>W.</given-names></name><etal/></person-group> (<year>2022</year>). <article-title>Evaluating white matter alterations in Parkinson&#x2019;s disease-related parkin S/N167 mutation carriers using tract-based spatial statistics.</article-title> <source><italic>Quant. Imaging Med. Surg.</italic></source> <volume>12</volume> <fpage>4272</fpage>&#x2013;<lpage>4285</lpage>. <pub-id pub-id-type="doi">10.21037/qims-21-1007</pub-id> <pub-id pub-id-type="pmid">35919057</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>Q.</given-names></name> <name><surname>Zhang</surname> <given-names>S.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Xiao</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Comprehensive analysis of core genes and key pathways in Parkinson&#x2019;s disease.</article-title> <source><italic>Am. J. Transl. Res.</italic></source> <volume>12</volume>:<issue>5630</issue>.</citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zang</surname> <given-names>Z.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Song</surname> <given-names>T.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Nie</surname> <given-names>B.</given-names></name> <name><surname>Mei</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2023</year>). <article-title>Association between gene expression and functional-metabolic architecture in Parkinson&#x2019;s disease.</article-title> <source><italic>Hum. Brain Mapp.</italic></source> <volume>44</volume> <fpage>5387</fpage>&#x2013;<lpage>5401</lpage>. <pub-id pub-id-type="doi">10.1002/hbm.26443</pub-id> <pub-id pub-id-type="pmid">37605831</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Xu</surname> <given-names>D.</given-names></name> <name><surname>Hao</surname> <given-names>K.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>W.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>FS&#x2013;GBDT: Identification multicancer-risk module via a feature selection algorithm by integrating Fisher score and GBDT.</article-title> <source><italic>Brief. Bioinform.</italic></source> <volume>22</volume>:<issue>bbaa189</issue>. <pub-id pub-id-type="doi">10.1093/bib/bbaa189</pub-id> <pub-id pub-id-type="pmid">34020547</pub-id></citation></ref>
</ref-list>
</back>
</article>