<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Neurosci.</journal-id>
<journal-title>Frontiers in Neuroscience</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Neurosci.</abbrev-journal-title>
<issn pub-type="epub">1662-453X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fnins.2024.1394234</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Neuroscience</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Adaptive spatial-temporal neural network for ADHD identification using functional fMRI</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Qiu</surname> <given-names>Bo</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2669792/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Qianqian</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1639225/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Xizhi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Wenyang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Shao</surname> <given-names>Wei</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1901081/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Wang</surname> <given-names>Mingliang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2548979/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>School of Computer Science, Nanjing University of Information Science and Technology</institution>, <addr-line>Nanjing</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Radiology and BRIC, University of North Carolina at Chapel Hill</institution>, <addr-line>Chapel Hill, NC</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics</institution>, <addr-line>Nanjing</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>Nanjing Xinda Institute of Safety and Emergency Management</institution>, <addr-line>Nanjing</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Feng Liu, Tianjin Medical University General Hospital, China</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Shijie Zhao, Northwestern Polytechnical University, China</p>
<p>Kangcheng Wang, Shandong Normal University, China</p>
<p>Zheyi Zhou, Beijing Normal University, China</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Mingliang Wang <email>wml489&#x00040;nuist.edu.cn</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>30</day>
<month>05</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>18</volume>
<elocation-id>1394234</elocation-id>
<history>
<date date-type="received">
<day>01</day>
<month>03</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>15</day>
<month>05</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2024 Qiu, Wang, Li, Li, Shao and Wang.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Qiu, Wang, Li, Li, Shao and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Computer aided diagnosis methods play an important role in Attention Deficit Hyperactivity Disorder (ADHD) identification. Dynamic functional connectivity (dFC) analysis has been widely used for ADHD diagnosis based on resting-state functional magnetic resonance imaging (rs-fMRI), which can help capture abnormalities of brain activity. However, most existing dFC-based methods only focus on dependencies between two adjacent timestamps, ignoring global dynamic evolution patterns. Furthermore, the majority of these methods fail to adaptively learn dFCs. In this paper, we propose an adaptive spatial-temporal neural network (ASTNet) comprising three modules for ADHD identification based on rs-fMRI time series. Specifically, we first partition rs-fMRI time series into multiple segments using non-overlapping sliding windows. Then, adaptive functional connectivity generation (AFCG) is used to model spatial relationships among regions-of-interest (ROIs) with adaptive dFCs as input. Finally, we employ a temporal dependency mining (TDM) module which combines local and global branches to capture global temporal dependencies from the spatially-dependent pattern sequences. Experimental results on the ADHD-200 dataset demonstrate the superiority of the proposed ASTNet over competing approaches in automated ADHD classification.</p></abstract>
<kwd-group>
<kwd>dynamic functional connectivity</kwd>
<kwd>temporal dependency</kwd>
<kwd>local and global evolution patterns</kwd>
<kwd>adaptive learning</kwd>
<kwd>fMRI</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content></contract-sponsor>
<counts>
<fig-count count="3"/>
<table-count count="4"/>
<equation-count count="10"/>
<ref-count count="45"/>
<page-count count="12"/>
<word-count count="8082"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Brain Imaging Methods</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>1 Introduction</title>
<p>Attention Deficit Hyperactivity Disorder (ADHD), with an incidence rate of 7.2% (Thomas et al., <xref ref-type="bibr" rid="B28">2015</xref>), has been the most prevalent psychiatric disorder among adolescents. Individuals affected by ADHD often commonly encounter difficulties in behavior management, hyperactivity, and maintaining attention or focus. However, due to complex pathological mechanisms of ADHD, most current diagnosis methods for ADHD primarily rely on clinical behavioral observations, which may be subjective. Undoubtedly, computer aided diagnosis methods provides a more objective and comprehensive assessment, aiming to help enhance accuracy and efficiency of ADHD diagnosis.</p>
<p>Resting-state functional magnetic resonance imaging (rs-fMRI), which can capture changes in blood flow in response to stimulation, has emerged as a valuable tool for diagnosing diverse psychiatric diseases (Damoiseaux, <xref ref-type="bibr" rid="B7">2012</xref>; Jie et al., <xref ref-type="bibr" rid="B15">2014a</xref>; Wang et al., <xref ref-type="bibr" rid="B34">2019a</xref>; Wang M. et al., <xref ref-type="bibr" rid="B33">2022</xref>). Functional connectivities (FCs), derived from the rs-fMRI, provide insights into quantifying the temporal correlation of functional activation across different brain regions. FCs are usually defined by the correlation (i.e., Pearson correlation) between blood-oxygen-level-dependent (BOLD) signals. In recent years, researchers have designed various learning-based computer-aided diagnostic methods for ADHD analysis and they have observed that ADHD patients exhibit abnormal FCs between ROIs. These abnormal FCs can serve as potential biomarkers for clinical diagnosis of ADHD. Previous FC-based methods were usually conducted with the assumption that FC remains constant during fMRI recording. Recently, more and more studies have confirmed that brain activity is actually dynamic (Arieli et al., <xref ref-type="bibr" rid="B1">1996</xref>; Makeig et al., <xref ref-type="bibr" rid="B25">2004</xref>; Onton et al., <xref ref-type="bibr" rid="B26">2006</xref>), and analysis based on this can reveal changes in FCs over time (Du et al., <xref ref-type="bibr" rid="B11">2018</xref>; Zhang et al., <xref ref-type="bibr" rid="B44">2021</xref>). These changes can help us understand how cognitive states evolve over time, which is critical for better understanding the pathology of brain diseases. For this reason, there has been a shift toward dynamic connectivity analysis in recent efforts (Bahrami et al., <xref ref-type="bibr" rid="B2">2021</xref>; Wang Z. et al., <xref ref-type="bibr" rid="B38">2022</xref>; Yang et al., <xref ref-type="bibr" rid="B40">2022</xref>).</p>
<p>Specifically, most dFC-based methods can be roughly categorized into two groups: (1) conventional machine learning methods (Wang et al., <xref ref-type="bibr" rid="B37">2017</xref>; Vergara et al., <xref ref-type="bibr" rid="B30">2018</xref>; Feng et al., <xref ref-type="bibr" rid="B13">2022</xref>) and (2) deep learning methods (Wang et al., <xref ref-type="bibr" rid="B32">2019b</xref>; Yan et al., <xref ref-type="bibr" rid="B39">2019</xref>; Lin et al., <xref ref-type="bibr" rid="B23">2022</xref>). Previous machine learning methods first extract features manually and then feed them into subsequent prediction models. These approaches take fMRI feature learning and downstream model training as independent processes, possibly leading to suboptimal model performance. In contrast, deep learning methods usually perform feature learning and downstream prediction tasks in an end-to-end manner, which can learn task-oriented discriminative fetatures to facilitate ADHD identification. By automatically learning features from the dFC network, deep learning methods provide a cohesive framework for feature learning and classification. Considering that the functional connectivity network can be mathematically modeled as a graph, graph convolutional network (GCN), renowned for their effectiveness in processing the graph data, has been widely used in FC analysis. However, it is worth noting that many GCN methods are designed based on predefined FCs, which hinders the adaptive learning of interactions between different brain ROIs. Furthermore, most dFC-based methods only focus on temporal dependencies between adjacent timestamps, ignoring important global dynamic evolution.</p>
<p>To solve this issue, we propose a novel adaptive spatial-temporal neural network (ASTNet) that can not only adaptively learn functional connectivities between brain ROIs but also mine global temporal dependencies in dFCs. As illustrated in <xref ref-type="fig" rid="F1">Figure 1</xref>, the proposed ASTNet consists of three components, i.e., the partition of rs-fMRI time series, adaptive functional connectivity generation, and temporal dependency mining. Specifically, we first divide the rs-fMRI time series into multiple segments using non-overlapping sliding windows to characterize the temporal variability of fMRI time series. After that, for each time-series segment, we design an adaptive functional connectivity generation (AFCG) module that first adaptively learns FCs between ROIs and then use GCN to capture topological information of brain network. Finally, a temporal dependency mining (TDM) module which integrates local and global branches, is proposed to capture temporal dependencies from the spatially-dependent pattern sequences. Within the TDM module, the global branch investigates variations in individual points within the FC structure, such as the emergence or disappearance and the strengthening or weakening of connections, which is referred to as spatial variation. Meanwhile, the local branch examines temporal changes between dFCs, known as temporal variation. To further obtain subject-level representation, we concatenate the generated features from these two branches, followed by a fully connected layer for disease classification. Experimental results on 620 subjects in the ADHD-200 dataset demonstrate the effectiveness of our ASTNet in adaptive graph learning and temporal dependence mining. This demonstrates the importance and great potential of our model in ADHD identification, with great promise in practical applications.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>Overview of the proposed adaptive spatial-temporal neural network (ASTNet), including three components: <bold>(A)</bold> partitioning rs-fMRI time series into T segments via non-overlapping sliding windows, <bold>(B)</bold> adaptive functional connectivity generation (AFCG), where the adjacency matrix is first learned via adaptive graph learning (AGL) module for each time window and then fed into graph convolutional network (GCN), and <bold>(C)</bold> a temporal dependency mining module (TDM) to capture temporal dynamics across all time windows. With the output of the TDM, a fully-connected layer is further used for disease classification.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnins-18-1394234-g0001.tif"/>
</fig>
</sec>
<sec id="s2">
<title>2 Related work</title>
<sec>
<title>2.1 Static FC-based method</title>
<p>Conventional FC-based methods usually first extract handcrafted features from functional connectivity networks and then train a classifier (e.g., support vector machine, SVM) for disease prediction (Bai et al., <xref ref-type="bibr" rid="B3">2009</xref>; Jie et al., <xref ref-type="bibr" rid="B15">2014a</xref>,<xref ref-type="bibr" rid="B16">b</xref>; Plis et al., <xref ref-type="bibr" rid="B27">2014</xref>; Bi et al., <xref ref-type="bibr" rid="B4">2018</xref>). For example, Bi et al. (<xref ref-type="bibr" rid="B4">2018</xref>) designed a random SVM cluster method for AD identification. This method firstly randomly selected samples and FC features to establish multiple SVMs, and then employed an ensemble strategy for the final prediction. Jie et al. (<xref ref-type="bibr" rid="B15">2014a</xref>) extracted and integrated multiple properties of static FC networks (e.g., connectivity strength and local clustering coefficient) for diagnosing brain diseases and achieved better performance compared with single network measures. Even so, these methods usually rely on handcrafted feature representations for classification models, thereby possibly producing sub-optimal classification performance.</p>
<p>More recently, deep learning methods have been proposed to automatically learn data-driven features from dFC networks. These methods offer a unified framework for fMRI feature learning and brain disorder prediction, ultimately achieving better performance. For example, Liang et al. (<xref ref-type="bibr" rid="B22">2021</xref>) proposed a novel convolutional neural network combined with a prototype learning (CNNPL) framework to classify brain functional networks for the diagnosis of autism spectrum disorder. Specifically, it used traditional convolutional neural networks to extract high-level features from pre-defined FCs and further designed a prototype learning strategy to automatically learn prototypes of each category for ASD classification. Eslami et al. (<xref ref-type="bibr" rid="B12">2019</xref>) proposed to extract the lower dimensional feature representation of FCs using an autoencoder, followed by a single layer perceptron (SLP) for ASD identification. Kawahara et al. (<xref ref-type="bibr" rid="B17">2017</xref>) developed three distinct convolutional layers&#x02014;edge-to-edge (E2E), edge-to-node (E2N), and node-to-graph layer (N2G)&#x02014;to capture the spatial characteristics of structural brain connectivity for cognitive and motor developmental score prediction in premature infants. Due to the graph-structured nature of brain functional networks, graph neural network (GNN), which can learn expressive graph representations, have shown significant potential in FC-based brain disease diagnosis. For example, Ktena et al. (<xref ref-type="bibr" rid="B19">2018</xref>) proposed learning a graph similarity metric using a siamese graph convolutional neural network for ASD classification. Yao et al. (<xref ref-type="bibr" rid="B41">2021</xref>) developed a mutual multi-scale triplet graph convolutional network for brain disorder diagnosis using functional or structural connectivity. Li et al. (<xref ref-type="bibr" rid="B20">2020</xref>) designed an ROI-aware graph convolutional layer that leveraged fMRI&#x00027;s topological and functional information for ASD diagnosis.</p>
<p>These deep learning methods greatly improve the efficiency and classification/regression performance in FC-based analysis due to their end-to-end architecture. However, these methods mainly study static patterns of brain networks, thereby ignoring the dynamic characteristics of brain FCs. Besides, GNN-based methods generally take a fixed graph structure as input, whose reliability remains to be discussed.</p>
</sec>
<sec>
<title>2.2 Dynamic FC-based method</title>
<p>Several dynamic functional analysis methods have recently been proposed for brain disease classification (Wang et al., <xref ref-type="bibr" rid="B32">2019b</xref>, <xref ref-type="bibr" rid="B35">2023</xref>; Yan et al., <xref ref-type="bibr" rid="B39">2019</xref>; Gadgil et al., <xref ref-type="bibr" rid="B14">2020</xref>; Lin et al., <xref ref-type="bibr" rid="B23">2022</xref>; Liu et al., <xref ref-type="bibr" rid="B24">2022</xref>; Liang et al., <xref ref-type="bibr" rid="B21">2023</xref>). For example, Wang et al. (<xref ref-type="bibr" rid="B32">2019b</xref>) proposed a spatial-temporal convolutional-recurrent neural network (STNet) for Alzheimer&#x00027;s disease progression prediction using rs-fMRI time series. Specifically, a convolutional component was first employed to construct the FC within each time-series segment. Then, the long short-term memory (LSTM) units were used to model the temporal dynamics patterns of these successive FCs. Finally, a fully connected layer is used to perform disease progression prediction. Lin et al. (<xref ref-type="bibr" rid="B23">2022</xref>) developed a convolutional recurrent neural network (CRNN) for dynamic FCs analysis and automated brain disease diagnosis. In this method, a sequence of pre-constructed FC networks was input into three convolutional layers to extract temporal features, and an LSTM layer was used to capture temporal information from multiple time segments, followed by three fully connected layers for brain disease classification. To take advantage of spatio-temporal information of fMRI data, Yan et al. (<xref ref-type="bibr" rid="B39">2019</xref>) designed a multi-scale RNN framework to classify schizophrenia. Specifically, stacked convolution layers were used to extract different scale features, followed by a two-layer stacked Gated Recurrent Unit (GRU) to mine dynamic information conveyed in fMRI series. Gadgil et al. (<xref ref-type="bibr" rid="B14">2020</xref>) trained a spatio-temporal graph convolutional network (ST-GCN) on each segment of the BOLD time series to predict gender and age. In this method, a positive and symmetric &#x0201C;edge importance&#x0201D; matrix was first integrated to determine the importance of spatial graph edges. Then, three layers of ST-GC units were used to perform spatial graph convolution, followed by a fully connected layer for final prediction. Liang et al. (<xref ref-type="bibr" rid="B21">2023</xref>) proposed a self-supervised multi-task learning model for detecting AD progression, in which a masked map auto-encoder and temporal contrast learning were jointly pre-trained to capture the structural and evolutionary features of longitudinal brain networks. Liu et al. (<xref ref-type="bibr" rid="B24">2022</xref>) proposed a method based on nested residual convolutional denoising autoencoder (NRCDAE) and convolutional gated recurrent unit (GRU) for ADHD diagnosis. Specifically, the NRCDAE was used to reduce the spatial dimension of rs-fMRI and extract the 3D spatial features. Then, the 3D convolutional GRU was adopted to extract the spatial and temporal features simultaneously for classification. Although existing dynamic FC-based methods consider the temporal dynamics in the prediction of disease progression, those methods fail to capture the global temporal changing patterns of the whole brain (i.e., the longitudinal network-level patterns).</p>
</sec>
</sec>
<sec id="s3">
<title>3 Materials and method</title>
<p>In this section, we introduce the materials used in this work, the proposed method, as well as implementation details.</p>
<sec>
<title>3.1 Material</title>
<sec>
<title>3.1.1 Data acquisition</title>
<p>We use the ADHD-200 dataset to validate the effectiveness of the proposed method. The ADHD-200 dataset includes 973 subjects collected from eight different imaging sites. Specifically, the dataset contains 362 ADHD patients, 585 normal controls (NC), and 26 undiagnosed subjects and can be accessed from the NeuroImaging Tools &#x00026; Resource Collaboratory (NITRC) website.<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref> Each participant&#x00027;s data in the ADHD-200 dataset consists of a resting-state functional MRI scan, a structural MRI scan, and the corresponding phenotypic information. Note that ADHD patients in the ADHD-200 dataset are further categorized into three subtypes: ADHD-Combined, ADHD-Hyperactive/Impulsive, and ADHD-Inattentive. To simplify the binary classification task, all subtypes in the ADHD-200 dataset are uniformly labeled as 1. During the ADHD-200 Global Competition, the ADHD-200 dataset is divided into a training set and a test set, each with corresponding phenotypic information. The numbers of subjects are 768 and 197, respectively. In this paper, we also follow this division in our experiments for a fair comparison. Note that in our performance evaluation, we exclude 26 subjects without released labels in the test set. Furthermore, we also discard subjects from the Pitt and Washu imaging sites in our study because their training sets only contained normal control (NC) subjects. Thus, a total of 620 subjects are used in this study, including 340 ADHD patients and 280 NCs. The detailed demographic information of involved subjects and data partition for experiments are provided in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Demographic information and data partition of the studied subjects from ADHD-200 dataset.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Item</bold></th>
<th valign="top" align="center"><bold>PKU</bold></th>
<th valign="top" align="center"><bold>NYU</bold></th>
<th valign="top" align="center"><bold>OHSU</bold></th>
<th valign="top" align="center"><bold>NI</bold></th>
<th valign="top" align="center"><bold>KKI</bold></th>
<th valign="top" align="center"><bold>Total</bold></th>
</tr>
</thead>
<tbody>
<tr style="background-color:#dee1e1">
<td valign="top" align="left" colspan="7"><bold>Training dataset</bold></td>
</tr>
<tr>
<td valign="top" align="left">Number</td>
<td valign="top" align="center">194</td>
<td valign="top" align="center">216</td>
<td valign="top" align="center">79</td>
<td valign="top" align="center">48</td>
<td valign="top" align="center">83</td>
<td valign="top" align="center">620</td>
</tr>
<tr>
<td valign="top" align="left">NC</td>
<td valign="top" align="center">116</td>
<td valign="top" align="center">98</td>
<td valign="top" align="center">42</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">61</td>
<td valign="top" align="center">340</td>
</tr>
<tr>
<td valign="top" align="left">ADHD</td>
<td valign="top" align="center">78</td>
<td valign="top" align="center">118</td>
<td valign="top" align="center">37</td>
<td valign="top" align="center">25</td>
<td valign="top" align="center">22</td>
<td valign="top" align="center">280</td>
</tr>
<tr>
<td valign="top" align="left">Gender (M/F)</td>
<td valign="top" align="center">144/50</td>
<td valign="top" align="center">140/76</td>
<td valign="top" align="center">43/36</td>
<td valign="top" align="center">31/17</td>
<td valign="top" align="center">46/37</td>
<td valign="top" align="center">404/216</td>
</tr>
<tr style="background-color:#dee1e1">
<td valign="top" align="left" colspan="7"><bold>Test dataset</bold></td>
</tr>
<tr>
<td valign="top" align="left">Number</td>
<td valign="top" align="center">51</td>
<td valign="top" align="center">41</td>
<td valign="top" align="center">34</td>
<td valign="top" align="center">25</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">162</td>
</tr>
<tr>
<td valign="top" align="left">NC</td>
<td valign="top" align="center">27</td>
<td valign="top" align="center">12</td>
<td valign="top" align="center">28</td>
<td valign="top" align="center">14</td>
<td valign="top" align="center">8</td>
<td valign="top" align="center">89</td>
</tr>
<tr>
<td valign="top" align="left">ADHD</td>
<td valign="top" align="center">24</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">73</td>
</tr>
<tr>
<td valign="top" align="left">Gender (M/F)</td>
<td valign="top" align="center">32/19</td>
<td valign="top" align="center">28/13</td>
<td valign="top" align="center">17/17</td>
<td valign="top" align="center">12/13</td>
<td valign="top" align="center">10/1</td>
<td valign="top" align="center">99/63</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>M, male; F, female.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>3.1.2 Data pre-processing</title>
<p>All resting-state fMRI data used in our study were preprocessed by the C-PAC pipeline.<xref ref-type="fn" rid="fn0002"><sup>2</sup></xref> This pipeline includes several processing steps such as skull stripping, slice timing correction, head motion realignment, intensity normalization, band-pass filtering (0.01&#x02013;0.1 Hz), and the regression of white matter, cerebrospinal fluid, and motion parameters. To minimize the impact of head motion on our results, we first removed fMRI data from participants whose heads moved more than 2.0 mm in any direction or 2&#x000B0; in any rotation. After that, we performed structural skull stripping and then mapped the remaining fMRI data to the Montreal Neurological Institute (MNI) space. A 6mm Gaussian kernel was used to spatially smooth the rs-fMRI data. Note that further our analysis excluded subjects with a frame displacement exceeding 2.5 min (FD &#x0003E; 0.5). Finally, the automated anatomical labeling (AAL) template was used to extract the mean rs-fMRI time series for a set of 116 pre-defined ROIs.</p>
</sec>
</sec>
<sec>
<title>3.2 Method</title>
<p>As illustrated in <xref ref-type="fig" rid="F1">Figure 1</xref>, the proposed ASTNet includes <italic>(1)</italic> partition of rs-fMRI time series, <italic>(2)</italic> adaptive functional connectivity generation, and <italic>(3)</italic> temporal dependency mining.</p>
<sec>
<title>3.2.1 Partition of rs-fMRI time series</title>
<p>To characterize the temporal variability of fMRI series, we first employ the sliding window strategy to partition all rs-fMRI time series into <italic>T</italic> non-overlapping windows, each with a fixed window size <italic>L</italic>. Specifically, for each window, we represent the segmented time series as <inline-formula><mml:math id="M1"><mml:msub><mml:mrow><mml:mi>G</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msup><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msubsup><mml:mrow><mml:mi>v</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>v</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:mo>.</mml:mo><mml:mo>.</mml:mo><mml:mo>.</mml:mo><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>v</mml:mi></mml:mrow><mml:mrow><mml:mi>N</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mo>&#x022A4;</mml:mo></mml:mrow></mml:msup><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:mi>N</mml:mi><mml:mo>&#x000D7;</mml:mo><mml:mi>L</mml:mi></mml:mrow></mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mo>&#x022EF;</mml:mo><mml:mspace width="0.3em" class="thinspace"/><mml:mo>,</mml:mo><mml:mi>T</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>, where the <italic>t</italic> represents the <italic>t</italic>-th segments and <italic>N</italic> denotes the number of nodes. In our paper, the window size <italic>L</italic> is set as 20. For PKU, NYU, OHSU, NI, and KKI sites, the lengths of extracted fMRI time series are 231, 171, 72, 256, and 119 and the corresponding TR is 2.5, 1.96, 2, 2.5, and 2s, respectively. Since each site has a different scanning time (<italic>i.e</italic>., length of fMRI time series), we obtain <italic>T</italic> = 5, <italic>T</italic> = 12, <italic>T</italic> = 8, <italic>T</italic> = 3, and <italic>T</italic> = 11 segments for these five sites, respectively. The reason for choosing such window length is that window sizes around 30&#x02013;60 s can provide a robust estimation of the dynamic fluctuations in rs-fMRI data (Wang et al., <xref ref-type="bibr" rid="B31">2021</xref>). For each subject, the time-series segment S will be considered as the input of the proposed network.</p>
</sec>
<sec>
<title>3.2.2 Adaptive functional connectivity generation</title>
<p>In order to better explore the spatial relationships between brain regions, we employ an adaptive graph learning (AGL) strategy to learn functional connectivities, instead of relying on prior knowledge or manual labor. We define a non-negative function <xref ref-type="disp-formula" rid="E1">Equation (1)</xref> with a learnable weight vector <inline-formula><mml:math id="M2"><mml:mi>&#x003C9;</mml:mi><mml:mo>=</mml:mo><mml:msup><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>&#x003C9;</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>&#x003C9;</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mo>.</mml:mo><mml:mo>.</mml:mo><mml:mo>.</mml:mo><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>&#x003C9;</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>d</mml:mi></mml:mrow><mml:mrow><mml:mi>e</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:msup><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mi>e</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002A;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:math></inline-formula> based on the graph data <italic>G</italic><sub><italic>t</italic></sub> for each window to represent the connection between any two brain nodes <italic>x</italic><sub><italic>m</italic></sub> and <italic>x</italic><sub><italic>n</italic></sub>:</p>
<disp-formula id="E1"><label>(1)</label><mml:math id="M3"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>m</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>g</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>m</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>e</mml:mi><mml:mi>x</mml:mi><mml:mi>p</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>R</mml:mi><mml:mi>E</mml:mi><mml:mi>L</mml:mi><mml:mi>U</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msup><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>&#x003C9;</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:msup><mml:mo>|</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>m</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mstyle displaystyle="false"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>N</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:mi>e</mml:mi><mml:mi>x</mml:mi><mml:mi>p</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>R</mml:mi><mml:mi>E</mml:mi><mml:mi>L</mml:mi><mml:mi>U</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msup><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>&#x003C9;</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:msup><mml:mo>|</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>m</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow></mml:mfrac><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <italic>x</italic><sub><italic>i</italic></sub> represents the fMRI data of the <italic>i</italic>-th brain ROI, nonlinear activation function ReLU guarantees <italic>A</italic><sub><italic>mn</italic></sub> is nonnegative, and the softmax operation normalizes each row of <italic>A</italic>. To introduce prior knowledge, we incorporate the following regularization loss <xref ref-type="disp-formula" rid="E2">Equation (2)</xref>:</p>
<disp-formula id="E2"><label>(2)</label><mml:math id="M4"><mml:mrow><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>g</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>p</mml:mi><mml:mi>h</mml:mi><mml:mo>&#x0005F;</mml:mo><mml:mi>l</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>r</mml:mi><mml:mi>n</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>g</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle='true'><mml:munderover><mml:mo>&#x02211;</mml:mo><mml:mrow><mml:mi>m</mml:mi><mml:mo>,</mml:mo><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:mo stretchy="false">&#x0007C;</mml:mo></mml:mstyle><mml:mo stretchy="false">&#x0007C;</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mi>m</mml:mi></mml:msub><mml:mo>&#x02212;</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mi>n</mml:mi></mml:msub><mml:mo stretchy="false">&#x0007C;</mml:mo><mml:msubsup><mml:mo stretchy="false">&#x0007C;</mml:mo><mml:mn>2</mml:mn><mml:mn>2</mml:mn></mml:msubsup><mml:msub><mml:mstyle mathvariant='bold' mathsize='normal'><mml:mi>A</mml:mi></mml:mstyle><mml:mrow><mml:mi>m</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mo>&#x003BB;</mml:mo><mml:mo stretchy="false">&#x0007C;</mml:mo><mml:mo stretchy="false">&#x0007C;</mml:mo><mml:mstyle mathvariant='bold' mathsize='normal'><mml:mi>A</mml:mi></mml:mstyle><mml:mo stretchy="false">&#x0007C;</mml:mo><mml:msubsup><mml:mo stretchy="false">&#x0007C;</mml:mo><mml:mi>F</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>.</mml:mo></mml:mrow></mml:math></disp-formula>
<p>That is, the smaller distance ||<italic>x</italic><sub><italic>m</italic></sub>&#x02212;<italic>x</italic><sub><italic>n</italic></sub>||<sub>2</sub> between <italic>x</italic><sub><italic>m</italic></sub> and <italic>x</italic><sub><italic>n</italic></sub>, the larger <italic>A</italic><sub><italic>mn</italic></sub> is. This regularization allows nodes/ROIs with similar features to have greater connection weights. Furthermore, considering the sparsity nature of brain functional network (<italic>i.e</italic>., brain graph), the second term is introduced, where &#x003BB;&#x02267;0 is a regularization parameter. Through the proposed graph learning mechanism, we obtain an adaptively learned adjacency matrix <italic>A</italic> used for the subsequent graph convolution operation <xref ref-type="disp-formula" rid="E3">Equation (3)</xref>:</p>
<disp-formula id="E3"><label>(3)</label><mml:math id="M5"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msup><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>H</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>l</mml:mi><mml:mo>&#x0002B;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msup><mml:mo>=</mml:mo><mml:mi>&#x003C3;</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>A</mml:mi></mml:mstyle><mml:msup><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>H</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>l</mml:mi></mml:mrow></mml:msup><mml:msup><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>W</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>l</mml:mi></mml:mrow></mml:msup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <italic>H</italic><sup><italic>l</italic></sup> is the time series signal characteristics of brain network nodes in layer <italic>l</italic>, <italic>A</italic> represents the learned adjacency matrix, <italic>W</italic> denotes a learnable weight matrix, and &#x003C3; is the activation function. The fundamental principle underlying graph convolution is the iterative aggregation of neighboring node information to update the feature representation of the central node. Finally, we get the functional connectivity matrix by <xref ref-type="disp-formula" rid="E4">Equation (4)</xref>:</p>
<disp-formula id="E4"><label>(4)</label><mml:math id="M6"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>S</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msup><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>H</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>l</mml:mi></mml:mrow></mml:msup><mml:msup><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msup><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>H</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>l</mml:mi></mml:mrow></mml:msup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mi>T</mml:mi></mml:mrow></mml:msup><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <italic>H</italic><sup><italic>l</italic></sup> denotes the final node features generated from GCN and <italic>S</italic><sub><italic>t</italic></sub> measures the degree of second-order dependency between ROIs.</p>
</sec>
<sec>
<title>3.2.3 Temporal dependency mining</title>
<p>To capture temporal dynamic information within fMRI series across temporal dimension, we design the temporal dependency mining (TDM) module which includes two parallel architectures, i.e., local and global branches. The local branch is designed to explore the temporal evolution of adjacent sliding windows, providing insights into fine-grained changes. The global branch is used to capture the evolutionary patterns across all timestamps. Details are introduced below.</p>
<sec>
<title>3.2.3.1 Local temporal dependency mining branch</title>
<p>To capture the local temporal dependency of dFCs, we propose the use of a bi-directional Gated Recurrent Unit (BiGRU), which is a type of recurrent neural network (RNN). Different from unidirectional GRU, the bidirectional GRU (BiGRU) consists of two GRUs, where one GRU scans the sequence from the beginning to the end, while the other scans the sequence from the end to the beginning. This bidirectional structure enables the model to consider both past and future information simultaneously, thereby enhancing the accuracy of feature information capture in sequential data. Mathematically, the BiGRU can be represented as <xref ref-type="disp-formula" rid="E5">Equation (5)</xref>:</p>
<disp-formula id="E5"><label>(5)</label><mml:math id="M7"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>G</mml:mi><mml:mi>R</mml:mi><mml:mi>U</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mover class="overrightarrow"><mml:mrow><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:mrow><mml:mo>&#x020D7;</mml:mo></mml:mover></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x02295;</mml:mo><mml:mi>G</mml:mi><mml:mi>R</mml:mi><mml:mi>U</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mover class="overleftarrow"><mml:mrow><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:mrow><mml:mo>&#x020D6;</mml:mo></mml:mover></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <italic>x</italic><sub><italic>t</italic></sub> denotes initial temporal state, <italic>h</italic><sub><italic>t</italic></sub> represents hidden state, and arrows represent different operation directions. The GRU is composed of two gating mechanisms, including the reset gate and the update gate. The calculation formulas for the GRU unit are as follows:</p>
<disp-formula id="E6"><label>(6)</label><mml:math id="M8"><mml:mtable class="eqnarray" columnalign="right"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>&#x003C3;</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>W</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>z</mml:mi></mml:mrow></mml:msub><mml:mo>&#x000B7;</mml:mo><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>&#x003C3;</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>W</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>r</mml:mi></mml:mrow></mml:msub><mml:mo>&#x000B7;</mml:mo><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mi>h</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>W</mml:mi></mml:mstyle><mml:mo>&#x000B7;</mml:mo><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002A;</mml:mo><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>-</mml:mo><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x0002A;</mml:mo><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002A;</mml:mo><mml:msub><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>.</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>In <xref ref-type="disp-formula" rid="E6">Equation (6)</xref>, the reset gate operation <italic>r</italic><sub><italic>t</italic></sub> controls the fusion of new input information with the previous &#x0201C;memory,&#x0201D; and the update gate <italic>z</italic><sub><italic>t</italic></sub> influences the amount of information to be forgotten from the previous moment. In the second formula, <italic>W</italic><sub><italic>r</italic></sub> denotes a weight matrix, while <italic>r</italic><sub><italic>t</italic></sub> is obtained by linearly transforming the concatenated matrix of <italic>x</italic><sub><italic>t</italic></sub> and <italic>h</italic><sub><italic>t</italic>&#x02212;1</sub>. This value is subsequently utilized in the third formula to update the hidden information of the candidate. For ease of understanding:</p>
<disp-formula id="E7"><label>(7)</label><mml:math id="M9"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>t</mml:mi><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mi>h</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>W</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>x</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02299;</mml:mo><mml:msub><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:msub><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>W</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>h</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>b</mml:mi></mml:mrow><mml:mrow><mml:mi>h</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>In <xref ref-type="disp-formula" rid="E7">Equation (7)</xref> the value of <italic>r</italic><sub><italic>t</italic></sub> in the update gate influences the amount of information to be forgotten from the previous moment, as indicated by the Hadamard product with <italic>h</italic><sub><italic>t</italic>&#x02212;1</sub>. The first equation represents the update gate, while the fourth equation controls the extent to which previous information is incorporated into the current state. In the fourth equation, the closer <italic>z</italic><sub><italic>t</italic></sub> is to 1, the more information it retains or &#x0201C;remembers.&#x0201D; (1&#x02212;<italic>z</italic><sub><italic>t</italic></sub>)&#x0002A;<italic>h</italic><sub><italic>t</italic>&#x02212;1</sub> selectively forgets parts of the previous hidden state, while <inline-formula><mml:math id="M10"><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002A;</mml:mo><mml:msub><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>h</mml:mi></mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> selectively incorporates candidate hidden states. In summary, the fourth equation combines forgetting some information passed down from <italic>h</italic><sub><italic>t</italic>&#x02212;1</sub> with incorporating relevant information from the current node, resulting in the final memory representation <italic>h</italic><sub><italic>t</italic></sub>. In this way, we can obtain the final local time dependency information between adjacent time-sliced fMRI data by recursively transmitting hidden state information.</p>
</sec>
<sec>
<title>3.2.3.2 Global temporal dependency mining branch</title>
<p>We employ global attention to capture the global temporal dependency of dFCs. For each segment, we first employ an MLP to extract potential hidden abnormal connection information, ensuring that spatial information at different stages remains intact despite the temporal interactions. Specifically, the upper triangular data of the symmetric matrix is first converted to a one-dimensional vector <italic>x</italic> and then fed into the MLP to obtain the characteristic information <italic>F</italic><sub><italic>t</italic></sub>, represented as <xref ref-type="disp-formula" rid="E8">Equation (8)</xref>:</p>
<disp-formula id="E8"><label>(8)</label><mml:math id="M11"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>F</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>g</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow><mml:mrow><mml:mi>M</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>w</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <italic>w</italic><sub><italic>i</italic></sub> is learnable weight and <italic>g</italic> is activation function. Then, we incorporate a global attention mechanism to capture temporal dependencies between dynamic FCs. The formula of global attention is defined as <xref ref-type="disp-formula" rid="E9">Equation (9)</xref>:</p>
<disp-formula id="E9"><label>(9)</label><mml:math id="M12"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>M</mml:mi></mml:mstyle></mml:mrow><mml:mrow><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>F</mml:mi></mml:mstyle></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mi>&#x003C3;</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>M</mml:mi><mml:mi>L</mml:mi><mml:mi>P</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>A</mml:mi><mml:mi>v</mml:mi><mml:mi>g</mml:mi><mml:mi>P</mml:mi><mml:mi>o</mml:mi><mml:mi>o</mml:mi><mml:mi>l</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>F</mml:mi></mml:mstyle></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x0002B;</mml:mo><mml:mi>M</mml:mi><mml:mi>L</mml:mi><mml:mi>P</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>M</mml:mi><mml:mi>a</mml:mi><mml:mi>x</mml:mi><mml:mi>P</mml:mi><mml:mi>o</mml:mi><mml:mi>o</mml:mi><mml:mi>l</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mstyle mathvariant="bold-italic"><mml:mi>F</mml:mi></mml:mstyle></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <italic>F</italic> represents the function connectivity information processed by previous MLP on T segments and &#x003C3; denotes the sigmoid function. Note that the MLP weights are shared for both inputs and the ReLU activation function. The obtained attention weights (i.e., <italic>M</italic><sub><italic>c</italic></sub>(<italic>F</italic>)) are used to combine information from multiple windows, resulting in a final feature representation expressed as a one-dimensional vector denoted as <inline-formula><mml:math id="M13"><mml:mover accent="false" class="mml-overline"><mml:mrow><mml:mi>d</mml:mi></mml:mrow><mml:mo accent="true">&#x000AF;</mml:mo></mml:mover></mml:math></inline-formula>. Finally, we concatenate the output of global and local branches, yielding a one-dimensional vector. Then, this one-dimensional vector is fed into three fully connected layers to obtain the final classification result.</p>
<p>It&#x00027;s worth noting that, to avoid the trivial solution (i.e., &#x003C9; = (0, 0,&#x02026;, 0), which is due to minimizing the above loss function <italic>L</italic><sub><italic>graph</italic>_<italic>learning</italic></sub> independently, we utilize it as a regularized term to form the final loss function <xref ref-type="disp-formula" rid="E10">Equation (10)</xref>:</p>
<disp-formula id="E10"><label>(10)</label><mml:math id="M14"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>L</mml:mi></mml:mrow><mml:mrow><mml:mi>l</mml:mi><mml:mi>o</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi>L</mml:mi></mml:mrow><mml:mrow><mml:mi>c</mml:mi><mml:mi>r</mml:mi><mml:mi>o</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi><mml:mtext>_</mml:mtext><mml:mi>e</mml:mi><mml:mi>n</mml:mi><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>o</mml:mi><mml:mi>p</mml:mi><mml:mi>y</mml:mi></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>L</mml:mi></mml:mrow><mml:mrow><mml:mi>g</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>p</mml:mi><mml:mi>h</mml:mi><mml:mtext>_</mml:mtext><mml:mi>l</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>r</mml:mi><mml:mi>n</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>g</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <italic>L</italic><sub><italic>cross</italic>_<italic>entropy</italic></sub> denotes the categorical_crossentropy of the classification task.</p>
</sec>
</sec>
</sec>
<sec>
<title>3.3 Implementation</title>
<p>We implement the framework using Python 3.7 and Pytorch library. For each subject, the adjacency matrix is constructed via our designed AGL strategy, where a random initialization technique initializes the vector &#x003C9; according to a normal distribution. Subsequently, the graph convolution process comprises three GCN layers, followed by batch normalization, ReLU activation, and a dropout rate of 0.5. We then perform a dot product operation on the representation generated from the GCN layers to construct symmetric matrices describing the degree of correlation between nodes. To reduce dimensionality, we flatten the upper triangular portion of each matrix into a vector. This vector is subsequently fed into an MLP consisting of three fully connected layers. Additionally, we incorporate two dropout layers to mitigate overfitting.</p>
<p>Subsequently, we employ an attention mechanism to obtain attention weights and compute the weighted sum of the vector data. This process yields a 32-dimensional vector, which serves as the final output of the global branch. For local analysis using the BiGRU, we perform experiments with different numbers of units, specifically 4, 16, and 64, for training data from various sites.</p>
</sec>
</sec>
<sec id="s4">
<title>4 Experiment and result analysis</title>
<sec>
<title>4.1 Methods for comparison</title>
<p>In the experiments, we compare our ASTNet model with the following eight methods, including the baseline methods and any other variants of the proposed method.</p>
<list list-type="order">
<list-item><p>MLP (Tolstikhin et al., <xref ref-type="bibr" rid="B29">2021</xref>): in this method, the static FC matrix for each subject is directly used as the input of the MLP model. Specifically, the MLP model comprises three fully-connected layers with hidden neurons of 1,024, 256, and 32, respectively.</p></list-item>
<list-item><p>AE (Wang et al., <xref ref-type="bibr" rid="B36">2014</xref>): auto-encoder (AE) is an unsupervised learning model that can learn a mapping supervised by input <italic>X</italic> itself. Specifically, AE extracts useful features from brain networks through bottleneck-like fully connected layers. The hidden layer dimension is determined by the data length in different sites.</p></list-item>
<list-item><p>GCN (Kipf and Welling, <xref ref-type="bibr" rid="B18">2016</xref>): this method first uses two layers of GCN based on Pearson correlation to update spatial correlation between ROIs where the data length in different sites determines dimensions. Then, the FCs, calculated from the dot product of node features, are used as the input to construct a three-layer MLP model with hidden neuron number of 1,024, 256, and 32, respectively.</p></list-item>
<list-item><p>AGL_s: in this method, FCs are learned by the adaptive method. Static adaptive graph learning (AGL_s) method replaces the Pearson correlation matrices with adaptive brain networks as the input. The network structure is the same as the previous MLP method.</p></list-item>
<list-item><p>BiGRU (Chung et al., <xref ref-type="bibr" rid="B6">2014</xref>): This method partitions fMRI data with a constant length of 20 time points. For each segment, we build a functional connectivity matrix. Then, these matrices are sent into the BiGRU model to study their temporal change information with different numbers of units, specifically 4, 16, and 64, for training data.</p></list-item>
<list-item><p>AGL_d: dynamic adaptive graph learning method (AGL_d) implies adaptive learning to construct adjacency matrices on each segment. Then, the TDM module is used to analyze time-varying information between different sliding window data. Specifically, the local branch adopts a two layers BiGRU with 4 units to make the final classification, and the Global branch explores temporal and spatial variability using global attention where MLP has three hidden layers 1,024, 256, and 32, respectively, and the ratio is set as 3 in attention mechanism.</p></list-item>
</list>
<p>Note that, we both have static and dynamic experiments for method MLP and GCN, named as MLP_s, MLP_d, GCN_s, and GCN_d. And we apply global branch in the TDM to mine temporal dependency for MLP_d and adopt the whole TDM module for GCN_d classification.</p>
</sec>
<sec>
<title>4.2 Experiment settings</title>
<p>We evaluate the proposed method on five different sites (i.e., PKU, NYU, OHSU, NI, and KKI) of the ADHD database based on rs-fMRI data. We divide data on each site into training data and test data, following Global Competition. The test set is unseen during the training stage.</p>
<p>To evaluate classification performance, three metrics are used, including accuracy (ACC), sensitivity (SEN), and specificity (SPE). These metrics are defined as follows: ACC = (TP &#x0002B; TN)/(TP &#x0002B; TN &#x0002B; FP &#x0002B; FN), SEN = TP/(TP &#x0002B; FN), SPE = TN/(TN &#x0002B; FP). Here, TP, TN, FP, and FN represent true positive, true negative, false positive, and false negative values, respectively. Higher values for these metrics indicate better classification performance.</p>
</sec>
<sec>
<title>4.3 Classification performance</title>
<p>The quantitative results achieved by different methods in the binary classification tasks are reported in <xref ref-type="table" rid="T2">Table 2</xref>. From <xref ref-type="table" rid="T2">Table 2</xref>, one could have three main observations.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Accuracy (ACC) values achieved by our proposed ASTNet and eight competing methods on five sites (<italic>i.e</italic>., PKU, NYU, OHSU, NI, and KKI) of ADHD-200 dataset.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Method</bold></th>
<th valign="top" align="center" colspan="3"><bold>PKU</bold></th>
<th valign="top" align="center" colspan="3"><bold>NYU</bold></th>
<th valign="top" align="center" colspan="3"><bold>OHSU</bold></th>
<th valign="top" align="center" colspan="3"><bold>NI</bold></th>
<th valign="top" align="center" colspan="3"><bold>KKI</bold></th>
<th valign="top" align="center"><bold>Avg-ACC</bold></th>
</tr>
</thead>
<tbody>
<tr style="background-color:#919498;color:#ffffff">
<td/>
<td valign="top" align="center"><bold>ACC</bold></td>
<td valign="top" align="center"><bold>SEN</bold></td>
<td valign="top" align="center"><bold>SPE</bold></td>
<td valign="top" align="center"><bold>ACC</bold></td>
<td valign="top" align="center"><bold>SEN</bold></td>
<td valign="top" align="center"><bold>SPE</bold></td>
<td valign="top" align="center"><bold>ACC</bold></td>
<td valign="top" align="center"><bold>SEN</bold></td>
<td valign="top" align="center"><bold>SPE</bold></td>
<td valign="top" align="center"><bold>ACC</bold></td>
<td valign="top" align="center"><bold>SEN</bold></td>
<td valign="top" align="center"><bold>SPE</bold></td>
<td valign="top" align="center"><bold>ACC</bold></td>
<td valign="top" align="center"><bold>SEN</bold></td>
<td valign="top" align="center"><bold>SPE</bold></td>
<td/>
</tr>
<tr>
<td valign="top" align="left">MLP_s</td>
<td valign="top" align="center">70.6</td>
<td valign="top" align="center">85.2</td>
<td valign="top" align="center">54.2</td>
<td valign="top" align="center">48.8</td>
<td valign="top" align="center">58.3</td>
<td valign="top" align="center">44.8</td>
<td valign="top" align="center">67.6</td>
<td valign="top" align="center">75.0</td>
<td valign="top" align="center">33.3</td>
<td valign="top" align="center">64.0</td>
<td valign="top" align="center">78.6</td>
<td valign="top" align="center">45.5</td>
<td valign="top" align="center">81.8</td>
<td valign="top" align="center">100.0</td>
<td valign="top" align="center">33.3</td>
<td valign="top" align="center">66.6</td>
</tr>
<tr>
<td valign="top" align="left">AE</td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center">88.9</td>
<td valign="top" align="center">41.7</td>
<td valign="top" align="center">53.7</td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center">48.3</td>
<td valign="top" align="center">70.6</td>
<td valign="top" align="center">82.1</td>
<td valign="top" align="center">16.7</td>
<td valign="top" align="center">64.0</td>
<td valign="top" align="center">78.6</td>
<td valign="top" align="center">45.5</td>
<td valign="top" align="center">72.7</td>
<td valign="top" align="center">75.0</td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center">65.5</td>
</tr>
<tr>
<td valign="top" align="left">GCN_s</td>
<td valign="top" align="center">64.7</td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center">62.5</td>
<td valign="top" align="center">61.0</td>
<td valign="top" align="center">75.0</td>
<td valign="top" align="center">55.2</td>
<td valign="top" align="center">70.6</td>
<td valign="top" align="center">78.6</td>
<td valign="top" align="center">33.3</td>
<td valign="top" align="center">68</td>
<td valign="top" align="center">71.4</td>
<td valign="top" align="center">63.6</td>
<td valign="top" align="center">72.7</td>
<td valign="top" align="center">100.0</td>
<td valign="top" align="center">0.0</td>
<td valign="top" align="center">67.4</td>
</tr>
<tr>
<td valign="top" align="left">AGL_s</td>
<td valign="top" align="center">68.6</td>
<td valign="top" align="center">74.1</td>
<td valign="top" align="center">62.5</td>
<td valign="top" align="center">70.7</td>
<td valign="top" align="center">58.3</td>
<td valign="top" align="center">75.9</td>
<td valign="top" align="center">82.4</td>
<td valign="top" align="center"><bold>96.4</bold></td>
<td valign="top" align="center">16.7</td>
<td valign="top" align="center">60.0</td>
<td valign="top" align="center">78.6</td>
<td valign="top" align="center">36.4</td>
<td valign="top" align="center">81.8</td>
<td valign="top" align="center">100.0</td>
<td valign="top" align="center">33.3</td>
<td valign="top" align="center">72.7</td>
</tr>
<tr>
<td valign="top" align="left">BiGRU</td>
<td valign="top" align="center">62.7</td>
<td valign="top" align="center">74.1</td>
<td valign="top" align="center">50.0</td>
<td valign="top" align="center">53.7</td>
<td valign="top" align="center">58.3</td>
<td valign="top" align="center">51.7</td>
<td valign="top" align="center">64.7</td>
<td valign="top" align="center">71.4</td>
<td valign="top" align="center">33.3</td>
<td valign="top" align="center">52.0</td>
<td valign="top" align="center">42.9</td>
<td valign="top" align="center"><bold>63.6</bold></td>
<td valign="top" align="center">72.7</td>
<td valign="top" align="center">87.5</td>
<td valign="top" align="center">33.3</td>
<td valign="top" align="center">61.2</td>
</tr>
<tr>
<td valign="top" align="left">MLP_d</td>
<td valign="top" align="center">70.6</td>
<td valign="top" align="center">88.9</td>
<td valign="top" align="center">50.0</td>
<td valign="top" align="center">48.8</td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center">41.4</td>
<td valign="top" align="center">73.5</td>
<td valign="top" align="center">82.1</td>
<td valign="top" align="center">33.3</td>
<td valign="top" align="center">56.0</td>
<td valign="top" align="center">71.4</td>
<td valign="top" align="center">36.4</td>
<td valign="top" align="center">72.7</td>
<td valign="top" align="center">87.5</td>
<td valign="top" align="center">33.3</td>
<td valign="top" align="center">64.3</td>
</tr>
<tr>
<td valign="top" align="left">GCN_d</td>
<td valign="top" align="center">64.7</td>
<td valign="top" align="center">74.1</td>
<td valign="top" align="center">54.2</td>
<td valign="top" align="center">70.7</td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center">72.4</td>
<td valign="top" align="center">73.5</td>
<td valign="top" align="center">85.7</td>
<td valign="top" align="center">16.7</td>
<td valign="top" align="center">68.0</td>
<td valign="top" align="center">92.9</td>
<td valign="top" align="center">36.4</td>
<td valign="top" align="center">72.7</td>
<td valign="top" align="center">100.0</td>
<td valign="top" align="center">0.0</td>
<td valign="top" align="center">69.9</td>
</tr>
<tr>
<td valign="top" align="left">AGL_d</td>
<td valign="top" align="center">70.6</td>
<td valign="top" align="center">81.5</td>
<td valign="top" align="center">58.3</td>
<td valign="top" align="center">70.7</td>
<td valign="top" align="center">58.3</td>
<td valign="top" align="center">75.9</td>
<td valign="top" align="center">76.5</td>
<td valign="top" align="center">89.3</td>
<td valign="top" align="center">16.7</td>
<td valign="top" align="center">68.0</td>
<td valign="top" align="center">85.7</td>
<td valign="top" align="center">45.5</td>
<td valign="top" align="center">81.8</td>
<td valign="top" align="center">87.5</td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center">73.5</td>
</tr>
<tr>
<td valign="top" align="left">ASTNet (ours)</td>
<td valign="top" align="center"><bold>74.5</bold></td>
<td valign="top" align="center"><bold>85.1</bold></td>
<td valign="top" align="center"><bold>62.5</bold></td>
<td valign="top" align="center"><bold>75.6</bold></td>
<td valign="top" align="center"><bold>75.0</bold></td>
<td valign="top" align="center"><bold>75.9</bold></td>
<td valign="top" align="center"><bold>85.3</bold></td>
<td valign="top" align="center">89.3</td>
<td valign="top" align="center"><bold>66.7</bold></td>
<td valign="top" align="center"><bold>76.0</bold></td>
<td valign="top" align="center"><bold>92.9</bold></td>
<td valign="top" align="center">54.5</td>
<td valign="top" align="center"><bold>90.9</bold></td>
<td valign="top" align="center"><bold>100.0</bold></td>
<td valign="top" align="center"><bold>66.7</bold></td>
<td valign="top" align="center"><bold>80.5</bold></td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>Avg-ACC, the average ACC across these five sites (%).</p>
<p>Best results are shown in bold.</p>
</table-wrap-foot>
</table-wrap>
<p>First, our proposed method and its variants (<italic>i.e</italic>., AGL_d and GCN_d) generally achieve better performance compared with the baseline methods (<italic>i.e</italic>., MLP, BiGRU, and Auto-Encoder) in the classification task. For example, in terms of ACC values, ASTNet achieved an improvement of 13.9%, compared with the best baseline method (with 66.6%) in ADHD classification. This demonstrates that our designed adaptive functional connectivity learning strategy and temporal dependency mining module can help extract more discriminative fMRI features, thus enhancing classification performance. Second, our proposed ASTNet and its variants outperform those methods without considering the temporal dynamics (e.g., with GCN_s and AGL_s) in terms of most metrics. In particular, the SEN values produced by our ASTNet in site PKU and NYU are 85.1 and 75.0%, which is higher than other methods. These results suggest that our TDM module can effectively capture dynamic changes in rs-fMRI time series. Finally, our ASTNet is superior to its variants (<italic>i.e</italic>., AGL_d and <italic>GCN</italic>_<italic>d</italic>). This result implies that the adaptive functional connectivity learning strategy and TDM module help boost the learning performance of ASTNet.</p>
</sec>
<sec>
<title>4.4 Interpretable analysis of the learned FCs</title>
<p>The proposed ASTNet can automatically learn dFCs in a data-driven manner, which differs from previous studies that rely on predefined FC networks (e.g., via Pearson&#x00027;s correlation). We now further analyze the FC networks learned by the proposed adaptive method. Specifically, as introduced in Section 3.2.2, the AFCG can learn new connectivity strength between each central node/ROI and all the remaining N-1 ROIs. Therefore, we can generate a fully connected FC network based on the learned connectivity vector. Given the size of the sliding window, different lengths of data will result in different numbers of segments. Taking PKU site as an example, we can construct <italic>K</italic> = 11 dynamic FC networks for each subject, with each network corresponding to a segment. Finally, using the standard t-test, we measure the group difference between ADHD and NC via p-values, with group difference matrices visualized in <xref ref-type="fig" rid="F2">Figure 2</xref>. For comparison, in <xref ref-type="fig" rid="F2">Figure 2</xref>, we also report the group difference of the stationary FC network that is constructed via measuring Pearson correlation coefficients between fMRI time series of pairwise brain ROIs. Note that the obtained <italic>p</italic>-values were binarized (i.e., setting <italic>p</italic>-values more than 0.05 to 1 and 0 otherwise) for clarity in <xref ref-type="fig" rid="F2">Figure 2</xref>. From <xref ref-type="fig" rid="F2">Figure 2</xref>, we have the following observations.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>Visualization of group difference matrices generated by our learned dynamic FC networks and static network. Note that <italic>p</italic>-values &#x0003E; 0.05 are set to 1 (shown in yellow), while those &#x02264;0.05 were set to 0 (shown in green). The <italic>F</italic><sup><italic>i</italic></sup>(<italic>i</italic> &#x0003D; 1, &#x02026;, 11) repesents the group difference matrices generated by the <italic>i</italic>-th segment.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnins-18-1394234-g0002.tif"/>
</fig>
<p><italic>First</italic>, from <italic>F</italic><sup><italic>i</italic></sup>, <italic>i</italic> &#x0003D; 1, &#x02026;, 11 in <xref ref-type="fig" rid="F2">Figure 2</xref>, we can observe that the group difference matrices generated by different segments exhibit significant differences, which further validates the temporal variability of brain networks. <italic>Second</italic>, by comparing our learned <italic>F</italic><sup><italic>i</italic></sup> and Static in <xref ref-type="fig" rid="F2">Figure 2</xref>, it can be found that the dynamic FC network learned by our ASTNet shows superiority over the pre-defined static network in identifying disease-related functional connectivities and ROIs. For example, Several ROIs, such as the anterior cingulate and paracingulate gyri node (ACG.L) in <italic>F</italic><sup>1</sup>, the superior parietal gyrus node (SPG.L) in <italic>F</italic><sup>6</sup>, and the cerebellum nodes in <italic>F</italic><sup>5</sup>, are detected by our dynamic FC networks in AD vs. NC classification. These findings aligns with previous AD-related studies, which further demonstrates the learned FCs by our ASTNet have good interpretability.</p>
</sec>
<sec>
<title>4.5 Comparison with state-of-the-art methods</title>
<p>We further compare the proposed ASTNet with seven state-of-the-art (SOTA) methods designed for ADHD analysis, including PCA-LDA (Dey et al., <xref ref-type="bibr" rid="B8">2012</xref>), EM-MI (Dou et al., <xref ref-type="bibr" rid="B10">2020</xref>), 3D CNN (Zou et al., <xref ref-type="bibr" rid="B45">2017</xref>), SASNI (Zhang et al., <xref ref-type="bibr" rid="B42">2017</xref>), SPAE (Cao et al., <xref ref-type="bibr" rid="B5">2023</xref>), STAAE (Dong et al., <xref ref-type="bibr" rid="B9">2020</xref>), and KD-Transformer (Zhang et al., <xref ref-type="bibr" rid="B43">2022</xref>). Note that all the methods use the standard training/test sets division by the data set. The classification results achieved by different methods are reported in <xref ref-type="table" rid="T3">Table 3</xref>, with the best results highlighted in bold. From <xref ref-type="table" rid="T3">Table 3</xref>, we can have the following findings.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Quoted results from literature on ADHD-200 dataset.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Method</bold></th>
<th valign="top" align="center"><bold>PKU</bold></th>
<th valign="top" align="center"><bold>NYU</bold></th>
<th valign="top" align="center"><bold>OHSU</bold></th>
<th valign="top" align="center"><bold>NI</bold></th>
<th valign="top" align="center"><bold>KKI</bold></th>
<th valign="top" align="center"><bold>Avg-ACC</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">PCA-LDA (Dey et al., <xref ref-type="bibr" rid="B8">2012</xref>)</td>
<td valign="top" align="center">62.7</td>
<td valign="top" align="center">70.7</td>
<td valign="top" align="center">73.5</td>
<td valign="top" align="center">72.0</td>
<td valign="top" align="center">72.7</td>
<td valign="top" align="center">70.3</td>
</tr>
<tr>
<td valign="top" align="left">EM-MI (Dou et al., <xref ref-type="bibr" rid="B10">2020</xref>)</td>
<td valign="top" align="center">70.6</td>
<td valign="top" align="center">63.4</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">81.8</td>
<td valign="top" align="center">70.4</td>
</tr>
<tr>
<td valign="top" align="left">3D CNN (Zou et al., <xref ref-type="bibr" rid="B45">2017</xref>)</td>
<td valign="top" align="center">63.0</td>
<td valign="top" align="center">70.5</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">72.8</td>
<td valign="top" align="center">66.0</td>
</tr>
<tr>
<td valign="top" align="left">SASNI (Zhang et al., <xref ref-type="bibr" rid="B42">2017</xref>)</td>
<td valign="top" align="center">74.5</td>
<td valign="top" align="center">70.7</td>
<td valign="top" align="center">79.4</td>
<td valign="top" align="center">72.0</td>
<td valign="top" align="center">63.6</td>
<td valign="top" align="center">72.0</td>
</tr>
<tr>
<td valign="top" align="left">SPAE (Cao et al., <xref ref-type="bibr" rid="B5">2023</xref>)</td>
<td valign="top" align="center">70.6</td>
<td valign="top" align="center">65.4</td>
<td valign="top" align="center">65.9</td>
<td valign="top" align="center">76.0</td>
<td valign="top" align="center">73.6</td>
<td valign="top" align="center">70.5</td>
</tr>
<tr>
<td valign="top" align="left">STAAE (Dong et al., <xref ref-type="bibr" rid="B9">2020</xref>)</td>
<td valign="top" align="center">79.5</td>
<td valign="top" align="center">82.2</td>
<td valign="top" align="center">75.4</td>
<td valign="top" align="center">63.7</td>
<td valign="top" align="center">76.6</td>
<td valign="top" align="center">75.5</td>
</tr>
<tr>
<td valign="top" align="left">KD-transformer (Zhang et al., <xref ref-type="bibr" rid="B43">2022</xref>)</td>
<td valign="top" align="center">70.6</td>
<td valign="top" align="center"><bold>82.9</bold></td>
<td valign="top" align="center">85.3</td>
<td valign="top" align="center">72.0</td>
<td valign="top" align="center">90.9</td>
<td valign="top" align="center">80.3</td>
</tr>
<tr>
<td valign="top" align="left">ASTNet (ours)</td>
<td valign="top" align="center"><bold>74.5</bold></td>
<td valign="top" align="center">75.6</td>
<td valign="top" align="center"><bold>85.3</bold></td>
<td valign="top" align="center"><bold>76.0</bold></td>
<td valign="top" align="center"><bold>90.9</bold></td>
<td valign="top" align="center"><bold>80.5</bold></td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>Best results are shown in bold (%).</p>
</table-wrap-foot>
</table-wrap>
<p><italic>First</italic>, the proposed ASTNet outperforms seven SOTA methods in ADHD classification task on the ADHD-200 dataset, which implies that our ASTNet can learn more discriminative features for ADHD identification. <italic>Second</italic>, Compared with static methods (<italic>i.e</italic>., PCA-LDA, 3D CNN, SASNI, and KD-Transformer), the methods (<italic>i.e</italic>., SPAE, STAAE, and KD-Transformer) that consider temporal dynamics in fMRI series achieves relatively better performance. This suggests that temporal information conveyed in fMRI series plays an important role in distinguishing ADHD patients from normal controls.</p>
<p><italic>Third</italic>, the ACC of our ASTNet achieves an improvement of 5% compared with the STAAE that designs a spatiotemporal attention auto-encoder long-distance dependency in time. This finding further demonstrates the superiority of our ASTNet in dynamic brain network learning and brain disorder classification.</p>
</sec>
</sec>
<sec sec-type="discussion" id="s5">
<title>5 Discussion</title>
<p>In this section, we explore the influence of different sliding window sizes, compare the proposed method with its degraded variants, and discuss several limitations of the current work and future work.</p>
<sec>
<title>5.1 Influence of sliding window size</title>
<p>In main experiments, we divide fMRI series using sliding window strategy with window size of 20. To investigate the influence of different sliding window sizes on results, we vary the values of sliding window size within [10, 15, &#x022EF;&#x000A0;, 30]. The results in ADHD classification on five sites are reported in <xref ref-type="fig" rid="F3">Figure 3</xref>. As shown in <xref ref-type="fig" rid="F3">Figure 3</xref>, we can see that our the classification accuracy of our ASTNet fluctuates to a certain extent as the window size increases. When window size is 20, our method achieves its peak performance across different sites, which validates that our selected window size is reasonable.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>Results of the proposed ASTNet method with respect to different sliding windows length in ADHD vs. NC on different sites.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnins-18-1394234-g0003.tif"/>
</fig>
</sec>
<sec>
<title>5.2 Ablation study</title>
<p>To demonstrate the effectiveness of each module in the proposed ASTNet, we further compare our ASTNet with its degenerated variants, including (1) GCN_d without incorporating adaptive graph learning (AGL) module, (2) AGL_d without incorporating GCN module, (3) ASTNet_G without global branch and (4) ASTNet_L without local branch. The experiment results of our ASTNet and its variants are reported in <xref ref-type="table" rid="T4">Table 4</xref>.</p>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Ablation results on ADHD-200 dataset.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Method</bold></th>
<th valign="top" align="center" colspan="3"><bold>PKU</bold></th>
<th valign="top" align="center" colspan="3"><bold>NYU</bold></th>
<th valign="top" align="center" colspan="3"><bold>OHSU</bold></th>
<th valign="top" align="center" colspan="3"><bold>NI</bold></th>
<th valign="top" align="center" colspan="3"><bold>KKI</bold></th>
<th valign="top" align="center"><bold>Avg-ACC</bold></th>
</tr>
</thead>
<tbody>
<tr style="background-color:#919498;color:#ffffff">
<td/>
<td valign="top" align="center"><bold>ACC</bold></td>
<td valign="top" align="center"><bold>SEN</bold></td>
<td valign="top" align="center"><bold>SPE</bold></td>
<td valign="top" align="center"><bold>ACC</bold></td>
<td valign="top" align="center"><bold>SEN</bold></td>
<td valign="top" align="center"><bold>SPE</bold></td>
<td valign="top" align="center"><bold>ACC</bold></td>
<td valign="top" align="center"><bold>SEN</bold></td>
<td valign="top" align="center"><bold>SPE</bold></td>
<td valign="top" align="center"><bold>ACC</bold></td>
<td valign="top" align="center"><bold>SEN</bold></td>
<td valign="top" align="center"><bold>SPE</bold></td>
<td valign="top" align="center"><bold>ACC</bold></td>
<td valign="top" align="center"><bold>SEN</bold></td>
<td valign="top" align="center"><bold>SPE</bold></td>
<td/>
</tr>
<tr>
<td valign="top" align="left">GCN_d</td>
<td valign="top" align="center">64.7</td>
<td valign="top" align="center">74.1</td>
<td valign="top" align="center">54.2</td>
<td valign="top" align="center">70.7</td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center">72.4</td>
<td valign="top" align="center">73.5</td>
<td valign="top" align="center">85.7</td>
<td valign="top" align="center">16.7</td>
<td valign="top" align="center">68</td>
<td valign="top" align="center">92.9</td>
<td valign="top" align="center">36.4</td>
<td valign="top" align="center">72.7</td>
<td valign="top" align="center">100.0</td>
<td valign="top" align="center">0.0</td>
<td valign="top" align="center">69.9</td>
</tr>
<tr>
<td valign="top" align="left">AGL_d</td>
<td valign="top" align="center">70.6</td>
<td valign="top" align="center">81.5</td>
<td valign="top" align="center">58.3</td>
<td valign="top" align="center">70.7</td>
<td valign="top" align="center">58.3</td>
<td valign="top" align="center">75.9</td>
<td valign="top" align="center">76.5</td>
<td valign="top" align="center">89.3</td>
<td valign="top" align="center">16.7</td>
<td valign="top" align="center">68.0</td>
<td valign="top" align="center">85.7</td>
<td valign="top" align="center">45.5</td>
<td valign="top" align="center">81.8</td>
<td valign="top" align="center">87.5</td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center">73.5</td>
</tr>
<tr>
<td valign="top" align="left">ASTNet_G</td>
<td valign="top" align="center">72.5</td>
<td valign="top" align="center">81.5</td>
<td valign="top" align="center">62.5</td>
<td valign="top" align="center">70.7</td>
<td valign="top" align="center">50.0</td>
<td valign="top" align="center">79.3</td>
<td valign="top" align="center">82.4</td>
<td valign="top" align="center"><bold>100.0</bold></td>
<td valign="top" align="center">0.0</td>
<td valign="top" align="center">72.0</td>
<td valign="top" align="center">92.9</td>
<td valign="top" align="center">45.5</td>
<td valign="top" align="center">90.9</td>
<td valign="top" align="center">87.5</td>
<td valign="top" align="center"><bold>100.0</bold></td>
<td valign="top" align="center">77.7</td>
</tr>
<tr>
<td valign="top" align="left">ASTNet_L</td>
<td valign="top" align="center">62.7</td>
<td valign="top" align="center">74.1</td>
<td valign="top" align="center">50.0</td>
<td valign="top" align="center">68.3</td>
<td valign="top" align="center">41.7</td>
<td valign="top" align="center"><bold>79.3</bold></td>
<td valign="top" align="center">64.7</td>
<td valign="top" align="center">67.9</td>
<td valign="top" align="center">50.0</td>
<td valign="top" align="center"><bold>80.0</bold></td>
<td valign="top" align="center">92.9</td>
<td valign="top" align="center"><bold>63.6</bold></td>
<td valign="top" align="center">81.8</td>
<td valign="top" align="center">87.5</td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center">71.5</td>
</tr>
<tr>
<td valign="top" align="left">ASTNet (ours)</td>
<td valign="top" align="center"><bold>74.5</bold></td>
<td valign="top" align="center"><bold>85.1</bold></td>
<td valign="top" align="center"><bold>62.5</bold></td>
<td valign="top" align="center"><bold>75.6</bold></td>
<td valign="top" align="center"><bold>75.0</bold></td>
<td valign="top" align="center">75.9</td>
<td valign="top" align="center"><bold>85.3</bold></td>
<td valign="top" align="center">89.3</td>
<td valign="top" align="center"><bold>66.7</bold></td>
<td valign="top" align="center">76</td>
<td valign="top" align="center"><bold>92.9</bold></td>
<td valign="top" align="center">54.5</td>
<td valign="top" align="center"><bold>90.9</bold></td>
<td valign="top" align="center"><bold>100.0</bold></td>
<td valign="top" align="center">66.7</td>
<td valign="top" align="center"><bold>80.5</bold></td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>Best results are shown in bold (%).</p>
</table-wrap-foot>
</table-wrap>
<p>It can be found from that our ASTNet consistently outperforms GCN_d that fails to adaptively learn FC strength. This implies that our designed adaptive graph learning strategy can automatically generate more reliable FC network for subsequent analysis, thus boosting model performance. In addition, we can observe that our ASTNet is superior to ASTNet_G without modeling long-term dependencies among dynamic functional connectivities (dFCs). Besides, our ASTNet achieves better performance than ASTNet_L that can not capture local temporal dependency in dFCs. These observations further demonstrate the advantage of our ASTNet, which simultaneously uses global and local branches in fMRI temporal feature learning.</p>
</sec>
<sec>
<title>5.3 Limitations and future work</title>
<p>While our work achieves good results in automatically identifying ADHD using fMRI data, several issues still need to be considered in the future to further improve the performance of the proposed method. First, considering the small-sample-size issue of fMRI data, we will employ transfer learning and pretraining strategies to further enhance model generalization. Second, different brain image modalities, such as structural MRI and Positron Emission Tomography (PET), can provide complementary information for ADHD diagnosis. Integrating multimodal neuroimages would be an interesting avenue to pursue, which will be our future work. Finally, we only construct the functional connectivity matrix based on the AAL atlas with 116 pre-defined ROIs in this work. In the future, we will explore multi-scale functional connectivity networks divided by multiple brain atlas to capture complementary topological information.</p>
</sec>
</sec>
<sec sec-type="conclusions" id="s6">
<title>6 Conclusion</title>
<p>In this paper, we propose an end-to-end adaptive spatial-temporal neural network for ADHD classification using rs-fMRI time-series data. Specifically, we first divide fMRI data into non-overlapping segments to characterize the temporal variability. Then, a adaptive functional connectivity generation (AFCG) module is used model spatial dependencies between brain ROIs for each segment. In particular, within the AFCG, a adaptive graph learning strategy is designed to learn functional connectivity strength a data-driven manner. Finally, we develop a temporal dependency mining (TDM) module that integrates global and local branches to capture the temporal dynamics across multiple time segments. Extensive experiments on the dataset demonstrate the superiority of our ASTNet over several state-of-the-art methods, demonstrating its potential in identifying ADHD.</p>
</sec>
<sec sec-type="data-availability" id="s7">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>BQ: Writing &#x02013; original draft. QW: Writing &#x02013; review &#x00026; editing. XL: Validation, Writing &#x02013; original draft. WL: Writing &#x02013; original draft. WS: Writing &#x02013; review &#x00026; editing. MW: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing.</p>
</sec>
</body>
<back>
<sec sec-type="funding-information" id="s9">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. BQ, XL, WL, and MW were supported in part by the National Natural Science Foundation of China (No. 62102188), the Natural Science Foundation of Jiangsu Province of China (No. BK20210647), the Natural Science Foundation of the Jiangsu Higher Education Institutions of China (No. 21KJB520013), and the Project funded by China Postdoctoral Science Foundation (No. 2021M700076).</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<fn-group>
<fn id="fn0001"><p><sup>1</sup><ext-link ext-link-type="uri" xlink:href="https://fcon_1000.projects.nitrc.org/indi/adhd200/">https://fcon 1000.projects.nitrc.org/indi/adhd200/</ext-link></p></fn>
<fn id="fn0002"><p><sup>2</sup><ext-link ext-link-type="uri" xlink:href="http://preprocessed-connectomes-project.org/abide/">http://preprocessed-connectomes-project.org/abide/</ext-link></p></fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Arieli</surname> <given-names>A.</given-names></name> <name><surname>Sterkin</surname> <given-names>A.</given-names></name> <name><surname>Grinvald</surname> <given-names>A.</given-names></name> <name><surname>Aertsen</surname> <given-names>A.</given-names></name></person-group> (<year>1996</year>). <article-title>Dynamics of ongoing activity: explanation of the large variability in evoked cortical responses</article-title>. <source>Science</source> <volume>273</volume>, <fpage>1868</fpage>&#x02013;<lpage>1871</lpage>. <pub-id pub-id-type="doi">10.1126/science.273.5283.1868</pub-id><pub-id pub-id-type="pmid">8791593</pub-id></citation></ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bahrami</surname> <given-names>M.</given-names></name> <name><surname>Laurienti</surname> <given-names>P. J.</given-names></name> <name><surname>Shappell</surname> <given-names>H.</given-names></name> <name><surname>Simpson</surname> <given-names>S. L.</given-names></name></person-group> (<year>2021</year>). <article-title>A mixed-modeling framework for whole-brain dynamic network analysis</article-title>. <source>Netw. Neurosci</source>. <volume>6</volume>, <fpage>591</fpage>&#x02013;<lpage>613</lpage>. <pub-id pub-id-type="doi">10.1162/netn_a_00238</pub-id><pub-id pub-id-type="pmid">35733427</pub-id></citation></ref>
<ref id="B3">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bai</surname> <given-names>F.</given-names></name> <name><surname>Watson</surname> <given-names>D. R.</given-names></name> <name><surname>Yu</surname> <given-names>H. J.</given-names></name> <name><surname>Mei Shi</surname> <given-names>Y.</given-names></name> <name><surname>Yuan</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>Z.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>Abnormal resting-state functional connectivity of posterior cingulate cortex in amnestic type mild cognitive impairment</article-title>. <source>Brain Res</source>. <volume>1302</volume>, <fpage>167</fpage>&#x02013;<lpage>174</lpage>. <pub-id pub-id-type="doi">10.1016/j.brainres.2009.09.028</pub-id><pub-id pub-id-type="pmid">19765560</pub-id></citation></ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bi</surname> <given-names>X.</given-names></name> <name><surname>Shu</surname> <given-names>Q.</given-names></name> <name><surname>Sun</surname> <given-names>Q.</given-names></name> <name><surname>Xu</surname> <given-names>Q.</given-names></name></person-group> (<year>2018</year>). <article-title>Random support vector machine cluster analysis of resting-state fMRI in Alzheimer&#x00027;s disease</article-title>. <source>PLoS ONE</source> <volume>13</volume>:<fpage>e0194479</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0194479</pub-id><pub-id pub-id-type="pmid">29570705</pub-id></citation></ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cao</surname> <given-names>C.</given-names></name> <name><surname>Li</surname> <given-names>G.</given-names></name> <name><surname>Fu</surname> <given-names>H.</given-names></name> <name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Gao</surname> <given-names>X.</given-names></name></person-group> (<year>2023</year>). <article-title>&#x0201C;SPAE: spatial preservation-based autoencoder for ADHD functional brain networks modelling,&#x0201D;</article-title> in <source>Proceedings of the 2023 ACM International Conference on Multimedia Retrieval</source> (Association for Computeing Machinery), <fpage>370</fpage>&#x02013;<lpage>377</lpage>. <pub-id pub-id-type="doi">10.1145/3591106.3592213</pub-id></citation>
</ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chung</surname> <given-names>J.</given-names></name> <name><surname>G&#x000FC;l&#x000E7;ehre</surname> <given-names>&#x000C7;.</given-names></name> <name><surname>Cho</surname> <given-names>K.</given-names></name> <name><surname>Bengio</surname> <given-names>Y.</given-names></name></person-group> (<year>2014</year>). <article-title>Empirical evaluation of gated recurrent neural networks on sequence modeling</article-title>. <source>arXiv</source> [Preprint]. arXiv/1412.3555. <pub-id pub-id-type="doi">10.48550/arXiv.1412.3555</pub-id></citation>
</ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Damoiseaux</surname> <given-names>J. S.</given-names></name></person-group> (<year>2012</year>). <article-title>Resting-state fMRI as a biomarker for Alzheimer&#x00027;s disease?</article-title> <source>Alzheimers Res. Ther</source>. <volume>4</volume>, <fpage>1</fpage>&#x02013;<lpage>2</lpage>. <pub-id pub-id-type="doi">10.1186/alzrt106</pub-id><pub-id pub-id-type="pmid">22423634</pub-id></citation></ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dey</surname> <given-names>S.</given-names></name> <name><surname>Rao</surname> <given-names>A. R.</given-names></name> <name><surname>Shah</surname> <given-names>M.</given-names></name> <name><surname>Fair</surname> <given-names>D. A.</given-names></name></person-group> (<year>2012</year>). <article-title>Exploiting the brain&#x00027;s network structure in identifying ADHD subjects</article-title>. <source>Front. Syst. Neurosci</source>. <volume>6</volume>:<fpage>75</fpage>. <pub-id pub-id-type="doi">10.3389/fnsys.2012.00075</pub-id><pub-id pub-id-type="pmid">23162440</pub-id></citation></ref>
<ref id="B9">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Dong</surname> <given-names>Q.</given-names></name> <name><surname>Qiang</surname> <given-names>N.</given-names></name> <name><surname>Lv</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Liu</surname> <given-names>T.</given-names></name> <name><surname>Li</surname> <given-names>Q.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;Spatiotemporal attention autoencoder (STAAE) for ADHD classification,&#x0201D;</article-title> in <source>Medical Image Computing and Computer Assisted Intervention &#x02013; MICCAI 2020. MICCAI 2020. Lecture Notes in Computer Science, Vol. 12267</source>, eds. Martel, A.L., et al. (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name>). <pub-id pub-id-type="doi">10.1007/978-3-030-59728-3_50</pub-id><pub-id pub-id-type="pmid">32833639</pub-id></citation></ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dou</surname> <given-names>C.</given-names></name> <name><surname>Zhang</surname> <given-names>S.</given-names></name> <name><surname>Wang</surname> <given-names>H.</given-names></name> <name><surname>Sun</surname> <given-names>L.</given-names></name> <name><surname>Huang</surname> <given-names>Y.</given-names></name> <name><surname>Yue</surname> <given-names>W.</given-names></name></person-group> (<year>2020</year>). <article-title>ADHD fMRI short-time analysis method for edge computing based on multi-instance learning</article-title>. <source>J. Syst. Archit</source>. <volume>111</volume>:<fpage>101834</fpage>. <pub-id pub-id-type="doi">10.1016/j.sysarc.2020.101834</pub-id></citation>
</ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Du</surname> <given-names>Y.</given-names></name> <name><surname>Fu</surname> <given-names>Z.</given-names></name> <name><surname>Calhoun</surname> <given-names>V. D.</given-names></name></person-group> (<year>2018</year>). <article-title>Classification and prediction of brain disorders using functional connectivity: promising but challenging</article-title>. <source>Front. Neurosci</source>. <volume>12</volume>:<fpage>525</fpage>. <pub-id pub-id-type="doi">10.3389/fnins.2018.00525</pub-id><pub-id pub-id-type="pmid">30127711</pub-id></citation></ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eslami</surname> <given-names>T.</given-names></name> <name><surname>Mirjalili</surname> <given-names>V.</given-names></name> <name><surname>Fong</surname> <given-names>A.</given-names></name> <name><surname>Laird</surname> <given-names>A. R.</given-names></name> <name><surname>Saeed</surname> <given-names>F.</given-names></name></person-group> (<year>2019</year>). <article-title>ASD-DiagNet: a hybrid learning approach for detection of autism spectrum disorder using fMRI data</article-title>. <source>Front. Neuroinform</source>. <volume>13</volume>:<fpage>70</fpage>. <pub-id pub-id-type="doi">10.3389/fninf.2019.00070</pub-id><pub-id pub-id-type="pmid">31827430</pub-id></citation></ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Feng</surname> <given-names>Y.</given-names></name> <name><surname>Jia</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>R.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Classification of Alzheimer&#x00027;s disease by combining dynamic and static brain network features,&#x0201D;</article-title> in <source>Proceedings of the 2022 6th International Conference on Computer Science and Artificial Intelligence</source> (Association for Computering Machinery), <fpage>41</fpage>&#x02013;<lpage>48</lpage>. <pub-id pub-id-type="doi">10.1145/3577530.3577537</pub-id><pub-id pub-id-type="pmid">33144220</pub-id></citation></ref>
<ref id="B14">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Gadgil</surname> <given-names>S.</given-names></name> <name><surname>Zhao</surname> <given-names>Q.</given-names></name> <name><surname>Pfefferbaum</surname> <given-names>A.</given-names></name> <name><surname>Sullivan</surname> <given-names>E. V.</given-names></name> <name><surname>Adeli</surname> <given-names>E.</given-names></name> <name><surname>Pohl</surname> <given-names>K. M.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>&#x0201C;Spatio-temporal graph convolution for resting-state fMRI analysis,&#x0201D;</article-title> in <source>Medical Image Computing and computer-assisted intervention: MICCAI International Conference on Medical Image Computing and Computer-Assisted Intervention, Vol. 12267</source> (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>528</fpage>&#x02013;<lpage>538</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-030-59728-3_52</pub-id><pub-id pub-id-type="pmid">33257918</pub-id></citation></ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jie</surname> <given-names>B.</given-names></name> <name><surname>Zhang</surname> <given-names>D.</given-names></name> <name><surname>Gao</surname> <given-names>W.</given-names></name> <name><surname>Wang</surname> <given-names>Q.</given-names></name> <name><surname>Wee</surname> <given-names>C. Y.</given-names></name> <name><surname>Shen</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Integration of network topological and connectivity properties for neuroimaging classification</article-title>. <source>IEEE Trans. Biomed. Eng</source>. <volume>61</volume>, <fpage>576</fpage>&#x02013;<lpage>589</lpage>. <pub-id pub-id-type="doi">10.1109/TBME.2013.2284195</pub-id><pub-id pub-id-type="pmid">24108708</pub-id></citation></ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jie</surname> <given-names>B.</given-names></name> <name><surname>Zhang</surname> <given-names>D.</given-names></name> <name><surname>Wee</surname> <given-names>C. Y.</given-names></name> <name><surname>Shen</surname> <given-names>D.</given-names></name></person-group> (<year>2014</year>). <article-title>Topological graph kernel on multiple thresholded functional connectivity networks for mild cognitive impairment classification</article-title>. <source>Hum. Brain Mapp</source>. <volume>35</volume>, <fpage>2876</fpage>&#x02013;<lpage>2897</lpage>. <pub-id pub-id-type="doi">10.1002/hbm.22353</pub-id><pub-id pub-id-type="pmid">24038749</pub-id></citation></ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kawahara</surname> <given-names>J.</given-names></name> <name><surname>Brown</surname> <given-names>C. J.</given-names></name> <name><surname>Miller</surname> <given-names>S. P.</given-names></name> <name><surname>Booth</surname> <given-names>B. G.</given-names></name> <name><surname>Chau</surname> <given-names>V.</given-names></name> <name><surname>Grunau</surname> <given-names>R. E.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>BrainNetCNN: convolutional neural networks for brain networks; towards predicting neurodevelopment</article-title>. <source>Neuroimage</source> <volume>146</volume>, <fpage>1038</fpage>&#x02013;<lpage>1049</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroimage.2016.09.046</pub-id><pub-id pub-id-type="pmid">27693612</pub-id></citation></ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kipf</surname> <given-names>T.</given-names></name> <name><surname>Welling</surname> <given-names>M.</given-names></name></person-group> (<year>2016</year>). <article-title>Semi-supervised classification with graph convolutional networks</article-title>. <source>arXiv</source> [Preprint]. arXiv/1609.02907. <pub-id pub-id-type="doi">10.48550/arXiv.1609.02907</pub-id></citation>
</ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ktena</surname> <given-names>S. I.</given-names></name> <name><surname>Parisot</surname> <given-names>S.</given-names></name> <name><surname>Ferrante</surname> <given-names>E.</given-names></name> <name><surname>Rajchl</surname> <given-names>M.</given-names></name> <name><surname>Lee</surname> <given-names>M.</given-names></name> <name><surname>Glocker</surname> <given-names>B.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Metric learning with spectral graph convolutions on brain connectivity networks</article-title>. <source>Neuroimage</source> <volume>169</volume>, <fpage>431</fpage>&#x02013;<lpage>442</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroimage.2017.12.052</pub-id><pub-id pub-id-type="pmid">29278772</pub-id></citation></ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Zhou</surname> <given-names>Y.</given-names></name> <name><surname>Gao</surname> <given-names>S.</given-names></name> <name><surname>Dvornek</surname> <given-names>N. C.</given-names></name> <name><surname>Zhang</surname> <given-names>M.</given-names></name> <name><surname>Zhuang</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>BrainGNN: interpretable brain graph neural network for fMRI analysis</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2020.05.16.100057</pub-id><pub-id pub-id-type="pmid">34655865</pub-id></citation></ref>
<ref id="B21">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Liang</surname> <given-names>W.</given-names></name> <name><surname>Zhang</surname> <given-names>K.</given-names></name> <name><surname>Cao</surname> <given-names>P.</given-names></name> <name><surname>Zhao</surname> <given-names>P.</given-names></name> <name><surname>Liu</surname> <given-names>X.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>&#x0201C;Modeling Alzheimers&#x00027; disease progression from multi-task and self-supervised learning perspective with brain networks,&#x0201D;</article-title> in <source>International Conference on Medical Image Computing and Computer-Assisted Intervention</source> (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name>). <pub-id pub-id-type="doi">10.1007/978-3-031-43907-0_30</pub-id></citation>
</ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liang</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>B.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name></person-group> (<year>2021</year>). <article-title>A convolutional neural network combined with prototype learning framework for brain functional network classification of autism spectrum disorder</article-title>. <source>IEEE Trans. Neural Syst. Rehabil. Eng</source>. <volume>29</volume>, <fpage>2193</fpage>&#x02013;<lpage>2202</lpage>. <pub-id pub-id-type="doi">10.1109/TNSRE.2021.3120024</pub-id><pub-id pub-id-type="pmid">34648452</pub-id></citation></ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>K.</given-names></name> <name><surname>Jie</surname> <given-names>B.</given-names></name> <name><surname>Dong</surname> <given-names>P.</given-names></name> <name><surname>Ding</surname> <given-names>X.</given-names></name> <name><surname>Bian</surname> <given-names>W.</given-names></name> <name><surname>Liu</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Convolutional recurrent neural network for dynamic functional MRI analysis and brain disease identification</article-title>. <source>Front. Neurosci</source>. <volume>16</volume>:<fpage>933660</fpage>. <pub-id pub-id-type="doi">10.3389/fnins.2022.933660</pub-id><pub-id pub-id-type="pmid">35873806</pub-id></citation></ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>S.</given-names></name> <name><surname>Zhao</surname> <given-names>L.</given-names></name> <name><surname>Zhao</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>B.</given-names></name> <name><surname>Wang</surname> <given-names>S. H.</given-names></name></person-group> (<year>2022</year>). <article-title>Attention deficit/hyperactivity disorder classification based on deep spatio-temporal features of functional magnetic resonance imaging</article-title>. <source>Biomed. Signal Process. Control</source>. <volume>71</volume>:<fpage>103239</fpage>. <pub-id pub-id-type="doi">10.1016/j.bspc.2021.103239</pub-id><pub-id pub-id-type="pmid">32833639</pub-id></citation></ref>
<ref id="B25">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Makeig</surname> <given-names>S.</given-names></name> <name><surname>Debener</surname> <given-names>S.</given-names></name> <name><surname>Onton</surname> <given-names>J.</given-names></name> <name><surname>Delorme</surname> <given-names>A.</given-names></name></person-group> (<year>2004</year>). <article-title>Mining event-related brain dynamics</article-title>. <source>Trends Cogn. Sci</source>. <volume>8</volume>, <fpage>204</fpage>&#x02013;<lpage>210</lpage>. <pub-id pub-id-type="doi">10.1016/j.tics.2004.03.008</pub-id><pub-id pub-id-type="pmid">15120678</pub-id></citation></ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Onton</surname> <given-names>J.</given-names></name> <name><surname>Westerfield</surname> <given-names>M.</given-names></name> <name><surname>Townsend</surname> <given-names>J.</given-names></name> <name><surname>Makeig</surname> <given-names>S.</given-names></name></person-group> (<year>2006</year>). <article-title>Imaging human EEG dynamics using independent component analysis</article-title>. <source>Neurosci. Biobehav. Rev</source>. <volume>30</volume>, <fpage>808</fpage>&#x02013;<lpage>822</lpage>. <pub-id pub-id-type="doi">10.1016/j.neubiorev.2006.06.007</pub-id><pub-id pub-id-type="pmid">16904745</pub-id></citation></ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Plis</surname> <given-names>S. M.</given-names></name> <name><surname>Hjelm</surname> <given-names>D. R.</given-names></name> <name><surname>Salakhutdinov</surname> <given-names>R.</given-names></name> <name><surname>Allen</surname> <given-names>E. A.</given-names></name> <name><surname>Bockholt</surname> <given-names>H. J.</given-names></name> <name><surname>Long</surname> <given-names>J. D.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Deep learning for neuroimaging: a validation study</article-title>. <source>Front. Neurosci</source>. <volume>8</volume>:<fpage>229</fpage>. <pub-id pub-id-type="doi">10.3389/fnins.2014.00229</pub-id><pub-id pub-id-type="pmid">25191215</pub-id></citation></ref>
<ref id="B28">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thomas</surname> <given-names>R.</given-names></name> <name><surname>Sanders</surname> <given-names>S.</given-names></name> <name><surname>Doust</surname> <given-names>J.</given-names></name> <name><surname>Beller</surname> <given-names>E.</given-names></name> <name><surname>Glasziou</surname> <given-names>P.</given-names></name></person-group> (<year>2015</year>). <article-title>Prevalence of attention-deficit/hyperactivity disorder: a systematic review and meta-analysis</article-title>. <source>Pediatrics</source> <volume>135</volume>, <fpage>e994</fpage>&#x02013;<lpage>e1001</lpage>. <pub-id pub-id-type="doi">10.1542/peds.2014-3482</pub-id><pub-id pub-id-type="pmid">25733754</pub-id></citation></ref>
<ref id="B29">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tolstikhin</surname> <given-names>I. O.</given-names></name> <name><surname>Houlsby</surname> <given-names>N.</given-names></name> <name><surname>Kolesnikov</surname> <given-names>A.</given-names></name> <name><surname>Beyer</surname> <given-names>L.</given-names></name> <name><surname>Zhai</surname> <given-names>X.</given-names></name> <name><surname>Unterthiner</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>MLP-mixer: an all-MLP architecture for vision</article-title>. <source>ArXiv</source>. abs/2105.01601.</citation>
</ref>
<ref id="B30">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vergara</surname> <given-names>V. M.</given-names></name> <name><surname>Mayer</surname> <given-names>A. R.</given-names></name> <name><surname>Kiehl</surname> <given-names>K. A.</given-names></name> <name><surname>Calhoun</surname> <given-names>V. D.</given-names></name></person-group> (<year>2018</year>). <article-title>Dynamic functional network connectivity discriminates mild traumatic brain injury through machine learning</article-title>. <source>Neuroimage</source> <volume>19</volume>, <fpage>30</fpage>&#x02013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.1016/j.nicl.2018.03.017</pub-id><pub-id pub-id-type="pmid">30034999</pub-id></citation></ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Huang</surname> <given-names>J.</given-names></name> <name><surname>Liu</surname> <given-names>M.</given-names></name> <name><surname>Zhang</surname> <given-names>D.</given-names></name></person-group> (<year>2021</year>). <article-title>Modeling dynamic characteristics of brain functional connectivity networks using resting-state functional mri</article-title>. <source>Med. Image Anal</source>. <volume>71</volume>:<fpage>102063</fpage>. <pub-id pub-id-type="doi">10.1016/j.media.2021.102063</pub-id><pub-id pub-id-type="pmid">33910109</pub-id></citation></ref>
<ref id="B32">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Lian</surname> <given-names>C.</given-names></name> <name><surname>Yao</surname> <given-names>D.</given-names></name> <name><surname>Zhang</surname> <given-names>D.</given-names></name> <name><surname>Liu</surname> <given-names>M.</given-names></name> <name><surname>Shen</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2019b</year>). <article-title>Spatial-temporal dependency modeling and network hub detection for functional MRI analysis via convolutional-recurrent network</article-title>. <source>IEEE Trans. Biomed. Eng</source>. <volume>67</volume>, <fpage>2241</fpage>&#x02013;<lpage>2252</lpage>. <pub-id pub-id-type="doi">10.1109/TBME.2019.2957921</pub-id><pub-id pub-id-type="pmid">31825859</pub-id></citation></ref>
<ref id="B33">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Zhang</surname> <given-names>D.</given-names></name> <name><surname>Huang</surname> <given-names>J.</given-names></name> <name><surname>Liu</surname> <given-names>M.</given-names></name> <name><surname>Liu</surname> <given-names>Q.</given-names></name></person-group> (<year>2022a</year>). <article-title>Consistent connectome landscape mining for cross-site brain disease identification using functional MRI</article-title>. <source>Med. Image Anal</source>. <volume>82</volume>:<fpage>102591</fpage>. <pub-id pub-id-type="doi">10.1016/j.media.2022.102591</pub-id><pub-id pub-id-type="pmid">36070656</pub-id></citation></ref>
<ref id="B34">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Zhang</surname> <given-names>D.</given-names></name> <name><surname>Huang</surname> <given-names>J.</given-names></name> <name><surname>Yap</surname> <given-names>P. T.</given-names></name> <name><surname>Shen</surname> <given-names>D.</given-names></name> <name><surname>Liu</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2019a</year>). <article-title>Identifying autism spectrum disorder with multi-site fMRI via low-rank domain adaptation</article-title>. <source>IEEE Trans. Med. Imaging</source> <volume>39</volume>, <fpage>644</fpage>&#x02013;<lpage>655</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2019.2933160</pub-id><pub-id pub-id-type="pmid">31395542</pub-id></citation></ref>
<ref id="B35">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Zhu</surname> <given-names>L.</given-names></name> <name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Pan</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>L.</given-names></name></person-group> (<year>2023</year>). <article-title>Dynamic functional connectivity analysis with temporal convolutional network for attention deficit/hyperactivity disorder identification</article-title>. <source>Front. Neurosci</source>. <volume>17</volume>:<fpage>1322967</fpage>. <pub-id pub-id-type="doi">10.3389/fnins.2023.1322967</pub-id><pub-id pub-id-type="pmid">38148943</pub-id></citation></ref>
<ref id="B36">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>W.</given-names></name> <name><surname>Huang</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name></person-group> (<year>2014</year>). <article-title>&#x0201C;Generalized autoencoder: a neural network framework for dimensionality reduction,&#x0201D;</article-title> in <source>2014 IEEE Conference on Computer Vision and Pattern Recognition Workshops</source>, <fpage>496</fpage>&#x02013;<lpage>503</lpage>. <pub-id pub-id-type="doi">10.1109/CVPRW.2014.79</pub-id></citation>
</ref>
<ref id="B37">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>Ren</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>W.</given-names></name></person-group> (<year>2017</year>). <article-title>Multi-task fused lasso method for constructing dynamic functional brain network of resting-state fMRI</article-title>. <source>J. Image Graph</source>. <volume>22</volume>, <fpage>978</fpage>&#x02013;<lpage>987</lpage>.</citation>
</ref>
<ref id="B38">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Z.</given-names></name> <name><surname>Xin</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>Q.</given-names></name> <name><surname>Wang</surname> <given-names>Z.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name></person-group> (<year>2022</year>). <article-title>NDCN-brain: an extensible dynamic functional brain network model</article-title>. <source>Diagnostics</source> <volume>12</volume>:<fpage>1298</fpage>. <pub-id pub-id-type="doi">10.3390/diagnostics12051298</pub-id><pub-id pub-id-type="pmid">35626453</pub-id></citation></ref>
<ref id="B39">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yan</surname> <given-names>W.</given-names></name> <name><surname>Calhoun</surname> <given-names>V.</given-names></name> <name><surname>Song</surname> <given-names>M.</given-names></name> <name><surname>Cui</surname> <given-names>Y.</given-names></name> <name><surname>Yan</surname> <given-names>H.</given-names></name> <name><surname>Liu</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Discriminating schizophrenia using recurrent neural network applied on time courses of multi-site fMRI data</article-title>. <source>EBioMedicine</source> <volume>47</volume>, <fpage>543</fpage>&#x02013;<lpage>552</lpage>. <pub-id pub-id-type="doi">10.1016/j.ebiom.2019.08.023</pub-id><pub-id pub-id-type="pmid">31420302</pub-id></citation></ref>
<ref id="B40">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>W.</given-names></name> <name><surname>Xu</surname> <given-names>X.</given-names></name> <name><surname>Wang</surname> <given-names>C.</given-names></name> <name><surname>Mei Cheng</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Xu</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Alterations of dynamic functional connectivity between visual and executive-control networks in schizophrenia</article-title>. <source>Brain Imaging Behav</source>. <volume>16</volume>, <fpage>1294</fpage>&#x02013;<lpage>1302</lpage>. <pub-id pub-id-type="doi">10.1007/s11682-021-00592-8</pub-id><pub-id pub-id-type="pmid">34997915</pub-id></citation></ref>
<ref id="B41">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yao</surname> <given-names>D.</given-names></name> <name><surname>Sui</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Yang</surname> <given-names>E.</given-names></name> <name><surname>Jiaerken</surname> <given-names>Y.</given-names></name> <name><surname>Luo</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>A mutual multi-scale triplet graph convolutional network for classification of brain disorders using functional or structural connectivity</article-title>. <source>IEEE Trans. Med. Imaging</source> <volume>40</volume>, <fpage>1279</fpage>&#x02013;<lpage>1289</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2021.3051604</pub-id><pub-id pub-id-type="pmid">33444133</pub-id></citation></ref>
<ref id="B42">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Zhou</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name></person-group> (<year>2017</year>). <article-title>Subject-adaptive integration of multiple SICE brain networks with different sparsity</article-title>. <source>Pattern Recognit</source>. <volume>63</volume>, <fpage>642</fpage>&#x02013;<lpage>652</lpage>. <pub-id pub-id-type="doi">10.1016/j.patcog.2016.09.024</pub-id></citation>
</ref>
<ref id="B43">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Zhou</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Liu</surname> <given-names>M.</given-names></name> <name><surname>Shen</surname> <given-names>D.</given-names></name></person-group> (<year>2022</year>). <article-title>Diffusion kernel attention network for brain disorder classification</article-title>. <source>IEEE Trans. Med. Imaging</source> <volume>41</volume>, <fpage>2814</fpage>&#x02013;<lpage>2827</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2022.3170701</pub-id><pub-id pub-id-type="pmid">35471877</pub-id></citation></ref>
<ref id="B44">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Yang</surname> <given-names>Y.</given-names></name> <name><surname>Zhao</surname> <given-names>S.</given-names></name> <name><surname>Guo</surname> <given-names>L.</given-names></name> <name><surname>Han</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Test-retest reliability of dynamic functional connectivity in naturalistic paradigm functional magnetic resonance imaging</article-title>. <source>Hum. Brain Mapp</source>. <volume>43</volume>, <fpage>1463</fpage>&#x02013;<lpage>1476</lpage>. <pub-id pub-id-type="doi">10.1002/hbm.25736</pub-id><pub-id pub-id-type="pmid">34870361</pub-id></citation></ref>
<ref id="B45">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zou</surname> <given-names>L.</given-names></name> <name><surname>Zheng</surname> <given-names>J.</given-names></name> <name><surname>Miao</surname> <given-names>C.</given-names></name> <name><surname>McKeown</surname> <given-names>M. J.</given-names></name> <name><surname>Wang</surname> <given-names>Z. J.</given-names></name></person-group> (<year>2017</year>). <article-title>3D CNN based automatic diagnosis of attention deficit hyperactivity disorder using functional and structural MRI</article-title>. <source>IEEE Access</source> <volume>5</volume>, <fpage>23626</fpage>&#x02013;<lpage>23636</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2017.2762703</pub-id></citation>
</ref>
</ref-list>
</back>
</article>