<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychiatry</journal-id>
<journal-title>Frontiers in Psychiatry</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychiatry</abbrev-journal-title>
<issn pub-type="epub">1664-0640</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyt.2025.1617650</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Psychiatry</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Graph learning based suicidal ideation detection via tree-drawing test</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Ye</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3122044/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zheng</surname>
<given-names>Jiashuo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3083193/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zeng</surname>
<given-names>Yang</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3094648/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Luo</surname>
<given-names>Fang</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/549241/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Tian</surname>
<given-names>Xuetao</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2626698/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>School of Future Technology, South China University of Technology</institution>, <addr-line>Guangzhou</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Faculty of Psychology, Beijing Normal University</institution>, <addr-line>Beijing</addr-line>,&#xa0;<country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Engineering Research Center of Integration and Application of Digital Learning Technology, Ministry of Education</institution>, <addr-line>Beijing</addr-line>,&#xa0;<country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Areej Alhothali, King Abdulaziz University, Saudi Arabia</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Tao Xu, Northwestern Polytechnical University, China</p>
<p>Gengyu Lyu, Beijing University of Technology, China</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Xuetao Tian, <email xlink:href="mailto:xttian@bnu.edu.cn">xttian@bnu.edu.cn</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>18</day>
<month>07</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1617650</elocation-id>
<history>
<date date-type="received">
<day>24</day>
<month>04</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>06</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Liu, Zheng, Zeng, Luo and Tian</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Liu, Zheng, Zeng, Luo and Tian</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Adolescent suicide is a critical public health concern worldwide, necessitating effective methods for early detection of high suicidal ideation. Traditional detection methods, such as self-report scales, suffer from limited accuracy and are susceptible to personal concealment. Automatic methods based on artificial intelligence techniques are more accurate, while they often lack scalability due to strict data requirements. In order to achieve a balance between accuracy and scalability, this paper introduces the Tree-Drawing Test (TDT) as an effective tool for suicidal ideation detection, and proposes a novel graph learning approach to enable its automatic application.</p>
</sec>
<sec>
<title>Methods</title>
<p>The proposed method first constructs a semantic graph based on psychological features annotated automatically from tree-drawing images, and leverages a Graph Convolutional Network (GCN) model to realize individual suicidal ideation detection. To evaluate this method, a real dataset of 806 students from primary and secondary schools in Shaanxi Province, China, was collected, and metrics including macro-F1, G-mean, and false positive rate were used.</p>
</sec>
<sec>
<title>Results</title>
<p>The results demonstrate that the proposed method significantly outperforms traditional machine learning and convolutional neural network approaches. The ablation study demonstrates the effectiveness of the feature &#x201c;leaves and fruits&#x201d; in detecting suicidal ideation. Further experiments demonstrate that the proposed method remains stable even when the model is disturbed, such as when a tree-drawing image cannot be fully represented.</p>
</sec>
<sec>
<title>Discussion</title>
<p>The proposed method highlights its effectiveness in large-scale suicidal ideation screening, as it not only achieves high detection performance but also maintains model stability while remaining flexible and adaptable.</p>
</sec>
</abstract>
<kwd-group>
<kwd>suicidal ideation detection</kwd>
<kwd>tree-drawing test</kwd>
<kwd>projective test</kwd>
<kwd>graph learning</kwd>
<kwd>graph convolutional network</kwd>
</kwd-group>
<counts>
<fig-count count="9"/>
<table-count count="7"/>
<equation-count count="14"/>
<ref-count count="58"/>
<page-count count="16"/>
<word-count count="8721"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Digital Mental Health</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Adolescent suicide has been a public health concern. Data from the World Health Organization (WHO) shows that more than 1.5 million adolescents and young adults aged 10 to 24 years died in 2021 (<xref ref-type="bibr" rid="B1">1</xref>), and suicide has been the fourth leading cause of death among young people from the ages of 15 to 29 (<xref ref-type="bibr" rid="B2">2</xref>). Meanwhile, approximately one-third of adolescents experiencing suicidal ideation progress to developing suicide plans, and approximately 60% of those have attempted suicide (<xref ref-type="bibr" rid="B3">3</xref>). In this case, early detection and intervention of suicidal ideation through large-scale screening is crucial to promoting healthy adolescent development.</p>
<p>Current tools for detecting suicidal ideation mainly contain self-report scales, artificial intelligence (AI)-driven detection methods and projective tests as shown in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>. Although self-report scales [e.g., Beck Scale (<xref ref-type="bibr" rid="B4">4</xref>)] facilitate efficient large-scale screening for suicidal ideation, their results are susceptible to inaccuracies and self-presentation biases, particularly those arising from intentional self-concealment of sensitive information. AI-driven detection methods, which utilize multi-modal data such as text (<xref ref-type="bibr" rid="B5">5</xref>&#x2013;<xref ref-type="bibr" rid="B7">7</xref>), audio (<xref ref-type="bibr" rid="B8">8</xref>&#x2013;<xref ref-type="bibr" rid="B10">10</xref>), video (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B12">12</xref>), electroencephalogram (EEG) (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B14">14</xref>), etc., demonstrate superior accuracy but lower scalability, as they require specialized data collection process. For instance, researchers collected video and audio data from clinical interviews to analyze smile and gaze behavior, and used SVM method to classify suicidal patients, psychiatric patients and control groups (<xref ref-type="bibr" rid="B11">11</xref>). Another study collected resting-state fMRI data from depressed patients in clinical suicidal crisis, constructed a feature mask via two-sample <italic>t</italic>-test on regional connectivity, and designed a semisupervised clustering framework using the mask for suicidal ideation prediction (<xref ref-type="bibr" rid="B15">15</xref>). Projective tests like the Tree-Drawing Test (TDT) have been applied to identify individuals with psychological states like depressive disorders (<xref ref-type="bibr" rid="B16">16</xref>) and dissociative identity disorder (<xref ref-type="bibr" rid="B17">17</xref>). By leveraging ambiguous stimuli to uncover latent emotions, these methods mitigate subjective bias, enhance response authenticity, and facilitate the scalability of psychological evaluation. 
However, this approach heavily relies on expert interpretation and cannot achieve a timely diagnosis.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Flowchart of suicidal ideation detection. <bold>(a)</bold> Flowchart of suicidal ideation detection via self-report scales. <bold>(b)</bold> Flowchart of suicidal ideation detection via automatic AI model. <bold>(c)</bold> Flowchart of suicidal ideation detection via the drawing projective tests.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1617650-g001.tif">
<alt-text content-type="machine-generated">a. Illustration showing a subject using self-report scales to assess suicidal ideation, depicted by a bell curve ranging from low to high ideation.  b. Diagram of an AI model processing data from text, images, and audio to detect suicidal ideation, with results indicating high or low ideation.  c. Diagram showing a subject creating a tree image, which an expert analyzes to produce a report detecting suicidal ideation, indicating high or low ideation.</alt-text>
</graphic>
</fig>
<p>To address this challenge of supporting large-scale screening, computer vision methods, such as image processing and Convolutional Neural Network (CNN), have been applied to the TDT successfully (<xref ref-type="bibr" rid="B18">18</xref>&#x2013;<xref ref-type="bibr" rid="B20">20</xref>). However, since they focus more on the texture features of tree drawing images and lack the prior knowledge of psychology, it is difficult for them to capture the highly relevant characteristics between TDT and psychological states. Against this background, this paper aims to leverage graph learning methods to employ explainable semantic features related to suicidal ideation and achieve powerful detection capabilities simultaneously, thereby promoting TDT&#x2019;s application in the field of suicidal ideation detection.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Dataset</title>
<p>To conduct this research, we established a dataset of students from primary and secondary schools in Shaanxi Province, China. There were 806 participants in total (392 males and 414 females). Each participant completed the Beck Scale for Suicide Ideation and drew a tree on A4-sized white paper as part of the Tree-Drawing Test. To ensure the effectiveness of the scale, we evaluated item-total correlation and refined it to nine items, achieving a Cronbach&#x2019;s <italic>&#x3b1;</italic> of 0.89, indicating high internal consistency and reliability (<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B22">22</xref>). The scoring ranges from 0 to 10 points for each item, with a total score ranging from 0 to 90 for the nine-item scale. The score distribution is displayed in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>. The average score for suicidal ideation across all subjects was 17.19 (<italic>SD</italic> = 7.01). To categorize the subjects into groups based on their level of suicidal ideation, we applied a threshold of mean plus standard deviation, a common practice in psychological research (<xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B24">24</xref>). Consequently, 94 subjects were classified into the high suicidal ideation group, while the remaining 712 were categorized as low suicidal ideation.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>The score distribution from the self-report scale of suicidal ideation.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1617650-g002.tif">
<alt-text content-type="machine-generated">Violin plot showing the score distribution, with a primary concentration of scores between 10 and 30. The distribution is symmetrical and extends slightly beyond these values.</alt-text>
</graphic>
</fig>
<p>For the Tree-Drawing Test, we selected 98 significant features that can be grouped into 12 classes according to the current psychological research (<xref ref-type="bibr" rid="B25">25</xref>&#x2013;<xref ref-type="bibr" rid="B28">28</xref>). These features are shown in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>, and they were manually labeled by three graduate students specializing in psychometrics. If a certain feature was present in an image, it was marked as &#x201c;1&#x201d;; if absent, it was marked as &#x201c;0&#x201d;. The labeling process was conducted independently by each annotator, resulting in an initial agreement rate of 94%. Any disagreements were resolved through discussion among annotators to reach consensus final labels. Notably, the data collection was conducted in accordance with the Declaration of Helsinki, and approved by the Institutional Review Board of Beijing Normal University (protocol code: 202112300092, and date of approval: December 30, 2021).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Classes and details of tree-drawing features.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Class</th>
<th valign="top" align="left">Features</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">overall</td>
<td valign="top" align="left">huge tree; small tree; tree above; tree below; tree on the left; tree on the right; tilted trunk or crown; cut at the edge of the tree and paper; cut above; cut on the left; cut on the right; cut below</td>
</tr>
<tr>
<td valign="top" align="left">line</td>
<td valign="top" align="left">thick lines; light lines; obvious differences in strength; sloppy lines; mainly short lines; mainly long lines; mainly trembling wavy lines</td>
</tr>
<tr>
<td valign="top" align="left">special mark</td>
<td valign="top" align="left">snakelike; symmetrical</td>
</tr>
<tr>
<td valign="top" align="left">special tree type</td>
<td valign="top" align="left">dead tree; simplified tree; pine tree; theme loss; multiple trees</td>
</tr>
<tr>
<td valign="top" align="left">canopy</td>
<td valign="top" align="left">closed canopy; open canopy; zoned canopy; large canopy; small canopy; squashed canopy; full canopy; emphasized canopy lines; light canopy lines; multi-layered canopy lines; cloud-like canopy lines; ringed canopy line; quivering shaped canopy lines; circular canopy lines; black shadows in the canopy; chaos in the canopy; blank canopy; detailed depicted canopy; short wavy lines drawn in the canopy</td>
</tr>
<tr>
<td valign="top" align="left">branch</td>
<td valign="top" align="left">broken branches; crossing branches; vigorously growing branches; drooping branches; patchwork branches; single-line branches; parallel branches; open branch ends; sharp branch ends</td>
</tr>
<tr>
<td valign="top" align="left">leaf and flower</td>
<td valign="top" align="left">fruits or flowers in the canopy; leaves; fallen leaves</td>
</tr>
<tr>
<td valign="top" align="left">trunk</td>
<td valign="top" align="left">small trunk; long trunk; parallel trunk; wide at the top and narrow at the bottom; wide at the bottom of the trunk; scars on the trunk; black shadow on the trunk; depiction of bark; completely blank trunk; emphasis on trunk edge lines; light trunk edge lines; trunk with small twigs</td>
</tr>
<tr>
<td valign="top" align="left">junction</td>
<td valign="top" align="left">trunk sealed at the top; trunk open at the top; trunk forms an &#x2018;M&#x2019; shape at the top; trunk sealed at the bottom; trunk transitionally sealed at the bottom (drawing whisker-like roots); trunk open at the bottom; trunk directly connects to the branches and the junction is hollow</td>
</tr>
<tr>
<td valign="top" align="left">root</td>
<td valign="top" align="left">drawn roots; fibrous roots; sharp roots; crossing roots; overly drawn roots; exposed roots</td>
</tr>
<tr>
<td valign="top" align="left">ground</td>
<td valign="top" align="left">drawn ground line; sloping ground line; wavy ground line; hilly ground line; emphasized ground; paper&#x2019;s base as ground line (only if depicted flowers and plants); ground line through the trunk</td>
</tr>
<tr>
<td valign="top" align="left">attachment</td>
<td valign="top" align="left">drawn attachments; sun; clouds; flowers under the tree; grass under the tree; birds or bird&#x2019;s nests; houses or people; words; wind and rain</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Baselines</title>
<p>To identify high suicidal ideation, any binary machine learning classifier can be applied to the tree features, whether they are extracted by the automatic tree feature extraction model or manually labeled from images. In this study, we adopted several machine learning (ML) models, including Logistic Regression (LR) (<xref ref-type="bibr" rid="B29">29</xref>), Decision Tree (DT) (<xref ref-type="bibr" rid="B30">30</xref>), Support Vector Machine (SVM) (<xref ref-type="bibr" rid="B31">31</xref>) and Random Forest (RF) (<xref ref-type="bibr" rid="B32">32</xref>) to implement binary classification. Besides, suicidal ideation detection can be performed directly on images using deep learning techniques. The Convolutional Neural Network (CNN) is a common framework in deep learning and is also widely used in image classification. We selected some classic CNN models, such as AlexNet (<xref ref-type="bibr" rid="B33">33</xref>), VGG16 (<xref ref-type="bibr" rid="B34">34</xref>), Inception (<xref ref-type="bibr" rid="B35">35</xref>) and ResNet (<xref ref-type="bibr" rid="B36">36</xref>) as our baselines. To make a comparison with state-of-the-art graph learning models, we also selected GAT (<xref ref-type="bibr" rid="B37">37</xref>), HAN (<xref ref-type="bibr" rid="B38">38</xref>) and Simple-HGN (S-HGN) (<xref ref-type="bibr" rid="B39">39</xref>) as baselines.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Proposed model</title>
<sec id="s2_3_1">
<label>2.3.1</label>
<title>Overview</title>
<p>In this study, we proposed a new model to achieve automatic suicidal ideation detection based on the Tree-Drawing Test, as illustrated in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>. The model consists of three modules. The first one is automatic feature extraction, which determines which tree features are contained in Tree-Drawing Test images. The second one is semantic graph construction, which aims at establishing a graph where the weight of each edge represents the correlation between a psychological tree feature and an individual image. The third one is suicidal ideation detection, which realizes the detection of individual suicidal ideation based on the Tree-Drawing Test and graph node classification. Such a method transforms the traditional image classification task into a graph node classification task. Based on the Graph Convolutional Network (GCN), the images from the Tree-Drawing Test can be better represented, leading to a better performance on suicidal ideation detection. For clearer presentation, <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref> displays the main notations and descriptions.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Overall framework of the proposed model, which consists of three modules: (1) automatic feature extraction, (2) semantic graph construction, and (3) suicidal ideation detection. Such a method formalizes individual suicidal ideation detection as a node classification task in graph. Based on graph learning, the images from Tree-Drawing Test can be better represented via combining psychological tree features and deep learning techniques, leading to a better performance on suicidal ideation detection.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1617650-g003.tif">
<alt-text content-type="machine-generated">Flowchart depicting a three-step process for analyzing tree drawings to detect suicidal ideation. Step 1: Automatic feature extraction using CNN, identifying characteristics like canopy details. Step 2: Constructs semantic graphs with categorized features. Step 3: Employs GCN for suicidal ideation detection, using image vertices and feature representation leading to an MLP for final detection.</alt-text>
</graphic>
</fig>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Notations and descriptions of the proposed model.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Symbols</th>
<th valign="top" align="center">Notations and descriptions</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">
<inline-formula>
<mml:math display="inline" id="im1">
<mml:mi mathvariant="script">G</mml:mi>
</mml:math>
</inline-formula>
</td>
<td valign="top" align="center">Image-feature semantic graph</td>
</tr>
<tr>
<td valign="top" align="center">
<inline-formula>
<mml:math display="inline" id="im2">
<mml:mi mathvariant="script">V</mml:mi>
</mml:math>
</inline-formula>
</td>
<td valign="top" align="center">Vertices set</td>
</tr>
<tr>
<td valign="top" align="center">
<inline-formula>
<mml:math display="inline" id="im3">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>F</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="top" align="center">Feature vertices set</td>
</tr>
<tr>
<td valign="top" align="center">
<inline-formula>
<mml:math display="inline" id="im4">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>I</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="top" align="center">Image vertices set</td>
</tr>
<tr>
<td valign="top" align="center">
<inline-formula>
<mml:math display="inline" id="im5">
<mml:mi>&#x2130;</mml:mi>
</mml:math>
</inline-formula>
</td>
<td valign="top" align="center">Edge set</td>
</tr>
<tr>
<td valign="top" align="center">
<bold>A</bold>
</td>
<td valign="top" align="center">Adjacency matrix</td>
</tr>
<tr>
<td valign="top" align="center">
<bold>X</bold>
</td>
<td valign="top" align="center">Initial representation of all vertices</td>
</tr>
<tr>
<td valign="top" align="center">
<bold>H</bold>
<sup>(</sup>
<italic>
<sup>l</sup>
</italic>
<sup>)</sup>
</td>
<td valign="top" align="center">Feature representation at the <italic>l</italic>-th layer</td>
</tr>
<tr>
<td valign="top" align="center">
<bold>W</bold>
<sup>(</sup>
<italic>
<sup>l</sup>
</italic>
<sup>)</sup>
</td>
<td valign="top" align="center">Trainable weight matrix of the <italic>l</italic>-th layer</td>
</tr>
<tr>
<td valign="top" align="center">
<bold>y</bold>
<italic>
<sup>j</sup>
</italic>
</td>
<td valign="top" align="center">The ground truth label for the <italic>j</italic>-th vertex</td>
</tr>
<tr>
<td valign="top" align="center">
<inline-formula>
<mml:math display="inline" id="im6">
<mml:mrow>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mi>j</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="top" align="center">The prediction for the <italic>j</italic>-th vertex</td>
</tr>
<tr>
<td valign="top" align="center">
<italic>w<sub>c</sub>
</italic>
</td>
<td valign="top" align="center">The weight of class <italic>c</italic>
</td>
</tr>
<tr>
<td valign="top" align="center">
<inline-formula>
<mml:math display="inline" id="im7">
<mml:mrow>
<mml:msubsup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>z</mml:mi>
</mml:mstyle>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="top" align="center">The ground-truth of manual annotation whether the <italic>j</italic>-th image sample has the <italic>i</italic>-th feature</td>
</tr>
<tr>
<td valign="top" align="center">
<inline-formula>
<mml:math display="inline" id="im8">
<mml:mrow>
<mml:msubsup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>z</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="top" align="center">The probability that the model predicts the <italic>j</italic>-th image sample has the <italic>i</italic>-th feature</td>
</tr>
<tr>
<td valign="top" align="center">
<inline-formula>
<mml:math display="inline" id="im9">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="top" align="center">The weight of minority class for the <italic>i</italic>-th feature</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2_3_2">
<label>2.3.2</label>
<title>Automatic tree features extraction</title>
<p>Based on the manually labeled features, we fine-tuned a ResNet network to achieve automatic tree feature extraction through multi-label classification of 98 image features. Specifically, we modified the last fully-connected layer in ResNet34 (<xref ref-type="bibr" rid="B36">36</xref>) into 98 parallel linear layers. The model performs binary classification for each feature and outputs a 98-dimensional vector that indicates whether each feature exists in the input image. It is trained with the cross-entropy loss, which is commonly used for classification tasks. For the <italic>i</italic>-th feature, the loss <inline-formula>
<mml:math display="inline" id="im10">
<mml:mrow>
<mml:msubsup>
<mml:mi>&#x2112;</mml:mi>
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is shown in <xref ref-type="disp-formula" rid="eq1">Equation 1</xref>. The total loss <inline-formula>
<mml:math display="inline" id="im11">
<mml:mrow>
<mml:msup>
<mml:mi>&#x2112;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> is the mean of the losses of each feature, as shown in <xref ref-type="disp-formula" rid="eq2">Equation 2</xref>.</p>
<disp-formula id="eq1">
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:msubsup>
<mml:mi>&#x2112;</mml:mi>
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>M</mml:mi>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>M</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:mo stretchy="false">(</mml:mo>
<mml:msubsup>
<mml:mtext mathvariant="bold">z</mml:mtext>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
<mml:mtext>log&#xa0;</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:mtext mathvariant="bold">z</mml:mtext>
<mml:mo>^</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mtext mathvariant="bold">z</mml:mtext>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mtext>log&#xa0;</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:mtext mathvariant="bold">z</mml:mtext>
<mml:mo>^</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq2">
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:msup>
<mml:mi>&#x2112;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:mfrac>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>N</mml:mi>
</mml:msubsup>
<mml:msubsup>
<mml:mi>&#x2112;</mml:mi>
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mi>N</mml:mi>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Here, <inline-formula>
<mml:math display="inline" id="im12">
<mml:mrow>
<mml:msubsup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>z</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is the probability predicted by the model that the <italic>j</italic>-th image sample has the <italic>i</italic>-th feature, and <inline-formula>
<mml:math display="inline" id="im13">
<mml:mrow>
<mml:msubsup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>z</mml:mi>
</mml:mstyle>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> represents the manually annotated ground truth indicating whether the <italic>j</italic>-th image sample has the <italic>i</italic>-th feature. <italic>M</italic> is the number of training images, and <italic>N</italic> is 98 since there are 98 predefined tree features.</p>
</sec>
<sec id="s2_3_3">
<label>2.3.3</label>
<title>Semantic graph construction</title>
<p>To link the above psychological tree features and images, a semantic graph is constructed and further used to explore intrinsic semantic information contained in images. Generally, a graph is composed of a finite number of vertices and edges between them, usually represented as <inline-formula>
<mml:math display="inline" id="im14">
<mml:mrow>
<mml:mi mathvariant="script">G</mml:mi>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x2130;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, where <inline-formula>
<mml:math display="inline" id="im15">
<mml:mi mathvariant="script">G</mml:mi>
</mml:math>
</inline-formula> denotes the graph, <inline-formula>
<mml:math display="inline" id="im16">
<mml:mi mathvariant="script">V</mml:mi>
</mml:math>
</inline-formula> is the set of vertices in graph <inline-formula>
<mml:math display="inline" id="im17">
<mml:mi mathvariant="script">G</mml:mi>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im18">
<mml:mrow>
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the <italic>i</italic>-th node and <inline-formula>
<mml:math display="inline" id="im19">
<mml:mi>&#x2130;</mml:mi>
</mml:math>
</inline-formula> is the set of edges in graph <inline-formula>
<mml:math display="inline" id="im20">
<mml:mi mathvariant="script">G</mml:mi>
</mml:math>
</inline-formula>. In this model, we take both features and images as vertices to build the image-feature semantic graph, that is, <inline-formula>
<mml:math display="inline" id="im21">
<mml:mrow>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>F</mml:mi>
</mml:msub>
<mml:mo>&#x222a;</mml:mo>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>I</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, where <inline-formula>
<mml:math display="inline" id="im22">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>F</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im23">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>I</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> respectively represent the set of feature vertices and the set of image vertices. If the numbers of features and images are <inline-formula>
<mml:math display="inline" id="im24">
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>F</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im25">
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>I</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> respectively, then the total number of vertices is <inline-formula>
<mml:math display="inline" id="im26">
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>F</mml:mi>
</mml:msub>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>I</mml:mi>
</mml:msub>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. Moreover, the edge set <inline-formula>
<mml:math display="inline" id="im27">
<mml:mi>&#x2130;</mml:mi>
</mml:math>
</inline-formula> of the semantic graph is generated according to the results of automatic tree feature extraction. When the <italic>i</italic>-th image (<inline-formula>
<mml:math display="inline" id="im28">
<mml:mrow>
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>I</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>) has the <italic>j</italic>-th feature (<inline-formula>
<mml:math display="inline" id="im29">
<mml:mrow>
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:msub>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mi>F</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>), there is an edge <inline-formula>
<mml:math display="inline" id="im30">
<mml:mrow>
<mml:msub>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>&#x2130;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> between image vertex <inline-formula>
<mml:math display="inline" id="im31">
<mml:mrow>
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and feature vertex <inline-formula>
<mml:math display="inline" id="im32">
<mml:mrow>
<mml:msub>
<mml:mi>v</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> in the graph <inline-formula>
<mml:math display="inline" id="im33">
<mml:mi mathvariant="script">G</mml:mi>
</mml:math>
</inline-formula>. In graph theory, the adjacency matrix is commonly used to represent the relationship between vertices. For semantic graph <inline-formula>
<mml:math display="inline" id="im34">
<mml:mrow>
<mml:mi mathvariant="script">G</mml:mi>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x2130;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, the corresponding adjacency matrix is an <inline-formula>
<mml:math display="inline" id="im35">
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> by <inline-formula>
<mml:math display="inline" id="im36">
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> square matrix <inline-formula>
<mml:math display="inline" id="im37">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>A</mml:mi>
</mml:mstyle>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi>&#x211d;</mml:mi>
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> with each element generated as <xref ref-type="disp-formula" rid="eq3">Equation 3</xref>.</p>
<disp-formula id="eq3">
<label>(3)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>A</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mtable columnalign="left">
<mml:mtr columnalign="left">
<mml:mtd columnalign="left">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>f</mml:mi>
<mml:mtext>&#xa0;</mml:mtext>
<mml:msub>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>&#x2130;</mml:mi>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr columnalign="left">
<mml:mtd columnalign="left">
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mrow>
<mml:mtext>otherwise</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>where&#xa0;</mml:mtext>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>If there is an edge <inline-formula>
<mml:math display="inline" id="im38">
<mml:mrow>
<mml:msub>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>&#x2130;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> between vertex <italic>v<sub>i</sub>
</italic> and vertex <italic>v<sub>j</sub>
</italic> in graph G, then the element in the <italic>i</italic>-th row and the <italic>j</italic>-th column of adjacency matrix <bold>A</bold> is 1, otherwise it is 0. In this way, the semantic knowledge of Tree-Drawing Test images can be fully preserved in the semantic graph. Consequently, the semantic graph is composed of 904 nodes and 15379 edges, and the edge density is approximately 0.04, indicating that the semantic graph is sparse.</p>
</sec>
<sec id="s2_3_4">
<label>2.3.4</label>
<title>Suicidal ideation detection based on tree-drawing test and graph learning</title>
<p>Since each image vertex has its label, where images of the individuals with low suicidal ideation belong to class 0 and the others belong to class 1, the suicidal ideation detection is transformed into a node classification task on the constructed semantic graph. The graph convolutional network (GCN) has a great expressive power to learn the node representations and has achieved a superior performance in node classification (<xref ref-type="bibr" rid="B40">40</xref>). Therefore, the graph convolutional network is adopted to achieve the final classification results by the following three steps:</p>
<sec id="s2_3_4_1">
<label>2.3.4.1</label>
<title>Initial representation</title>
<p>Fundamentally, a GCN takes a graph together with a set of feature vectors as input, where each node is associated with its own feature vector. In this model, the initial feature vector is obtained by node2vec (<xref ref-type="bibr" rid="B41">41</xref>), which learns low-dimensional embeddings for the nodes of the image-feature semantic graph by applying random walks on the semantic graph starting at a target node. Specifically, it first calculates the transition probabilities between nodes, then generates the walk sequences by biased random walks, and finally obtains the representations through the Skip-gram method (<xref ref-type="bibr" rid="B42">42</xref>). It enables structurally similar vertices to have similar representations. Assuming that the feature of each vertex is represented as a <italic>k</italic>-dimensional vector, we finally obtain the set of all vertex representations <inline-formula>
<mml:math display="inline" id="im39">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>X</mml:mi>
</mml:mstyle>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi>&#x211d;</mml:mi>
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</sec>
<sec id="s2_3_4_2">
<label>2.3.4.2</label>
<title>Graph convolutional network for node representation</title>
<p>To integrate the information of psychological tree features (i.e. the feature vertices) into the image representations (i.e. the embedding of image vertices), we leveraged Graph Convolutional Networks (GCN) (<xref ref-type="bibr" rid="B43">43</xref>), which can learn both topology structure of the graph and semantic features of vertices. GCN implements the node representation process as shown in <xref ref-type="disp-formula" rid="eq4">Equation 4</xref>.</p>
<disp-formula id="eq4">
<label>(4)</label>
<mml:math display="block" id="M4">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>H</mml:mi>
</mml:mstyle>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>&#x3b8;</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>X</mml:mi>
</mml:mstyle>
<mml:mo>,</mml:mo>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>A</mml:mi>
</mml:mstyle>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Here, <bold>X</bold> is the initial vertex embeddings, <italic>&#x3b8;</italic> is the learnable parameter in GCN model, <bold>A</bold> is the adjacency matrix of image-feature semantic graph, and <bold>H</bold>
<sup>(</sup>
<italic>
<sup>L</sup>
</italic>
<sup>)</sup> is the representation of all unlabeled image vertices. The key to the GCN model is to obtain a good node representation. To achieve this, GCN can update the embedding of each vertex by aggregating the information from its corresponding neighbors via a multi-layer structure, as shown in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>. If the GCN model has <italic>L</italic> layers, every GCN layer updates the node features according to <xref ref-type="disp-formula" rid="eq5">Equation 5</xref>.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>The process and details of the graph convolutional network (GCN). Left: GCN can update the embeddings of vertices in the graph based on the known adjacency matrix and vertex embeddings. Right: The <italic>l</italic>-th layer of GCN outputs <bold>H</bold>
<sup>(</sup>
<italic>
<sup>l</sup>
</italic>
<sup>+1)</sup> by calculating the product of <inline-formula>
<mml:math display="inline" id="im40">
<mml:mrow>
<mml:msup>
<mml:mtext mathvariant="bold">H</mml:mtext>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mover accent="true">
<mml:mtext mathvariant="bold">A</mml:mtext>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> and <bold>W</bold>
<sup>(</sup>
<italic>
<sup>l</sup>
</italic>
<sup>)</sup>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1617650-g004.tif">
<alt-text content-type="machine-generated">Diagram of a neural network architecture. On the left, multiple layers of interconnected nodes represent input processing through three graph layers. To the right, a sequence shows data transformations: a normalized adjacency matrix multiplies with feature representations, followed by multiplication with a trainable weight matrix. Columns of colored blocks indicate different feature and weight stages, denoted by \(d_0\), \(d_1\), \(d_2\), etc., emphasizing layer transformations and outputs.</alt-text>
</graphic>
</fig>
<disp-formula id="eq5">
<label>(5)</label>
<mml:math display="block" id="M5">
<mml:mrow>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>H</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mi>&#x3c3;</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>A</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>H</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>W</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>where&#xa0;</mml:mtext>
<mml:mi>l</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mi>L</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im41">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>A</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi>&#x211d;</mml:mi>
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> is the normalized adjacency matrix calculated by <inline-formula>
<mml:math display="inline" id="im42">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>A</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mo>=</mml:mo>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>D</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mn>2</mml:mn>
</mml:mfrac>
</mml:mrow>
</mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>A</mml:mi>
</mml:mstyle>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>D</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mn>2</mml:mn>
</mml:mfrac>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, where <bold>D</bold> represents the graph degree matrix, which is a diagonal matrix with each diagonal element given by <inline-formula>
<mml:math display="inline" id="im43">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>D</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>A</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. And <inline-formula>
<mml:math display="inline" id="im44">
<mml:mrow>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>W</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi>&#x211d;</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>d</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>d</mml:mi>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> is a trainable weight matrix of the <italic>l</italic>-th layer and <italic>&#x3c3;</italic> represents an activation function. <inline-formula>
<mml:math display="inline" id="im45">
<mml:mrow>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>H</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi>&#x211d;</mml:mi>
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>d</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> is the feature representation at the <italic>l</italic>-th layer. Notably, the initial state, <inline-formula>
<mml:math display="inline" id="im46">
<mml:mrow>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>H</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, is set as <bold>X</bold>, i.e., <inline-formula>
<mml:math display="inline" id="im47">
<mml:mrow>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>H</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>X</mml:mi>
</mml:mstyle>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</sec>
<sec id="s2_3_4_3">
<label>2.3.4.3</label>
<title>Node classification</title>
<p>The output of the <italic>L</italic>-th GCN layer is <bold>H</bold>
<sup>(</sup>
<italic>
<sup>L</sup>
</italic>
<sup>)</sup>, and node classification is realized by applying a fully-connected layer with softmax activation function on it as formulated by <xref ref-type="disp-formula" rid="eq6">Equation 6</xref>.</p>
<disp-formula id="eq6">
<label>(6)</label>
<mml:math display="block" id="M6">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>y</mml:mi>
</mml:mstyle>
<mml:mo>=</mml:mo>
<mml:mi>s</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>W</mml:mi>
</mml:mstyle>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>H</mml:mi>
</mml:mstyle>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>L</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>b</mml:mi>
</mml:mstyle>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im48">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>W</mml:mi>
</mml:mstyle>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi>&#x211d;</mml:mi>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>d</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im49">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>b</mml:mi>
</mml:mstyle>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi>&#x211d;</mml:mi>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im50">
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>y</mml:mi>
</mml:mstyle>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi>&#x211d;</mml:mi>
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="script">V</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>. The parameters of the GCN are trained by the commonly-used cross entropy loss as shown in <xref ref-type="disp-formula" rid="eq7">Equation 7</xref>.</p>
<disp-formula id="eq7">
<label>(7)</label>
<mml:math display="block" id="M7">
<mml:mrow>
<mml:msup>
<mml:mi>&#x2112;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mo>,</mml:mo>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>y</mml:mi>
</mml:mstyle>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>T</mml:mi>
</mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>T</mml:mi>
</mml:msubsup>
</mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>y</mml:mi>
</mml:mstyle>
<mml:mi>j</mml:mi>
</mml:msup>
<mml:mtext>log&#xa0;</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mi>j</mml:mi>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>y</mml:mi>
</mml:mstyle>
<mml:mi>j</mml:mi>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mtext>log&#xa0;</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mi>j</mml:mi>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im51">
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
</mml:math>
</inline-formula> and <bold>y</bold> are the predicted values and ground-truth labels of the image vertices, respectively, that is, the predicted and real suicidal ideation labels of the Tree-Drawing Test images. <italic>T</italic> is the number of labeled training image vertices in the semantic graph. <inline-formula>
<mml:math display="inline" id="im52">
<mml:mrow>
<mml:msup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mi>j</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> indicates the prediction for the <italic>j</italic>-th vertex. The whole GCN model is optimized through back propagation.</p>
</sec>
</sec>
<sec id="s2_3_5">
<label>2.3.5</label>
<title>Cost-sensitive strategy for class-imbalanced issue</title>
<p>It is worth noting that the number of individuals with high suicidal ideation is usually much smaller than that of individuals with low suicidal ideation, so there is a class-imbalance issue for suicidal ideation detection. Similarly, automatic tree feature extraction also suffers from a class-imbalance issue. To address the issue of class-imbalanced distribution during both automatic feature extraction and suicidal ideation detection, a cost-sensitive strategy is employed by leveraging the weighted cross entropy loss, which is shown in <xref ref-type="disp-formula" rid="eq8">Equation 8</xref>. By giving the minority class a larger weight, the cost-sensitive strategy imposes a larger penalty when an incorrect prediction is made for the minority class. As a result, the prediction accuracy for the minority class is improved. For the binary classification process of suicidal ideation detection, by using the cost-sensitive strategy, the loss function of the GCN model in <xref ref-type="disp-formula" rid="eq7">Equation 7</xref> is revised as follows:</p>
<disp-formula id="eq8">
<label>(8)</label>
<mml:math display="block" id="M8">
<mml:mrow>
<mml:msubsup>
<mml:mi>&#x2112;</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>b</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mover accent="true">
<mml:mtext mathvariant="bold">y</mml:mtext>
<mml:mo>^</mml:mo>
</mml:mover>
<mml:mo>,</mml:mo>
<mml:mtext mathvariant="bold">y</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>T</mml:mi>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>T</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
<mml:msup>
<mml:mtext mathvariant="bold">y</mml:mtext>
<mml:mi>j</mml:mi>
</mml:msup>
<mml:mtext>log&#xa0;</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:msup>
<mml:mover accent="true">
<mml:mtext mathvariant="bold">y</mml:mtext>
<mml:mo>^</mml:mo>
</mml:mover>
<mml:mi>j</mml:mi>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mtext mathvariant="bold">y</mml:mtext>
<mml:mi>j</mml:mi>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mtext>log&#xa0;</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mover accent="true">
<mml:mtext mathvariant="bold">y</mml:mtext>
<mml:mo>^</mml:mo>
</mml:mover>
<mml:mi>j</mml:mi>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Here, <italic>w<sub>c</sub>
</italic> is the weight of class <italic>c</italic>, to which the <italic>j</italic>-th sample belongs, i.e., <italic>c</italic> = <bold>y</bold>
<italic>
<sup>j</sup>
</italic>. When the <italic>j</italic>-th image vertex represents a sample with high suicidal ideation (class 1 and <bold>y</bold>
<italic>
<sup>j</sup>
</italic> = 1), a larger weight <italic>w</italic>
<sub>1</sub> is assigned to the minority class sample. By assigning a larger weight <italic>w<sub>c</sub>
</italic> to each sample in the minority class, the penalty on the minority class in the loss function can be adjusted to alleviate the class-imbalance issue and thus more effectively detect individuals with high suicidal ideation as well as tree features.</p>
<p>Similarly, in the multi-label classification process of automatic tree feature extraction, the cost-sensitive strategy is employed to handle the class-imbalanced distribution of tree features. The loss function of the automatic tree feature extraction model in <xref ref-type="disp-formula" rid="eq1">Equation 1</xref> for the <italic>i</italic>-th feature is revised as follows:</p>
<disp-formula id="eq9">
<label>(9)</label>
<mml:math display="block" id="M9">
<mml:mrow>
<mml:msubsup>
<mml:mi>&#x2112;</mml:mi>
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>b</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>M</mml:mi>
</mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>M</mml:mi>
</mml:msubsup>
</mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:msubsup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>z</mml:mi>
</mml:mstyle>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
<mml:mtext>log&#xa0;</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:msubsup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>z</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>z</mml:mi>
</mml:mstyle>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mtext>log&#xa0;</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mover accent="true">
<mml:mi>z</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mstyle>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Here, <inline-formula>
<mml:math display="inline" id="im53">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is the weight of the minority class for the <italic>i</italic>-th feature. For the <italic>i</italic>-th feature classification, if images with the <italic>i</italic>-th feature belong to the minority class, a larger weight <inline-formula>
<mml:math display="inline" id="im54">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is assigned to images with label <inline-formula>
<mml:math display="inline" id="im55">
<mml:mrow>
<mml:msubsup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>z</mml:mi>
</mml:mstyle>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. If images without the <italic>i</italic>-th feature belong to the minority class, a larger weight <inline-formula>
<mml:math display="inline" id="im56">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is assigned to images without the <italic>i</italic>-th feature, i.e., images with label <inline-formula>
<mml:math display="inline" id="im57">
<mml:mrow>
<mml:msubsup>
<mml:mstyle mathvariant="bold" mathsize="normal">
<mml:mi>z</mml:mi>
</mml:mstyle>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:msubsup>
<mml:mo>=</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</sec>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Experimental settings</title>
<p>Extensive experiments are conducted to validate the effectiveness of the proposed method. These experiments are designed to address the following research questions:</p>
<list list-type="bullet">
<list-item>
<p>
<italic>RQ-1</italic>: Does the proposed graph learning method outperform other baselines?</p>
</list-item>
<list-item>
<p>
<italic>RQ-2</italic>: Can automatic tree features extraction replace manual annotation for the suicidal ideation detection task?</p>
</list-item>
<list-item>
<p>
<italic>RQ-3</italic>: Does each class of tree features contribute to the individual suicidal ideation detection?</p>
</list-item>
<list-item>
<p>
<italic>RQ-4</italic>: How do different hyperparameters (i.e., cost-sensitive weight for suicidal ideation detection, cost-sensitive weight for feature extraction, and the number of layers in GCN) affect the performance of suicidal ideation detection?</p>
</list-item>
<list-item>
<p>
<italic>RQ-5</italic>: Does the graph learning method perform stably across different training set sizes?</p>
</list-item>
</list>
<p>When comparing the proposed method with the baselines, features are first extracted by the automatic feature extraction module for each image. Then, an image can be represented as a 98-dimensional vector, where each dimension represents the presence or absence of the corresponding feature. For ML models, classification results are obtained by applying the ML models to the extracted 98-dimensional vector. For the graph learning model represented by GCN, the extracted tree features are used to build the image-feature semantic graph, and then the model is applied to the suicidal ideation detection task. In heterogeneous graph learning models, such as HAN and Simple-HGN, the image-feature semantic graph is represented as a heterogeneous graph, where image nodes and feature nodes are treated as two distinct types of nodes. The two types of edges are &#x201c;image-has-feature&#x201d; and &#x201c;feature-exists-in-image.&#x201d; For CNN models, suicidal ideation detection can be seen as a simple image classification task with the original image as input.</p>
<p>Additionally, <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref> shows the hyperparameters in the proposed method. Specifically, we used a multi-label learning model to implement automatic tree-drawing features extraction. By using the manually-annotated features as labels, we trained the automatic tree features extraction model to obtain feature predictions for each image. During the training, the learning rate is set as 0.01, and the weight decay is set as 0.000001. For the class-imbalance issue in automatic tree feature extraction, the cost-sensitive weighted hyperparameter (<inline-formula>
<mml:math display="inline" id="im59">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> in <xref ref-type="disp-formula" rid="eq9">Equation 9</xref>) is set to 4.0. Also, a two-layer GCN (<italic>L</italic> = 2) is employed as graph learning module, and the ReLU function is used as the activation function in <xref ref-type="disp-formula" rid="eq5">Equation 5</xref>. To train GCN model, the learning rate is set as 0.01 and the weight decay is 0.001. For the class-imbalance issue in suicidal ideation detection, the cost-sensitive weighted hyperparameter (<italic>w<sub>c</sub>
</italic> in <xref ref-type="disp-formula" rid="eq8">Equation 8</xref>) is set to 7.0. These hyperparameters are determined by sensitivity analysis as shown in Section 3.4. Besides, after the semantic graph construction, the graph contains 904 vertices (|<italic>V</italic>| = 904), comprising 806 image vertices and 98 feature vertices. For performance evaluation, 80% of image vertices are used as the training set and the remaining 20% of image vertices are utilized as the testing set. The performance on the testing set is reported.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Hyperparameter settings.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Hyperparameter</th>
<th valign="top" align="center">Description</th>
<th valign="top" align="center">Value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">
<italic>L</italic>
</td>
<td valign="top" align="center">The number of GCN layers.</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="center">activation function</td>
<td valign="top" align="center">A mathematical function used in neural networks to introduce non-linearity, allowing the network to learn complex patterns.</td>
<td valign="top" align="center">ReLU</td>
</tr>
<tr>
<td valign="top" align="center">learning rate</td>
<td valign="top" align="center">A hyperparameter that controls the step size of parameter updates during model training.</td>
<td valign="top" align="center">0.01</td>
</tr>
<tr>
<td valign="top" align="center">weight decay</td>
<td valign="top" align="center">A technique used to prevent overfitting by adding a penalty term to the loss function.</td>
<td valign="top" align="center">0.001</td>
</tr>
<tr>
<td valign="top" align="center">
<italic>w<sub>c</sub>
</italic>
</td>
<td valign="top" align="center">The weight of class c.</td>
<td valign="top" align="center">7.0</td>
</tr>
<tr>
<td valign="top" align="center">
<inline-formula>
<mml:math display="inline" id="im58">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="top" align="center">The weight of minority class for the i-th feature.</td>
<td valign="top" align="center">4.0</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Metrics</title>
<p>Regarding the task of suicidal ideation detection, it is more important to minimize missed cases with high suicidal ideation. Since suicidal ideation detection suffers from a serious class-imbalance issue, the individuals who actually have high suicidal ideation (class 1) but are predicted as low suicidal ideation (class 0) are our main concern. Therefore, the following metrics, widely used in imbalanced classification, are employed to evaluate performance: precision of class 0 (precision<sub>0</sub>), recall of class 1 (recall<sub>1</sub>), macro average of F1 score (macro-F1), G-mean and false positive rate (FPR). They are defined in <xref ref-type="disp-formula" rid="eq10">Equations 10</xref>&#x2013;<xref ref-type="disp-formula" rid="eq14">14</xref> as follows (<xref ref-type="bibr" rid="B44">44</xref>):</p>
<disp-formula id="eq10">
<label>(10)</label>
<mml:math display="block" id="M10">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>precision</mml:mtext>
</mml:mrow>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FN</mml:mtext>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>recall</mml:mtext>
</mml:mrow>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq11">
<label>(11)</label>
<mml:math display="block" id="M11">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>precision</mml:mtext>
</mml:mrow>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>recall</mml:mtext>
</mml:mrow>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FN</mml:mtext>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq12">
<label>(12)</label>
<mml:math display="block" id="M12">
<mml:mrow>
<mml:mtable>
<mml:mtr>
<mml:mtd>
<mml:mtext>F</mml:mtext>
<mml:msub>
<mml:mn>1</mml:mn>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>precisio</mml:mtext>
<mml:msub>
<mml:mtext>n</mml:mtext>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>recal</mml:mtext>
<mml:msub>
<mml:mtext>l</mml:mtext>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mtext>precisio</mml:mtext>
<mml:msub>
<mml:mtext>n</mml:mtext>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mtext>recal</mml:mtext>
<mml:msub>
<mml:mtext>l</mml:mtext>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mtext>&#x2009;F</mml:mtext>
<mml:msub>
<mml:mn>1</mml:mn>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>precisio</mml:mtext>
<mml:msub>
<mml:mtext>n</mml:mtext>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>recal</mml:mtext>
<mml:msub>
<mml:mtext>l</mml:mtext>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mtext>precisio</mml:mtext>
<mml:msub>
<mml:mtext>n</mml:mtext>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mtext>recal</mml:mtext>
<mml:msub>
<mml:mtext>l</mml:mtext>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mtext>&#x2009;macro</mml:mtext>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext>F</mml:mtext>
<mml:mn>1</mml:mn>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mn>2</mml:mn>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:mo stretchy="false">(</mml:mo>
<mml:mtext>F</mml:mtext>
<mml:msub>
<mml:mn>1</mml:mn>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mtext>F</mml:mtext>
<mml:msub>
<mml:mn>1</mml:mn>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq13">
<label>(13)</label>
<mml:math display="block" id="M13">
<mml:mrow>
<mml:mtext>G</mml:mtext>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext>mean</mml:mtext>
<mml:mo>=</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mtext>recal</mml:mtext>
<mml:msub>
<mml:mtext>l</mml:mtext>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:msqrt>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq14">
<label>(14)</label>
<mml:math display="block" id="M14">
<mml:mrow>
<mml:mtext>FPR</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>FP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where TP, TN, FP, and FN denote true positive, true negative, false positive, and false negative, respectively. F1<sub>0</sub> and F1<sub>1</sub> represent the F1 scores of class 0 and class 1, respectively. Macro-F1 evaluates the model&#x2019;s performance by treating all classes equally. G-mean is a comprehensive indicator of the recall of class 0 and class 1. For precision<sub>0</sub>, recall<sub>1</sub>, macro-F1 and G-mean, a higher value indicates better performance. The False Positive Rate (FPR) measures the model&#x2019;s tendency to incorrectly predict negative samples as positive; a lower FPR indicates better performance in identifying negative samples.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>The proposed GCN method achieves better performance than baselines (RQ-1)</title>
<p>The performance of all methods is reported in <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref> (left), with the cost-sensitive strategy consistently applied to both CNN models and graph learning models. From the results, both ML models and graph learning models achieve better results on macro-F1, demonstrating that these models perform well in predicting both the high suicidal ideation class and the low suicidal ideation class. Different from CNN models, which use convolution operations to extract the features of images, ML models and graph learning models are built on the 98 tree-drawing features extracted from the images (see Section 2.3.2). Since these tree-drawing features are psychologically meaningful, they are relevant to individual suicidal ideation. They are well-suited for the task of suicidal ideation detection, thereby improving the overall performance. In order to explain the results more intuitively, <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref> shows the confusion matrices of decision tree (DT), cost-sensitive DT (<xref ref-type="bibr" rid="B45">45</xref>) and GCN. It can be noticed that the TP of GCN is higher than that of DT, and thus its recall<sub>1</sub> is higher. Since recall<sub>1</sub> is a very important metric in our task, which measures the model&#x2019;s ability to recognize the individuals with high suicidal ideation, the ML methods are not competitive for this task. In this case, the lower FPR of the ML models is due to only a small number of individuals with high suicidal ideation being identified. The highest G-mean of GCN also demonstrates this point. Conceivably, in contrast to CNN and ML models, different tree-drawing image nodes are connected through tree-drawing feature nodes in the semantic graph, so that similarities and differences among different samples during training can be better captured by the graph.</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>Performance comparison results.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">model</th>
<th valign="top" align="center">precision<sub>0</sub>
</th>
<th valign="top" align="center">recall<sub>1</sub>
</th>
<th valign="top" align="center">macro-F1</th>
<th valign="top" align="center">G-mean</th>
<th valign="top" align="center">FPR</th>
<th valign="top" align="center">model*</th>
<th valign="top" align="center">precision<sub>0</sub>
</th>
<th valign="top" align="center">recall<sub>1</sub>
</th>
<th valign="top" align="center">macro-F1</th>
<th valign="top" align="center">G-mean</th>
<th valign="top" align="center">FPR</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">89.36%</td>
<td valign="top" align="center">21.05%</td>
<td valign="top" align="center">54.78%</td>
<td valign="top" align="center">43.22%</td>
<td valign="top" align="center">11.27%</td>
<td valign="top" align="center">LR*</td>
<td valign="top" align="center">89.93%</td>
<td valign="top" align="center">26.32%</td>
<td valign="top" align="center">56.68%</td>
<td valign="top" align="center">48.13%</td>
<td valign="top" align="center">11.97%</td>
</tr>
<tr>
<td valign="top" align="center">DT</td>
<td valign="top" align="center">89.58%</td>
<td valign="top" align="center">21.05%</td>
<td valign="top" align="center">
<bold>56.22%</bold>
</td>
<td valign="top" align="center">43.73%</td>
<td valign="top" align="center">9.15%</td>
<td valign="top" align="center">DT*</td>
<td valign="top" align="center">89.15%</td>
<td valign="top" align="center">26.32%</td>
<td valign="top" align="center">52.24%</td>
<td valign="top" align="center">46.17%</td>
<td valign="top" align="center">19.01%</td>
</tr>
<tr>
<td valign="top" align="center">SVM</td>
<td valign="top" align="center">88.96%</td>
<td valign="top" align="center">10.53%</td>
<td valign="top" align="center">53.98%</td>
<td valign="top" align="center">31.87%</td>
<td valign="top" align="center">
<bold>3.52%</bold>
</td>
<td valign="top" align="center">SVM*</td>
<td valign="top" align="center">90.13%</td>
<td valign="top" align="center">21.05%</td>
<td valign="top" align="center">60.88%</td>
<td valign="top" align="center">45.07%</td>
<td valign="top" align="center">3.52%</td>
</tr>
<tr>
<td valign="top" align="center">RF</td>
<td valign="top" align="center">88.96%</td>
<td valign="top" align="center">10.53%</td>
<td valign="top" align="center">53.98%</td>
<td valign="top" align="center">31.87%</td>
<td valign="top" align="center">
<bold>3.52%</bold>
</td>
<td valign="top" align="center">RF*</td>
<td valign="top" align="center">89.03%</td>
<td valign="top" align="center">10.53%</td>
<td valign="top" align="center">54.46%</td>
<td valign="top" align="center">31.98%</td>
<td valign="top" align="center">2.82%</td>
</tr>
<tr>
<td valign="top" align="center">AlexNet</td>
<td valign="top" align="center">88.17%</td>
<td valign="top" align="center">42.11%</td>
<td valign="top" align="center">44.09%</td>
<td valign="top" align="center">49.31%</td>
<td valign="top" align="center">42.25%</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="center">VGG16</td>
<td valign="top" align="center">86.89%</td>
<td valign="top" align="center">
<bold>57.89%</bold>
</td>
<td valign="top" align="center">35.35%</td>
<td valign="top" align="center">46.49%</td>
<td valign="top" align="center">62.68%</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="center">Inception</td>
<td valign="top" align="center">86.44%</td>
<td valign="top" align="center">
<bold>57.89%</bold>
</td>
<td valign="top" align="center">34.46%</td>
<td valign="top" align="center">45.60%</td>
<td valign="top" align="center">64.08%</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="center">ResNet</td>
<td valign="top" align="center">85.29%</td>
<td valign="top" align="center">47.37%</td>
<td valign="top" align="center">35.65%</td>
<td valign="top" align="center">43.99%</td>
<td valign="top" align="center">59.15%</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="center">GAT</td>
<td valign="top" align="center">89.74%</td>
<td valign="top" align="center">
<bold>57.89%</bold>
</td>
<td valign="top" align="center">42.60%</td>
<td valign="top" align="center">53.42%</td>
<td valign="top" align="center">50.70%</td>
<td valign="top" align="center">GAT*</td>
<td valign="top" align="center">91.09%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">50.52%</td>
<td valign="top" align="center">58.39%</td>
<td valign="top" align="center">35.21%</td>
</tr>
<tr>
<td valign="top" align="center">HAN</td>
<td valign="top" align="center">87.95%</td>
<td valign="top" align="center">47.37%</td>
<td valign="top" align="center">41.72%</td>
<td valign="top" align="center">49.35%</td>
<td valign="top" align="center">48.59%</td>
<td valign="top" align="center">HAN*</td>
<td valign="top" align="center">90.72%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">48.87%</td>
<td valign="top" align="center">57.11%</td>
<td valign="top" align="center">38.03%</td>
</tr>
<tr>
<td valign="top" align="center">S-HGN</td>
<td valign="top" align="center">88.76%</td>
<td valign="top" align="center">47.37%</td>
<td valign="top" align="center">44.09%</td>
<td valign="top" align="center">51.34%</td>
<td valign="top" align="center">44.37%</td>
<td valign="top" align="center">S-HGN*</td>
<td valign="top" align="center">90.00%</td>
<td valign="top" align="center">42.11%</td>
<td valign="top" align="center">50.71%</td>
<td valign="top" align="center">54.18%</td>
<td valign="top" align="center">30.28%</td>
</tr>
<tr>
<td valign="top" align="center">GCN</td>
<td valign="top" align="center">
<bold>90.59%</bold>
</td>
<td valign="top" align="center">
<bold>57.89%</bold>
</td>
<td valign="top" align="center">45.50%</td>
<td valign="top" align="center">
<bold>56.03%</bold>
</td>
<td valign="top" align="center">45.77%</td>
<td valign="top" align="center">GCN*</td>
<td valign="top" align="center">92.68%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">60.56%</td>
<td valign="top" align="center">65.00%</td>
<td valign="top" align="center">19.72%</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Bold indicates the best result among all methods.</p>
<p>* represents the situations where the tree features are manually annotated.</p>
</fn>
<fn>
<p>&#x2013; represents the situations where the model implementation does not rely on manually-annotated tree features.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>The confusion matrices of decision tree (DT), cost-sensitive DT and Graph Convolutional Network (GCN).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1617650-g005.tif">
<alt-text content-type="machine-generated">Three confusion matrices compare Decision Tree (DT), Cost-sensitive Decision Tree, and Graph Convolutional Network (GCN) models. Each matrix shows true positive (TP), false positive (FP), false negative (FN), and true negative (TN) values. DT: TP 4, FP 13, FN 15, TN 129. Cost-sensitive DT: TP 4, FP 23, FN 15, TN 119. GCN: TP 11, FP 65, FN 8, TN 77. Shaded gradients indicate data density.</alt-text>
</graphic>
</fig>
<p>As for the comparison with other graph learning models, GCN outperforms them in terms of all metrics. We hypothesize that, due to the limited number of node types and edge types in the image-feature semantic graph, heterogeneous graph learning models are unable to fully demonstrate their advantages. Compared to GAT, which assigns adaptive edge weights through attention mechanisms, GCN still demonstrates superior performance. This discrepancy may suggest that maintaining equal edge weights is more suitable for the current task. Additionally, this could indicate that the current dataset size might not be sufficient for graph learning to learn the feature importance. Further exploration with a larger dataset is warranted in future research.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Automatic extraction of tree-drawing features has room for improvement (RQ-2)</title>
<p>As mentioned in Section 2.3, we used a multi-label learning model to implement automatic tree-drawing features extraction. On this basis, we compared the models using automatically-extracted tree features with those using manually-annotated tree features for individual suicidal ideation detection. The results are reported in <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref> (left vs. right). For a specific model, the suicidal ideation detection performance with manually-annotated tree features can be considered as the idealized result. The closer the performance obtained using automatically-extracted tree features is to the idealized result, the more effective the automatic feature extraction is. From the results, it is apparent that individual suicidal ideation detection depends on accurate tree features for both machine learning models and graph learning models. In our method, the tree-drawing features are represented as vertices, which only have connections with image vertices in the image-feature semantic graph. The representation of a tree-drawing image would be heavily affected by the quality of features based on the information propagation mechanism of GCN, leading to significant improvement in terms of macro-F1 and G-mean metrics with manually-annotated features for GCN. Thus, there is still significant room for improvement in automatic feature extraction in the future. Besides, it can be seen that the GCN model outperforms ML models in suicidal ideation detection even under the setting of using manually-annotated tree features, demonstrating the effectiveness of the proposed method again. In an ideal scenario, the performance of GCN still surpasses that of the ML models, CNN models, and other graph learning models. Moreover, the ideal GCN model performs well in both macro-F1 (60.56%) and G-mean (65.00%), and also demonstrates good performance in recall<sub>1</sub> (52.63%) and FPR (19.72%). This indicates that the GCN model has the highest potential for suicidal ideation detection based on the Tree-Drawing Test.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>All classes of tree-drawing test features can contribute to suicidal ideation detection verified by ablation study (RQ-3)</title>
<p>As mentioned above in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>, there are a total of 12 feature classes. In order to prove the effectiveness of the features we selected, we conducted an ablation experiment. Based on the manually-annotated tree features, we removed each class of features in turn, and further conducted a GCN-based suicidal ideation detection experiment with the remaining features. The results are shown in <xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref>. The &#x201c;removed feature&#x201d; column represents the removed feature class, and the first &#x201c;none&#x201d; row means that all features are retained. The results indicate that the performance of the model after removing a certain class of features is slightly inferior to that without removing any class of features, which suggests, to a certain extent, that all 12 classes of features are effective for individual suicidal ideation detection. Moreover, it is worth noting that when we removed the feature class &#x201c;leaf and flower&#x201d;, the performance showed the most significant decline. In contrast, the performance reduction caused by removing the feature class &#x201c;root&#x201d; or &#x201c;attachment&#x201d; is not obvious. We can tentatively conclude that for the task of suicidal ideation detection, features in the class &#x201c;leaf and flower&#x201d;, such as &#x201c;leaves&#x201d; and &#x201c;fruits&#x201d;, play a more important role in detecting suicidal ideation than other features. In existing tree-drawing test studies, researchers have identified numerous characteristics related to psychological states, such as the shape of the tree crown, the inclination of the trunk, and the overall size of the tree (<xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B46">46</xref>). The importance of &#x201c;leaves and fruits&#x201d; validated by our study provides a new perspective to this field. In terms of the recall<sub>1</sub> metric, the value increased when the feature classes &#x201c;special tree type&#x201d;, &#x201c;canopy&#x201d;, &#x201c;leaf and flower&#x201d; or &#x201c;ground&#x201d; were removed, which may suggest that these features usually appear in the images of individuals with low suicidal ideation. In total, all 12 classes of features have a certain effect on detecting individual suicidal ideation.</p>
<table-wrap id="T5" position="float">
<label>Table&#xa0;5</label>
<caption>
<p>Feature ablation experiment.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">removed feature</th>
<th valign="top" align="center">precision<sub>0</sub>
</th>
<th valign="top" align="center">recall<sub>1</sub>
</th>
<th valign="top" align="center">macro-F1</th>
<th valign="top" align="center">G-mean</th>
<th valign="top" align="center">FPR</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">
<bold>none</bold>
</td>
<td valign="top" align="center">
<bold>92.68%</bold>
</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">
<bold>60.56%</bold>
</td>
<td valign="top" align="center">
<bold>65.00%</bold>
</td>
<td valign="top" align="center">
<bold>19.72%</bold>
</td>
</tr>
<tr>
<td valign="top" align="center">overall</td>
<td valign="top" align="center">92.04%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">55.71%</td>
<td valign="top" align="center">62.09%</td>
<td valign="top" align="center">26.76%</td>
</tr>
<tr>
<td valign="top" align="center">line</td>
<td valign="top" align="center">91.89%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">54.81%</td>
<td valign="top" align="center">61.49%</td>
<td valign="top" align="center">28.17%</td>
</tr>
<tr>
<td valign="top" align="center">special mark</td>
<td valign="top" align="center">92.11%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">56.17%</td>
<td valign="top" align="center">62.38%</td>
<td valign="top" align="center">26.06%</td>
</tr>
<tr>
<td valign="top" align="center">special tree type</td>
<td valign="top" align="center">92.79%</td>
<td valign="top" align="center">
<bold>57.89%</bold>
</td>
<td valign="top" align="center">56.65%</td>
<td valign="top" align="center">64.80%</td>
<td valign="top" align="center">27.46%</td>
</tr>
<tr>
<td valign="top" align="center">canopy</td>
<td valign="top" align="center">92.45%</td>
<td valign="top" align="center">
<bold>57.89%</bold>
</td>
<td valign="top" align="center">54.38%</td>
<td valign="top" align="center">63.21%</td>
<td valign="top" align="center">30.99%</td>
</tr>
<tr>
<td valign="top" align="center">branch</td>
<td valign="top" align="center">91.67%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">53.49%</td>
<td valign="top" align="center">60.58%</td>
<td valign="top" align="center">30.28%</td>
</tr>
<tr>
<td valign="top" align="center">leaf and flower</td>
<td valign="top" align="center">90.91%</td>
<td valign="top" align="center">
<bold>57.89%</bold>
</td>
<td valign="top" align="center">46.74%</td>
<td valign="top" align="center">57.11%</td>
<td valign="top" align="center">43.66%</td>
</tr>
<tr>
<td valign="top" align="center">trunk</td>
<td valign="top" align="center">91.82%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">54.37%</td>
<td valign="top" align="center">61.18%</td>
<td valign="top" align="center">28.87%</td>
</tr>
<tr>
<td valign="top" align="center">junction</td>
<td valign="top" align="center">91.89%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">54.81%</td>
<td valign="top" align="center">61.49%</td>
<td valign="top" align="center">28.17%</td>
</tr>
<tr>
<td valign="top" align="center">root</td>
<td valign="top" align="center">92.62%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">60.04%</td>
<td valign="top" align="center">64.72%</td>
<td valign="top" align="center">20.42%</td>
</tr>
<tr>
<td valign="top" align="center">ground</td>
<td valign="top" align="center">92.73%</td>
<td valign="top" align="center">
<bold>57.89%</bold>
</td>
<td valign="top" align="center">56.19%</td>
<td valign="top" align="center">64.49%</td>
<td valign="top" align="center">28.17%</td>
</tr>
<tr>
<td valign="top" align="center">attachment</td>
<td valign="top" align="center">92.62%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">60.04%</td>
<td valign="top" align="center">64.72%</td>
<td valign="top" align="center">20.42%</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Bold indicates the best result among all ablation settings.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Sensitivity analysis helps determining the best hyperparameters (RQ-4)</title>
<sec id="s3_4_1">
<label>3.4.1</label>
<title>Cost-sensitive weight for suicidal ideation detection</title>
<p>In reality, the number of individuals with low suicidal ideation is much larger than that with high suicidal ideation, resulting in a serious class-imbalance issue between class 0 (low suicidal ideation) and class 1 (high suicidal ideation) in the dataset. A cost-sensitive strategy with weighting factor <italic>w<sub>c</sub>
</italic> is introduced in <xref ref-type="disp-formula" rid="eq8">Equation 8</xref> to solve this problem. We tested the weight values in the range between 1 and 16 in steps of 1, since the ratio of samples with low suicidal ideation to those with high suicidal ideation is approximately 7.57:1. The performance with the change of weighting factor <italic>w<sub>c</sub>
</italic> is shown in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>. When the <italic>w<sub>c</sub>
</italic> is 1 or 2, the values of G-mean and recall<sub>1</sub> are zero, which means that the model has difficulties in detecting the samples with high suicidal ideation, and the model gives wrong predictions to all samples with high suicidal ideation. In general, the overall performance first increases and then decreases. The model has a more stable performance when the <italic>w<sub>c</sub>
</italic> is between 6 and 9. Besides, it seems that the four metrics achieve the best results when <italic>w<sub>c</sub>
</italic> is 7. It suggests that the proposed method requires selecting <italic>w<sub>c</sub>
</italic> based on data distribution in practical applications.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Sensitivity test of cost-sensitive weight for individual suicidal ideation detection.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1617650-g006.tif">
<alt-text content-type="machine-generated">Line graph plotting various performance metrics against \(w_c\) values from 1 to 16. Orange line represents precision0, consistently above 80%. Yellow and green lines, recall1 and macro-f1, fluctuate between 0% and 60%. Cyan line, G-mean, increases from 0% to 60%. Red line, FPR, shows more variation between 0% and 40%.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3_4_2">
<label>3.4.2</label>
<title>Cost-sensitive weight for feature extraction</title>
<p>For each feature, there is also a class-imbalance issue. For example, closed tree canopy is more common in tree images, so there are more images with the &#x201c;closed canopy&#x201d; feature than those without it in our dataset. Conversely, only a very small number of images contain houses or people, so the number of images without the &#x201c;houses or people&#x201d; feature is much larger than the number with it. Therefore, we introduced the weighting factor (named <inline-formula>
<mml:math display="inline" id="im60">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>) in <xref ref-type="disp-formula" rid="eq9">Equation 9</xref> during the automatic features extraction. For each feature, we gave a larger <inline-formula>
<mml:math display="inline" id="im61">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> to the feature class with fewer samples when performing the multi-classification task. Following the same range of <italic>w<sub>c</sub>
</italic> in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>, we tried 5 different <inline-formula>
<mml:math display="inline" id="im62">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> values for each feature class and conducted the automatic tree features extraction experiment, and the results are shown in <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>. The specific approach is using the manually-annotated features as labels and applying automatic tree features extraction model. During the training, <inline-formula>
<mml:math display="inline" id="im63">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is applied to the class with fewer samples for each feature. Overall, the feature extraction model performs the best when <inline-formula>
<mml:math display="inline" id="im64">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is 4.0.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Sensitivity test of cost-sensitive weight for automatic features extraction.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1617650-g007.tif">
<alt-text content-type="machine-generated">Line graph showing performance percentages of precision, recall, and F1 score against a variable labeled \( w_f^i \). Precision decreases, recall increases, and F1 score remains stable, intersecting at \( w_f^i = 2 \).</alt-text>
</graphic>
</fig>
<p>After we obtained automatic feature extraction results based on the models with five different <inline-formula>
<mml:math display="inline" id="im65">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>, the image-feature semantic graph is constructed and the suicidal ideation detection task is conducted for each setting. The results are shown in <xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref>. It can be noticed that GCN and DT perform better when <inline-formula>
<mml:math display="inline" id="im66">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is 4, and the best <inline-formula>
<mml:math display="inline" id="im67">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> for LR, SVM and RF is 2. From the results, we can find that the performance with <inline-formula>
<mml:math display="inline" id="im68">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> as 1 is worse than that with 2, 4 and 8; this result demonstrates that the cost-sensitive strategy does improve the performance of individual suicidal ideation detection. Meanwhile, there are opposite effects when the <inline-formula>
<mml:math display="inline" id="im69">
<mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is too large.</p>
<table-wrap id="T6" position="float">
<label>Table&#xa0;6</label>
<caption>
<p>Suicidal ideation detection based on automatic feature coding with different <italic>w<sub>f</sub>
</italic>.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Model</th>
<th valign="top" align="center">
<italic>w<sub>f</sub>
</italic>
</th>
<th valign="top" align="center">Precision<sub>0</sub>
</th>
<th valign="top" align="center">Recall<sub>1</sub>
</th>
<th valign="top" align="center">Macro-F1</th>
<th valign="top" align="center">G-mean</th>
<th valign="top" align="center">FPR</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" rowspan="5" align="center">GCN</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">89.36%</td>
<td valign="top" align="center">47.37%</td>
<td valign="top" align="center">46.06%</td>
<td valign="top" align="center">52.93%</td>
<td valign="top" align="center">40.85%</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">90.32%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">47.24%</td>
<td valign="top" align="center">55.80%</td>
<td valign="top" align="center">40.85%</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">90.59%</td>
<td valign="top" align="center">57.89%</td>
<td valign="top" align="center">45.50%</td>
<td valign="top" align="center">56.03%</td>
<td valign="top" align="center">45.77%</td>
</tr>
<tr>
<td valign="top" align="center">8</td>
<td valign="top" align="center">90.00%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">46.02%</td>
<td valign="top" align="center">54.79%</td>
<td valign="top" align="center">42.96%</td>
</tr>
<tr>
<td valign="top" align="center">16</td>
<td valign="top" align="center">89.58%</td>
<td valign="top" align="center">47.37%</td>
<td valign="top" align="center">46.85%</td>
<td valign="top" align="center">53.56%</td>
<td valign="top" align="center">39.44%</td>
</tr>
<tr>
<td valign="top" rowspan="5" align="center">LR</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">89.29%</td>
<td valign="top" align="center">21.05%</td>
<td valign="top" align="center">54.33%</td>
<td valign="top" align="center">43.05%</td>
<td valign="top" align="center">11.97%</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">88.71%</td>
<td valign="top" align="center">26.32%</td>
<td valign="top" align="center">50.28%</td>
<td valign="top" align="center">45.15%</td>
<td valign="top" align="center">22.54%</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">89.36%</td>
<td valign="top" align="center">21.05%</td>
<td valign="top" align="center">54.78%</td>
<td valign="top" align="center">43.22%</td>
<td valign="top" align="center">11.27%</td>
</tr>
<tr>
<td valign="top" align="center">8</td>
<td valign="top" align="center">88.54%</td>
<td valign="top" align="center">5.26%</td>
<td valign="top" align="center">50.84%</td>
<td valign="top" align="center">22.70%</td>
<td valign="top" align="center">2.11%</td>
</tr>
<tr>
<td valign="top" align="center">16</td>
<td valign="top" align="center">89.24%</td>
<td valign="top" align="center">10.53%</td>
<td valign="top" align="center">56.09%</td>
<td valign="top" align="center">32.33%</td>
<td valign="top" align="center">0.70%</td>
</tr>
<tr>
<td valign="top" rowspan="5" align="center">DT</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">88.74%</td>
<td valign="top" align="center">10.53%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">31.52%</td>
<td valign="top" align="center">5.63%</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">88.81%</td>
<td valign="top" align="center">15.79%</td>
<td valign="top" align="center">52.67%</td>
<td valign="top" align="center">37.58%</td>
<td valign="top" align="center">10.56%</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">89.58%</td>
<td valign="top" align="center">21.05%</td>
<td valign="top" align="center">56.22%</td>
<td valign="top" align="center">43.73%</td>
<td valign="top" align="center">9.15%</td>
</tr>
<tr>
<td valign="top" align="center">8</td>
<td valign="top" align="center">88.98%</td>
<td valign="top" align="center">26.32%</td>
<td valign="top" align="center">51.44%</td>
<td valign="top" align="center">45.76%</td>
<td valign="top" align="center">20.42%</td>
</tr>
<tr>
<td valign="top" align="center">16</td>
<td valign="top" align="center">84.47%</td>
<td valign="top" align="center">15.79%</td>
<td valign="top" align="center">39.41%</td>
<td valign="top" align="center">31.10%</td>
<td valign="top" align="center">38.73%</td>
</tr>
<tr>
<td valign="top" rowspan="5" align="center">SVM</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">88.61%</td>
<td valign="top" align="center">5.26%</td>
<td valign="top" align="center">51.21%</td>
<td valign="top" align="center">22.78%</td>
<td valign="top" align="center">1.41%</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">88.96%</td>
<td valign="top" align="center">10.53%</td>
<td valign="top" align="center">53.98%</td>
<td valign="top" align="center">31.87%</td>
<td valign="top" align="center">3.52%</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">88.67%</td>
<td valign="top" align="center">5.26%</td>
<td valign="top" align="center">51.61%</td>
<td valign="top" align="center">22.86%</td>
<td valign="top" align="center">0.70%</td>
</tr>
<tr>
<td valign="top" align="center">8</td>
<td valign="top" align="center">88.08%</td>
<td valign="top" align="center">5.26%</td>
<td valign="top" align="center">48.84%</td>
<td valign="top" align="center">22.20%</td>
<td valign="top" align="center">6.34%</td>
</tr>
<tr>
<td valign="top" align="center">16</td>
<td valign="top" align="center">88.75%</td>
<td valign="top" align="center">5.26%</td>
<td valign="top" align="center">52.02%</td>
<td valign="top" align="center">22.94%</td>
<td valign="top" align="center">0%</td>
</tr>
<tr>
<td valign="top" rowspan="5" align="center">RF</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">88.96%</td>
<td valign="top" align="center">10.53%</td>
<td valign="top" align="center">53.98%</td>
<td valign="top" align="center">31.87%</td>
<td valign="top" align="center">3.52%</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">88.96%</td>
<td valign="top" align="center">10.53%</td>
<td valign="top" align="center">53.98%</td>
<td valign="top" align="center">31.87%</td>
<td valign="top" align="center">3.52%</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">88.54%</td>
<td valign="top" align="center">5.26%</td>
<td valign="top" align="center">50.84%</td>
<td valign="top" align="center">22.70%</td>
<td valign="top" align="center">2.11%</td>
</tr>
<tr>
<td valign="top" align="center">8</td>
<td valign="top" align="center">88.82%</td>
<td valign="top" align="center">10.53%</td>
<td valign="top" align="center">53.06%</td>
<td valign="top" align="center">31.63%</td>
<td valign="top" align="center">4.93%</td>
</tr>
<tr>
<td valign="top" align="center">16</td>
<td valign="top" align="center">87.86%</td>
<td valign="top" align="center">10.53%</td>
<td valign="top" align="center">48.62%</td>
<td valign="top" align="center">30.20%</td>
<td valign="top" align="center">13.38%</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_4_3">
<label>3.4.3</label>
<title>The number of GCN layers</title>
<p>Since the number of layers in GCN also has a great influence on the performance of our suicidal ideation detection model, we experimented on GCN with 1, 2, 3, and 4 layers. The results are shown in <xref ref-type="table" rid="T7">
<bold>Table&#xa0;7</bold>
</xref>. It shows that the best performance is achieved when the number of layers is 2. Such a result is also consistent with previous research showing that stacking more layers in GCN leads to worse performance, due to vanishing gradients and over-smoothing (<xref ref-type="bibr" rid="B47">47</xref>).</p>
<table-wrap id="T7" position="float">
<label>Table&#xa0;7</label>
<caption>
<p>The performance of the GCN with different number of layers.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Layer number</th>
<th valign="top" align="center">Precision<sub>0</sub>
</th>
<th valign="top" align="center">Recall<sub>1</sub>
</th>
<th valign="top" align="center">Macro-F1</th>
<th valign="top" align="center">G-mean</th>
<th valign="top" align="center">FPR</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">92.66%</td>
<td valign="top" align="center">57.89%</td>
<td valign="top" align="center">55.73%</td>
<td valign="top" align="center">64.17%</td>
<td valign="top" align="center">28.87%</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">92.68%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">60.56%</td>
<td valign="top" align="center">65.00%</td>
<td valign="top" align="center">19.72%</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">92.11%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">56.17%</td>
<td valign="top" align="center">62.38%</td>
<td valign="top" align="center">26.06%</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">91.67%</td>
<td valign="top" align="center">52.63%</td>
<td valign="top" align="center">53.49%</td>
<td valign="top" align="center">60.58%</td>
<td valign="top" align="center">30.28%</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>The Proposed GCN model exhibits stability as training data changes (RQ-5)</title>
<sec id="s3_5_1">
<label>3.5.1</label>
<title>Stability of the model with different training sizes</title>
<p>In the suicidal ideation detection task, the image vertices on the graph are divided into 645 training vertices and 161 testing vertices, and the GCN in the graph learning module is trained with training data via back-propagation. Therefore, in order to show the stability of our proposed method with different training sizes, we conducted the experiments with different sizes of training data. Keeping the 161 testing vertices unchanged, 580 (90%), 516 (80%), 451 (70%), 387 (60%), 322 (50%) training vertices are randomly selected from 645 training vertices and used to construct the image-feature semantic graph respectively. Then the GCN model is trained on these graphs separately. The results are shown in <xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8</bold>
</xref>. It is easy to find that the experiment results do not fluctuate as the number of training vertices changes, which effectively proves the stability of the model.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>The performance of the model on training sets with different sample sizes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1617650-g008.tif">
<alt-text content-type="machine-generated">Line graph comparing performance metrics against training size. Precision0 remains near 90% across all sizes. G-mean and macro-f1 stay around 60%-70%, while recall1 declines slightly. FPR starts at 25%, decreasing, then increasing slightly.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3_5_2">
<label>3.5.2</label>
<title>Stability of the model on different edge sizes</title>
<p>Considering the situation where insufficient individual expression or inaccurate automatic feature extraction leads to missing features, the semantic graph may miss some edges, i.e., the connections between a tree-drawing image and its features. Thus, it is also necessary to explore the model stability on different numbers of missing edges. To achieve this, we randomly kept edges to simulate the situation where tree features cannot be extracted. We retained 90%, 80%, 70%, 60% and 50% of the edges in the image-feature semantic graph and then performed suicidal ideation detection on the newly generated graphs; the results are shown in <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9</bold>
</xref>.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>The performance of the model with different numbers of missing edges.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1617650-g009.tif">
<alt-text content-type="machine-generated">Line chart displaying performance metrics against edge size. The x-axis shows edge size percentages from one hundred to fifty percent. The y-axis shows performance percentages from zero to one hundred percent. Lines represent precision0, recall1, macro-f1, G-mean, and FPR, with precision0 remaining high and stable, recall1 slightly declining, and FPR increasing as edge size decreases.</alt-text>
</graphic>
</fig>
<p>From the results, we can notice that when some edges are removed, the overall performance is relatively stable as the edge size decreases. Besides, macro-F1 and G-mean show a downward trend, and this trend becomes apparent when the edge size is less than 80%. It can be concluded that the absence of edges does have a slight impact on the performance of suicidal ideation detection, and this impact becomes significant when the degree of absence increases to a certain value. Such results indicate that our proposed method is still capable of detecting suicidal ideation when less than 20% of the characteristics of the tree-drawing image cannot be fully represented. Moreover, such a result once again demonstrates that automatic feature extraction should be further studied to improve the performance of the proposed method in the future.</p>
</sec>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>This study employs projective test methodologies, specifically the Tree-Drawing Test (TDT), which effectively uncovers individuals&#x2019; subconscious psychological states while minimizing susceptibility to social desirability and subjective control biases. Compared to techniques requiring high-precision equipment and technical expertise, such as electroencephalography, the TDT necessitates only paper and pencil, enabling broader implementation and lower operational costs. This study focuses on how to automatically detect individual suicidal ideation based on the TDT. Beyond machine learning and image processing techniques, we further leverage graph learning to implement automated detection from projective responses. This approach integrates psychological tree features with graph learning techniques, improving the performance of suicidal ideation detection and thereby advancing the application of the TDT in the field of mental health.</p>
<p>Next, it is worth noting that the theoretical basis of TDT is the psychoanalytic genre (<xref ref-type="bibr" rid="B48">48</xref>), which heavily relies on experts&#x2019; interpretations. To address this issue, existing research has explored various coding systems to link drawing features with specific mental states (<xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B49">49</xref>&#x2013;<xref ref-type="bibr" rid="B52">52</xref>). For instance, trunk width, trunk base opening, and branch ends size are significantly associated with schizophrenia (<xref ref-type="bibr" rid="B49">49</xref>). Canopy area, canopy height, canopy width, trunk width and total tree area are related to depressive symptoms (<xref ref-type="bibr" rid="B16">16</xref>). Roots, truncated tree, flattened crown, and bizarre tree are considered as the important predictors for mental disorders (<xref ref-type="bibr" rid="B50">50</xref>). In our ablation study, &#x201c;leaves and fruits&#x201d; demonstrates its effectiveness in detecting suicidal ideation. Generally speaking, in the projective tree-drawing test, &#x201c;leaves and fruits&#x201d; typically correspond to an individual&#x2019;s connection with their environment and personal growth and aspirations (<xref ref-type="bibr" rid="B53">53</xref>), and thus some studies have adopted &#x201c;leaves&#x201d; and &#x201c;fruit&#x201d; to predict individual depression (<xref ref-type="bibr" rid="B54">54</xref>). This is inherently consistent with our findings. This series of studies suggests that projective tests contain rich individual differences, and the relevant features are worth continuously exploring.</p>
<p>Furthermore, considering the associations among negative emotions, abnormal mental state and suicidal ideation, previous studies provide a certain basis for automatic suicidal ideation detection. However, in traditional machine learning methods that initially depend on feature recognition, the accuracy of this feature recognition process significantly impacts model performance. The current study demonstrates that employing graph learning approaches can, to a certain extent, address the issue of performance stability. This may be because graph learning allows for the modeling of complex relationships and interactions between tree-drawing images and tree features (<xref ref-type="bibr" rid="B55">55</xref>). This characteristic ensures robust stability of the model under high performance, even when the training set changes. At the same time, the unique &#x201c;image-feature&#x201d; semantic graph structure can better explain the inference of the proposed method. Moreover, graph learning models are inherently flexible and adaptable, capable of incorporating new information dynamically. When new image features are added, the graph model can naturally expand by adding new nodes, but traditional machine learning models can only be redesigned and trained (<xref ref-type="bibr" rid="B56">56</xref>, <xref ref-type="bibr" rid="B57">57</xref>). Additionally, more and more graph modeling techniques are beginning to focus on the interpretability of the model&#x2019;s decisions (<xref ref-type="bibr" rid="B38">38</xref>, <xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B58">58</xref>). Although these complex models did not yield good results on our dataset, they may become future solutions for automated analysis of projective tests as data accumulates.</p>
<p>Finally, there are also some limitations to be addressed in the future. First, regarding sample selection, this study only included 806 primary and middle school students from Shaanxi Province, resulting in a small sample size with limited geographic and age diversity. The symbolic meanings of tree drawings may vary across cultural and age groups, so the model&#x2019;s applicability in different cultural contexts requires further consideration. Second, this study adopted a cross-sectional design, capturing data at a single time point. However, suicidal ideation often exhibits dynamic development, and data from a single time point may be significantly influenced by the testing context and participants&#x2019; current psychological states. Future research should consider integrating projective tests into longitudinal designs, capturing the temporal dynamics of suicidal ideation and allowing for a more comprehensive understanding of its progression over time. Next, due to the small data size and the nature of the GCN model, this study did not conduct an in-depth analysis of the importance of each tree-drawing image feature. In future research, with the application of advanced graph models supported by a larger dataset, it is expected that we can explain the effectiveness of these features more thoroughly. Finally, the performance of automated recognition of image features in the tree-drawing test still needs improvement, to support more accurate individual suicidal ideation detection.</p>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s6" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by the Institutional Review Board of Beijing Normal University. The studies were conducted in accordance with the local legislation and institutional requirements. The ethics committee/institutional review board waived the requirement of written informed consent for participation from the participants or the participants&#x2019; legal guardians/next of kin because the study was conducted as part of a national education monitoring task, and the relevant educational systems and schools were fully informed about the research objectives and procedures.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>YL: Writing &#x2013; original draft, Funding acquisition, Formal analysis, Methodology. JZ: Methodology, Writing &#x2013; original draft. YZ: Writing &#x2013; original draft. FL: Writing &#x2013; review &amp; editing, Conceptualization, Resources. XT: Funding acquisition, Project administration, Supervision, Writing &#x2013; review &amp; editing.</p>
</sec>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work is supported by the National Natural Science Foundation of China (No. 62306118, 62207002), the Guangdong Provincial Key Laboratory of Human Digital Twin (2022B1212010004), the Fundamental Research Funds for the Central Universities (2023ZYGXZR105), and Engineering Research Center of Integration and Application of Digital Learning Technology, Ministry of Education (1411003).</p>
</sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="book">
<person-group person-group-type="author">
<collab>World Health Organization</collab>
</person-group>. <source>Adolescent and young adult health</source>. (<year>2023</year>). Available at: <uri xlink:href="https://www.who.int/news-room/fact-sheets/detail/adolescents-health-risks-and-solutions">https://www.who.int/news-room/fact-sheets/detail/adolescents-health-risks-and-solutions</uri>
</citation></ref>
<ref id="B2">
<label>2</label>
<citation citation-type="book">
<person-group person-group-type="author">
<collab>World Health Organization</collab>
</person-group>. <source>Suicide</source>. (<year>2023</year>). Available at: <uri xlink:href="https://www.who.int/news-room/fact-sheets/detail/suicide">https://www.who.int/news-room/fact-sheets/detail/suicide</uri>
</citation></ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wasserman</surname> <given-names>D</given-names>
</name>
<name>
<surname>Carli</surname> <given-names>V</given-names>
</name>
<name>
<surname>Iosue</surname> <given-names>M</given-names>
</name>
<name>
<surname>Javed</surname> <given-names>A</given-names>
</name>
<name>
<surname>Herrman</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Suicide prevention in childhood and adolescence: a narrative review of current knowledge on risk and protective factors and effectiveness of interventions</article-title>. <source>Asia-Pac Psychiatry</source>. (<year>2021</year>) <volume>13</volume>:<fpage>e12452</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/appy.12452</pub-id>, PMID: <pub-id pub-id-type="pmid">33646646</pub-id></citation></ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beck</surname> <given-names>AT</given-names>
</name>
<name>
<surname>Steer</surname> <given-names>RA</given-names>
</name>
<name>
<surname>Ranieri</surname> <given-names>WF</given-names>
</name>
</person-group>. <article-title>Scale for suicide ideation: Psychometric properties of a self-report version</article-title>. <source>J Clin Psychol</source>. (<year>1988</year>) <volume>44</volume>:<fpage>499</fpage>&#x2013;<lpage>505</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/1097-4679(198807)44:4&lt;499::AID-JCLP2270440404&gt;3.0.CO;2-6</pub-id>
</citation></ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bello</surname> <given-names>HJ</given-names>
</name>
<name>
<surname>Palomar-Ciria</surname> <given-names>N</given-names>
</name>
<name>
<surname>Baca-Garc&#xed;a</surname> <given-names>E</given-names>
</name>
<name>
<surname>Lozano</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Suicide classification for news media using convolutional neural networks</article-title>. <source>Health Commun</source>. (<year>2023</year>) <volume>38</volume>:<page-range>2178&#x2013;87</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10410236.2022.2058686</pub-id>, PMID: <pub-id pub-id-type="pmid">35532012</pub-id></citation></ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McManus</surname> <given-names>KF</given-names>
</name>
<name>
<surname>Stringer</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Corson</surname> <given-names>N</given-names>
</name>
<name>
<surname>Fodeh</surname> <given-names>S</given-names>
</name>
<name>
<surname>Steinhardt</surname> <given-names>S</given-names>
</name>
<name>
<surname>Levin</surname> <given-names>FL</given-names>
</name>
<etal/>
</person-group>. <article-title>Deploying a national clinical text processing infrastructure</article-title>. <source>J Am Med Inf Assoc</source>. (<year>2024</year>) <volume>31</volume>:<page-range>727&#x2013;31</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/jamia/ocad249</pub-id>, PMID: <pub-id pub-id-type="pmid">38146986</pub-id></citation></ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heckler</surname> <given-names>WF</given-names>
</name>
<name>
<surname>Feij&#xf3;</surname> <given-names>LP</given-names>
</name>
<name>
<surname>de Carvalho</surname> <given-names>JV</given-names>
</name>
<name>
<surname>Barbosa</surname> <given-names>JLV</given-names>
</name>
</person-group>. <article-title>Thoth: An intelligent model for assisting individuals with suicidal ideation</article-title>. <source>Expert Syst Appl</source>. (<year>2023</year>) <volume>233</volume>:<fpage>120918</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eswa.2023.120918</pub-id>
</citation></ref>
<ref id="B8">
<label>8</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Gideon</surname> <given-names>J</given-names>
</name>
<name>
<surname>Schatten</surname> <given-names>HT</given-names>
</name>
<name>
<surname>McInnis</surname> <given-names>MG</given-names>
</name>
<name>
<surname>Provost</surname> <given-names>EM</given-names>
</name>
</person-group>. <article-title>Emotion recognition from natural phone conversations in individuals with and without recent suicidal ideation</article-title>. In: <source>Interspeech</source>. <publisher-loc>Graz, Austria</publisher-loc>: <publisher-name>ISCA</publisher-name> (<year>2019</year>).</citation></ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Belouali</surname> <given-names>A</given-names>
</name>
<name>
<surname>Gupta</surname> <given-names>S</given-names>
</name>
<name>
<surname>Sourirajan</surname> <given-names>V</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>N</given-names>
</name>
<name>
<surname>Alaoui</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Acoustic and language analysis of speech for suicidal ideation among US veterans</article-title>. <source>BioData Min</source>. (<year>2021</year>) <volume>14</volume>:<fpage>1</fpage>&#x2013;<lpage>17</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13040-021-00245-y</pub-id>, PMID: <pub-id pub-id-type="pmid">33531048</pub-id></citation></ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iyer</surname> <given-names>R</given-names>
</name>
<name>
<surname>Nedeljkovic</surname> <given-names>M</given-names>
</name>
<name>
<surname>Meyer</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>Using voice biomarkers to classify suicide risk in adult telehealth callers: retrospective observational study</article-title>. <source>JMIR Ment Health</source>. (<year>2022</year>) <volume>9</volume>:<fpage>e39807</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2196/39807</pub-id>, PMID: <pub-id pub-id-type="pmid">35969444</pub-id></citation></ref>
<ref id="B11">
<label>11</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Eigbe</surname> <given-names>N</given-names>
</name>
<name>
<surname>Baltrusaitis</surname> <given-names>T</given-names>
</name>
<name>
<surname>Morency</surname> <given-names>L-P</given-names>
</name>
<name>
<surname>Pestian</surname> <given-names>J</given-names>
</name>
</person-group>. (<year>2018</year>). <article-title>Toward visual behavior markers of suicidal ideation</article-title>, in: <conf-name>2018 13th IEEE International Conference on Automatic Face &amp; Gesture Recognition (FG 2018)</conf-name>, <publisher-loc>Piscataway, NJ, USA</publisher-loc>: <publisher-name>IEEE</publisher-name>. pp. <page-range>530&#x2013;4</page-range>.</citation></ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Onie</surname> <given-names>S</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<name>
<surname>Glastonbury</surname> <given-names>K</given-names>
</name>
<name>
<surname>Hardy</surname> <given-names>RC</given-names>
</name>
<name>
<surname>Rakusin</surname> <given-names>D</given-names>
</name>
<name>
<surname>Wong</surname> <given-names>I</given-names>
</name>
<etal/>
</person-group>. <article-title>Understanding and detecting behaviours prior to a suicide attempt: A mixed-methods study</article-title>. <source>Aust New Z J Psychiatry</source>. (<year>2023</year>) <volume>57</volume>:<page-range>1016&#x2013;22</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/00048674231152159</pub-id>, PMID: <pub-id pub-id-type="pmid">36715024</pub-id></citation></ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Prasad</surname> <given-names>DK</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>S-HA</given-names>
</name>
<name>
<surname>Quek</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Sentiment analysis using EEG activities for suicidology</article-title>. <source>Expert Syst Appl</source>. (<year>2018</year>) <volume>103</volume>:<page-range>206&#x2013;17</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eswa.2018.03.011</pub-id>
</citation></ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hasey</surname> <given-names>G</given-names>
</name>
<name>
<surname>Colic</surname> <given-names>S</given-names>
</name>
<name>
<surname>Reilly</surname> <given-names>J</given-names>
</name>
<name>
<surname>MacCrimmon</surname> <given-names>D</given-names>
</name>
<name>
<surname>Khodayari</surname> <given-names>A</given-names>
</name>
<name>
<surname>DeBruin</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Detection of suicidal ideation in depressed subjects using resting electroencephalography features identified by machine learning algorithms</article-title>. <source>Biol Psychiatry</source>. (<year>2020</year>) <volume>87</volume>:<page-range>S380&#x2013;1</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.biopsych.2020.02.974</pub-id>
</citation></ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dai</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>X</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>S</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>R</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>Gradually evaluating of suicidal risk in depression by semi-supervised cluster analysis on resting-state fMRI</article-title>. <source>Brain Imaging Behav</source>. (<year>2021</year>) <volume>15</volume>:<page-range>2149&#x2013;58</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11682-020-00410-7</pub-id>, PMID: <pub-id pub-id-type="pmid">33151465</pub-id></citation></ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>F</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>R</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>Screening depressive disorders with tree-drawing test</article-title>. <source>Front Psychol</source>. (<year>2020</year>) <volume>11</volume>:<elocation-id>1446</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpsyg.2020.01446</pub-id>, PMID: <pub-id pub-id-type="pmid">32670166</pub-id></citation></ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Morris</surname> <given-names>MB</given-names>
</name>
</person-group>. <article-title>The diagnostic drawing series and the tree rating scale: An isomorphic representation of multiple personality disorder, major depression, and schizophrenia populations</article-title>. <source>Art Ther</source>. (<year>1995</year>) <volume>12</volume>:<page-range>118&#x2013;28</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/07421656.1995.10759142</pub-id>
</citation></ref>
<ref id="B18">
<label>18</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Anica</surname> <given-names>PF</given-names>
</name>
<name>
<surname>Lucian</surname> <given-names>CV</given-names>
</name>
</person-group>. <article-title>Image processing techniques, interpretation of parameters and psychological significance by the tree-drawing test</article-title>. In: <source>International Conference &#x201c;SUPERVISION IN PSYCHOTHERAPY&#x201d; 2nd edition</source>. <publisher-loc>Timisoara, Romania</publisher-loc>: <publisher-name>IPCS</publisher-name> (<year>2019</year>).</citation></ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anica</surname> <given-names>F</given-names>
</name>
<name>
<surname>Lucian</surname> <given-names>CV</given-names>
</name>
</person-group>. <article-title>Automatic image processing of tree drawings for psychological tests</article-title>. <source>Int Conf Legal Med Cluj</source>. (<year>2020</year>) <volume>2</volume>:<page-range>166&#x2013;71</page-range>.</citation></ref>
<ref id="B20">
<label>20</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Maliki</surname> <given-names>I</given-names>
</name>
<name>
<surname>Firmansyah</surname> <given-names>AR</given-names>
</name>
</person-group>. (<year>2023</year>). <article-title>Personality detection based on tree drawing using convolutional neural network</article-title>, in: <conf-name>2023 International Conference on Informatics Engineering, Science &amp; Technology (INCITEST)</conf-name>, <publisher-loc>Piscataway, NJ, USA</publisher-loc>: <publisher-name>IEEE</publisher-name>. pp. <fpage>1</fpage>&#x2013;<lpage>6</lpage>.</citation></ref>
<ref id="B21">
<label>21</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Nunnally</surname> <given-names>J</given-names>
</name>
</person-group>. <source>Psychometric Theory 3E. McGraw-Hill series in psychology</source>. <publisher-loc>New York, USA</publisher-loc>: <publisher-name>Tata McGraw-Hill Education</publisher-name> (<year>1994</year>).</citation></ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cronbach</surname> <given-names>LJ</given-names>
</name>
</person-group>. <article-title>Coefficient alpha and the internal structure of tests</article-title>. <source>Psychometrika</source>. (<year>1951</year>) <volume>16</volume>:<fpage>297</fpage>&#x2013;<lpage>334</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF02310555</pub-id>
</citation></ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reynolds</surname> <given-names>CR</given-names>
</name>
</person-group>. <article-title>Behavior assessment system for children</article-title>. <source>Corsini Encyclopedia Psychol</source>. (<year>2010</year>), <fpage>1</fpage>&#x2013;<lpage>2</lpage>.</citation></ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tian</surname> <given-names>X</given-names>
</name>
<name>
<surname>Jing</surname> <given-names>L</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>F</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Shyness trait recognition for schoolchildren via multi-view features of online writing</article-title>. <source>IEEE Trans Affect Comput</source>. (<year>2023</year>) <volume>14</volume>:<page-range>509&#x2013;22</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TAFFC.2021.3077410</pub-id>
</citation></ref>
<ref id="B25">
<label>25</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>T</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H</given-names>
</name>
</person-group>. <source>
<italic>Uncover the secrets of your personality: House-Tree-Person Drawing Test</italic></source>. <publisher-name>China Federation of Literary and Art Circles Publishing Corporation</publisher-name> (<year>2007</year>).</citation></ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sorge</surname> <given-names>A</given-names>
</name>
<name>
<surname>Saita</surname> <given-names>E</given-names>
</name>
</person-group>. <article-title>Assessment of suicide and self-harm risk in foreign offenders. evaluating the use of tree-drawing test</article-title>. <source>Mediterr J Clin Psychol</source>. (<year>2021</year>) <volume>9</volume>:<fpage>1</fpage>&#x2013;<lpage>18</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.13129/2282-1619/mjcp-3024</pub-id>
</citation></ref>
<ref id="B27">
<label>27</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Xiong</surname> <given-names>D</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>R</given-names>
</name>
<name>
<surname>Ge</surname> <given-names>H</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>R</given-names>
</name>
<name>
<surname>Li</surname> <given-names>L</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>). <article-title>Development and efficiency research of distressed mood and suicide risk test system with house-tree-person (HTP) drawing</article-title>, in: <conf-name>International Conference on Man-Machine-Environment System Engineering</conf-name>, <publisher-loc>Berlin, Germany</publisher-loc>: <publisher-name>Springer</publisher-name>. pp. <page-range>259&#x2013;64</page-range>.</citation></ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>G</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Sheng</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Association of synthetic house-tree-person drawing test and depression in cancer patients</article-title>. <source>BioMed Res Int</source>. (<year>2019</year>) <volume>2019</volume>:<elocation-id>1478634</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2019/1478634</pub-id>, PMID: <pub-id pub-id-type="pmid">31467869</pub-id></citation></ref>
<ref id="B29">
<label>29</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hosmer</surname> <given-names>DW</given-names>
<suffix>Jr.</suffix>
</name>
<name>
<surname>Lemeshow</surname> <given-names>S</given-names>
</name>
<name>
<surname>Sturdivant</surname> <given-names>RX</given-names>
</name>
</person-group>. <source>Applied Logistic Regression</source>. (<year>2013</year>). <publisher-loc>Hoboken, NJ, USA</publisher-loc>: <publisher-name>John Wiley &amp; Sons</publisher-name>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/9781118548387</pub-id>
</citation></ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Quinlan</surname> <given-names>JR</given-names>
</name>
</person-group>. <article-title>Induction of decision trees</article-title>. <source>Mach Learn</source>. (<year>1986</year>) <volume>1</volume>:<fpage>81</fpage>&#x2013;<lpage>106</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF00116251</pub-id>
</citation></ref>
<ref id="B31">
<label>31</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Sch&#xf6;lkopf</surname> <given-names>B</given-names>
</name>
<name>
<surname>Smola</surname> <given-names>AJ</given-names>
</name>
</person-group>. <source>Learning with kernels: support vector machines, regularization, optimization, and beyond</source>. <publisher-loc>Cambridge, Massachusetts, USA</publisher-loc>: <publisher-name>MIT press</publisher-name> (<year>2002</year>).</citation></ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Random forests</article-title>. <source>Mach Learn</source>. (<year>2001</year>) <volume>45</volume>:<fpage>5</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
</citation></ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krizhevsky</surname> <given-names>A</given-names>
</name>
<name>
<surname>Sutskever</surname> <given-names>I</given-names>
</name>
<name>
<surname>Hinton</surname> <given-names>GE</given-names>
</name>
</person-group>. <article-title>ImageNet classification with deep convolutional neural networks</article-title>. <source>Adv Neural Inf Process Syst</source>. (<year>2012</year>) <volume>25</volume>:<page-range>1097&#x2013;105</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1145/3065386</pub-id>
</citation></ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Simonyan</surname> <given-names>K</given-names>
</name>
<name>
<surname>Zisserman</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Very deep convolutional networks for large-scale image recognition</article-title>. <source>arXiv preprint arXiv:1409.1556</source>. (<year>2014</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arXiv.1409.1556</pub-id>
</citation></ref>
<ref id="B35">
<label>35</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Szegedy</surname> <given-names>C</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>W</given-names>
</name>
<name>
<surname>Jia</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Sermanet</surname> <given-names>P</given-names>
</name>
<name>
<surname>Reed</surname> <given-names>S</given-names>
</name>
<name>
<surname>Anguelov</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Going deeper with convolutions</article-title>, in: <conf-name>Proceedings of the IEEE conference on computer vision and pattern recognition</conf-name>, <publisher-loc>Piscataway, NJ, USA</publisher-loc>: <publisher-name>IEEE</publisher-name>. pp. <fpage>1</fpage>&#x2013;<lpage>9</lpage>.</citation></ref>
<ref id="B36">
<label>36</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>He</surname> <given-names>K</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Ren</surname> <given-names>S</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>J</given-names>
</name>
</person-group>. (<year>2016</year>). <article-title>Deep residual learning for image recognition</article-title>, in: <conf-name>Proceedings of the IEEE conference on computer vision and pattern recognition</conf-name>, <publisher-loc>Piscataway, NJ, USA</publisher-loc>: <publisher-name>IEEE</publisher-name>. pp. <page-range>770&#x2013;8</page-range>.</citation></ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Veli&#x10d;kovi&#x107;</surname> <given-names>P</given-names>
</name>
<name>
<surname>Cucurull</surname> <given-names>G</given-names>
</name>
<name>
<surname>Casanova</surname> <given-names>A</given-names>
</name>
<name>
<surname>Romero</surname> <given-names>A</given-names>
</name>
<name>
<surname>Lio</surname> <given-names>P</given-names>
</name>
<name>
<surname>Bengio</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>Graph attention networks</article-title>. <source>arXiv preprint arXiv:1710.10903</source>. (<year>2017</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arXiv.1710.10903</pub-id>
</citation></ref>
<ref id="B38">
<label>38</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Ji</surname> <given-names>H</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>C</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>B</given-names>
</name>
<name>
<surname>Ye</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Cui</surname> <given-names>P</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Heterogeneous graph attention network</article-title>, in: <conf-name>The world wide web conference</conf-name>, <publisher-loc>New York, NY, USA</publisher-loc>: <publisher-name>ACM</publisher-name>. pp. <page-range>2022&#x2013;32</page-range>.</citation></ref>
<ref id="B39">
<label>39</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Lv</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>M</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>W</given-names>
</name>
<name>
<surname>He</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Are we really making much progress? revisiting, benchmarking and refining heterogeneous graph neural networks</article-title>, in: <conf-name>Proceedings of the 27th ACM SIGKDD conference on knowledge discovery &amp; data mining</conf-name>, <publisher-loc>New York, NY, USA</publisher-loc>: <publisher-name>ACM</publisher-name>. pp. <page-range>1150&#x2013;60</page-range>.</citation></ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhatti</surname> <given-names>UA</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>G</given-names>
</name>
<name>
<surname>Marjan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Hussain</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Deep learning with graph convolutional networks: An overview and latest applications in computational intelligence</article-title>. <source>Int J Intelligent Syst</source>. (<year>2023</year>) <volume>2023</volume>:<fpage>8342104</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2023/8342104</pub-id>
</citation></ref>
<ref id="B41">
<label>41</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Grover</surname> <given-names>A</given-names>
</name>
<name>
<surname>Leskovec</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>node2vec: Scalable feature learning for networks</article-title>. In: <source>Proceedings of the 22nd ACM SIGKDD international conference on Knowledge discovery and data mining</source> (<year>2016</year>). p. <page-range>855&#x2013;64</page-range>.</citation></ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mikolov</surname> <given-names>T</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>K</given-names>
</name>
<name>
<surname>Corrado</surname> <given-names>G</given-names>
</name>
<name>
<surname>Dean</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Efficient estimation of word representations in vector space</article-title>. <source>arXiv preprint arXiv:1301.3781</source>. (<year>2013</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arXiv.1301.3781</pub-id>
</citation></ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kipf</surname> <given-names>TN</given-names>
</name>
<name>
<surname>Welling</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Semi-supervised classification with graph convolutional networks</article-title>. <source>arXiv preprint arXiv:1609.02907</source>. (<year>2016</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arXiv.1609.02907</pub-id>
</citation></ref>
<ref id="B44">
<label>44</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Sokolova</surname> <given-names>M</given-names>
</name>
<name>
<surname>Japkowicz</surname> <given-names>N</given-names>
</name>
<name>
<surname>Szpakowicz</surname> <given-names>S</given-names>
</name>
</person-group>. (<year>2006</year>). <article-title>Beyond accuracy, F-score and ROC: a family of discriminant measures for performance evaluation</article-title>, in: <conf-name>Australasian joint conference on artificial intelligence</conf-name>, <publisher-loc>Berlin, Germany</publisher-loc>: <publisher-name>Springer</publisher-name>. pp. <page-range>1015&#x2013;21</page-range>.</citation></ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ting</surname> <given-names>KM</given-names>
</name>
</person-group>. <article-title>An instance-weighting method to induce cost-sensitive trees</article-title>. <source>IEEE Trans Knowledge Data Eng</source>. (<year>2002</year>) <volume>14</volume>:<page-range>659&#x2013;65</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TKDE.2002.1000348</pub-id>
</citation></ref>
<ref id="B46">
<label>46</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Guo</surname> <given-names>H</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>B</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>T</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>R</given-names>
</name>
<name>
<surname>Fan</surname> <given-names>H</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>Tree imagery in drawing tests for screening mental disorders: A systematic review and meta-analysis</article-title>. In: <source>Research Square</source> (<year>2024</year>). preprint.</citation></ref>
<ref id="B47">
<label>47</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Han</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>X-M</given-names>
</name>
</person-group>. (<year>2018</year>). <article-title>Deeper insights into graph convolutional networks for semi-supervised learning</article-title>, in: <conf-name>Proceedings of the AAAI conference on artificial intelligence</conf-name>.</citation></ref>
<ref id="B48">
<label>48</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Pan</surname> <given-names>T</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>X</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>B</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>W</given-names>
</name>
</person-group>. (<year>2022</year>). <article-title>Automated drawing psychoanalysis via house-tree-person test</article-title>, in: <conf-name>2022 IEEE 34th International Conference on Tools with Artificial Intelligence (ICTAI)</conf-name>, <publisher-loc>Piscataway, NJ, USA</publisher-loc>: <publisher-name>IEEE</publisher-name>. pp. <page-range>1120&#x2013;5</page-range>.</citation></ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kaneda</surname> <given-names>A</given-names>
</name>
<name>
<surname>Yasui-Furukori</surname> <given-names>N</given-names>
</name>
<name>
<surname>Saito</surname> <given-names>M</given-names>
</name>
<name>
<surname>Sugawara</surname> <given-names>N</given-names>
</name>
<name>
<surname>Nakagami</surname> <given-names>T</given-names>
</name>
<name>
<surname>Furukori</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Characteristics of the tree-drawing test in chronic schizophrenia</article-title>. <source>Psychiatry Clin Neurosci</source>. (<year>2010</year>) <volume>64</volume>:<page-range>141&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1440-1819.2010.02071.x</pub-id>, PMID: <pub-id pub-id-type="pmid">20447010</pub-id></citation></ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname> <given-names>H</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>B</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Fan</surname> <given-names>H</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>Analysis of the screening and predicting characteristics of the house-tree-person drawing test for mental disorders: A systematic review and meta-analysis</article-title>. <source>Front Psychiatry</source>. (<year>2023</year>) <volume>13</volume>:<elocation-id>1041770</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpsyt.2022.1041770</pub-id>, PMID: <pub-id pub-id-type="pmid">36683989</pub-id></citation></ref>
<ref id="B51">
<label>51</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stanzani Maserati</surname> <given-names>M</given-names>
</name>
<name>
<surname>Matacena</surname> <given-names>C</given-names>
</name>
<name>
<surname>Sambati</surname> <given-names>L</given-names>
</name>
<name>
<surname>Oppi</surname> <given-names>F</given-names>
</name>
<name>
<surname>Poda</surname> <given-names>R</given-names>
</name>
<name>
<surname>De Matteis</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>The tree-drawing test (Koch&#x2019;s Baum test): a useful aid to diagnose cognitive impairment</article-title>. <source>Behav Neurol</source>. (<year>2015</year>) <volume>2015</volume>:<elocation-id>534681</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2015/534681</pub-id>, PMID: <pub-id pub-id-type="pmid">26175548</pub-id></citation></ref>
<ref id="B52">
<label>52</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>G</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Qin</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Characteristics of house-tree-person drawing test in junior high school students with depressive symptoms</article-title>. <source>Clin Child Psychol Psychiatry</source>. (<year>2023</year>) <volume>28</volume>:<page-range>1623&#x2013;34</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/13591045221129706</pub-id>, PMID: <pub-id pub-id-type="pmid">36154491</pub-id></citation></ref>
<ref id="B53">
<label>53</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Koch</surname> <given-names>C</given-names>
</name>
</person-group>. <source>The Tree Test; the tree-drawing test as an aid in psychodiagnosis</source>. <publisher-loc>New York, USA</publisher-loc>: <publisher-name>Grune &amp; Stratton</publisher-name> (<year>1952</year>).</citation></ref>
<ref id="B54">
<label>54</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>J-d</given-names>
</name>
</person-group>. <article-title>Application of projective tree drawing test in adolescents with depression</article-title>. <source>Chin J Clin Psychol</source>. (<year>2012</year>) <volume>20</volume>:<page-range>185&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.16128/j.cnki.1005-3611.2012.02.041</pub-id>
</citation></ref>
<ref id="B55">
<label>55</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xia</surname> <given-names>F</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>K</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Aziz</surname> <given-names>A</given-names>
</name>
<name>
<surname>Wan</surname> <given-names>L</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Graph learning: A survey</article-title>. <source>IEEE Trans Artif Intell</source>. (<year>2021</year>) <volume>2</volume>:<page-range>109&#x2013;27</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TAI.2021.3076021</pub-id>
</citation></ref>
<ref id="B56">
<label>56</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Tong</surname> <given-names>H</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Maciejewski</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>Graph convolutional networks: a comprehensive review</article-title>. <source>Comput Soc Networks</source>. (<year>2019</year>) <volume>6</volume>:<fpage>1</fpage>&#x2013;<lpage>23</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s40649-019-0069-y</pub-id>, PMID: <pub-id pub-id-type="pmid">37915858</pub-id></citation></ref>
<ref id="B57">
<label>57</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Gao</surname> <given-names>H</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Ji</surname> <given-names>S</given-names>
</name>
</person-group>. (<year>2018</year>). <article-title>Large-scale learnable graph convolutional networks</article-title>, in: <conf-name>Proceedings of the 24th ACM SIGKDD international conference on knowledge discovery &amp; data mining</conf-name>, <publisher-loc>New York, NY, USA</publisher-loc>: <publisher-name>ACM</publisher-name>. pp. <page-range>1416&#x2013;24</page-range>.</citation></ref>
<ref id="B58">
<label>58</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>He</surname> <given-names>X</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>M</given-names>
</name>
<name>
<surname>Chua</surname> <given-names>T-S</given-names>
</name>
</person-group>. (<year>2019</year>). <article-title>KGAT: Knowledge graph attention network for recommendation</article-title>, in: <conf-name>Proceedings of the 25th ACM SIGKDD international conference on knowledge discovery &amp; data mining</conf-name>, <publisher-loc>New York, NY, USA</publisher-loc>: <publisher-name>ACM</publisher-name>. pp. <page-range>950&#x2013;8</page-range>.</citation></ref>
</ref-list>
</back>
</article>