<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" dtd-version="1.3" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Artif. Intell.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Artificial Intelligence</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Artif. Intell.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2624-8212</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/frai.2026.1662264</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Machine learning strategies for predicting pediatric suicidal behaviors in a Brazilian emergency setting</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Carvalho</surname> <given-names>Isis F.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Couto da Silva</surname> <given-names>Ana Paula</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Lacerda</surname> <given-names>Anisio M.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Meira</surname> <given-names>Wagner</given-names> <suffix>Jr.</suffix></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/1491180"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Bastos Bispo Ferreira</surname> <given-names>Danilo</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/3093547"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Malloy Diniz</surname> <given-names>Lys</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Serpa</surname> <given-names>Alexandre Luiz de Oliveira</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/55574"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Machado</surname> <given-names>Maria Carolina Lobato</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/3327304"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Romano-Silva</surname> <given-names>Marco A.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Miranda</surname> <given-names>Debora Marques de</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/60764"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Pappa</surname> <given-names>Gisele Lobo</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/3292988"/>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Departamento de Ci&#x000EA;ncia da Computa&#x000E7;&#x000E3;o</institution>, <institution>Universidade Federal de Minas Gerais</institution>, <city>Belo Horizonte</city>, <state>MG</state>, <country country="br">Brazil</country></aff>
<aff id="aff2"><label>2</label><institution>Faculdade de Medicina</institution>, <institution>Universidade Federal de Minas Gerais</institution>, <city>Belo Horizonte</city>, <state>MG</state>, <country country="br">Brazil</country></aff>
<aff id="aff3"><label>3</label><institution>PPG em Ci&#x000EA;ncias do Desenvolvimento Humano</institution>, <institution>Universidade Presbiteriana Mackenzie</institution>, <city>S&#x000E3;o Paulo</city>, <state>SP</state>, <country country="br">Brazil</country></aff>
<aff id="aff4"><label>4</label><institution>Shanghai Mental Health Centre</institution>, <city>Shanghai</city>, <country country="cn">China</country></aff>
<aff id="aff5"><label>5</label><institution>Centro de Tecnologia e Medicina Molecular</institution>, <institution>Faculdade de Medicina</institution>, <institution>Universidade Federal de Minas Gerais</institution>, <city>Belo Horizonte</city>, <state>MG</state>, <country country="br">Brazil</country></aff>
<author-notes>
<corresp id="c001"><label>&#x0002A;</label>Correspondence: Debora Marques de Miranda, <email xlink:href="mailto:debora.m.miranda@gmail.com">debora.m.miranda@gmail.com</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-18">
<day>18</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>9</volume>
<elocation-id>1662264</elocation-id>
<history>
<date date-type="received">
<day>08</day>
<month>07</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>03</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>16</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2026 Carvalho, Couto da Silva, Lacerda, Meira, Bastos Bispo Ferreira, Malloy Diniz, Serpa, Machado, Romano-Silva, Miranda and Pappa.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Carvalho, Couto da Silva, Lacerda, Meira, Bastos Bispo Ferreira, Malloy Diniz, Serpa, Machado, Romano-Silva, Miranda and Pappa</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-18">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Suicide is a leading cause of death worldwide, yet its prediction remains a challenge. This difficulty arises not only because suicidal behavior is a rare event in the general population, leading to significant class imbalance in datasets, but also due to its complex, multi-causal nature involving a non-linear interplay of sociodemographic and clinical factors. Furthermore, while the majority of suicides occur in middle-income countries, there is a lack of predictive models tailored to these specific social contexts. This study evaluates machine learning strategies in an enriched clinical setting: a pediatric psychiatric emergency center in Brazil.</p></sec>
<sec>
<title>Methods</title>
<p>We analyzed a comprehensive database of 2,365 youth seeking emergency care. We benchmarked three machine learning algorithms, namely Logistic Regression, Random Forest, and XGBoost, to predict three outcomes: self-harm, suicidal ideation, and suicide attempts. To address class imbalance, we applied oversampling techniques to the training data. We also used SHapley Additive exPlanations (SHAP) values to quantify each feature&#x00027;s contribution to the predictions.</p></sec>
<sec>
<title>Findings and interpretation</title>
<p>In this setting, suicide-related behaviors represented 28.7% of the clinical demand. The Random Forest model combined with oversampling was the most effective strategy, achieving sensitivities of 78.04% for suicidal ideation, 71.18% for suicide attempts, and 69.37% for self-harm. Specificity remained consistently above 75%. SHAP value analysis revealed that social determinants were critical predictors, highlighting that social conditions in middle-income populations introduce unique variables that significantly influence suicidal risk. While accuracy for suicide attempts remained a challenge, SHAP provided clear clinical insights into the drivers of risk.</p></sec>
<sec>
<title>Conclusions</title>
<p>Machine learning, specifically Random Forest models together with oversampling and SHAP, demonstrates strong potential for identifying suicidal risk in pediatric emergency settings. By integrating clinical data with social determinants, these models provide a transparent and scalable strategy for early identification in regions with limited specialized psychiatric resources.</p></sec></abstract>
<kwd-group>
<kwd>adolescents</kwd>
<kwd>children</kwd>
<kwd>prediction</kwd>
<kwd>risk features</kwd>
<kwd>self-harm</kwd>
<kwd>suicide attempt</kwd>
<kwd>suicide ideation</kwd>
</kwd-group>
<funding-group>
<award-group id="gs1">
 <funding-source id="sp1">
 <institution-wrap>
 <institution>Funda&#x000E7;&#x000E3;o de Amparo &#x000E0; Pesquisa do Estado de S&#x000E3;o Paulo</institution>
 <institution-id institution-id-type="doi" vocab="open-funder-registry" vocab-identifier="10.13039/open_funder_registry">10.13039/501100001807</institution-id>
 </institution-wrap>
 </funding-source>
</award-group>
<award-group id="gs2">
 <funding-source id="sp2">
 <institution-wrap>
 <institution>Conselho Nacional de Desenvolvimento Cient&#x000ED;fico e Tecnol&#x000F3;gico</institution>
 <institution-id institution-id-type="doi" vocab="open-funder-registry" vocab-identifier="10.13039/open_funder_registry">10.13039/501100003593</institution-id>
 </institution-wrap>
 </funding-source>
</award-group>
 <funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This study was financed with resources from the National Institute for Science and Technology (INCT NeurotechR), CAPES, and the Centre for Innovation and Artificial Intelligence for Health (CI-IA Sa&#x000FA;de), in part with resources from the S&#x000E3;o Paulo State Research Support Foundation (FAPESP) Process No. 2020/09866-4, from the Minas Gerais Research Support Foundation (FAPEMIG) Process No. PPE-00030-21, and from UNIMED Belo Horizonte and CNPq.</funding-statement>
</funding-group>
<counts>
<fig-count count="5"/>
<table-count count="5"/>
<equation-count count="0"/>
<ref-count count="36"/>
<page-count count="10"/>
<word-count count="7764"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Medicine and Public Health</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<label>1</label>
<title>Introduction</title>
<p>Suicide claims a life every 40 s globally, and each loss impacts 60&#x02013;135 people (<xref ref-type="bibr" rid="B12">Knipe et al., 2022</xref>). In 2020, a meta-analysis reported a suicide rate of 4.9/100,000 and a pooled rate of 17% for suicidal ideation among adolescents (<xref ref-type="bibr" rid="B2">Bersia et al., 2022</xref>). In developed countries, suicide stands as the foremost cause of death among children and adolescents (<xref ref-type="bibr" rid="B12">Knipe et al., 2022</xref>). The often underestimated burden of suicide and related behaviors weighs heavily on low- and middle-income countries (LMICs) (<xref ref-type="bibr" rid="B12">Knipe et al., 2022</xref>; <xref ref-type="bibr" rid="B20">Naghavi, 2019</xref>), which account for 75% of suicides worldwide. Hence, efforts to understand this phenomenon in these nations remain necessary, as few studies have examined them (<xref ref-type="bibr" rid="B11">Klonsky et al., 2016</xref>; <xref ref-type="bibr" rid="B27">Robinson et al., 2018</xref>). The differences in suicide rates in LMICs are mainly attributed to economic, social and cultural features, such as access to social support systems or mental health care (<xref ref-type="bibr" rid="B18">Miladinov, 2023</xref>).</p>
<p>Self-harm occurs 20 times more frequently than suicide and often precedes suicide attempts (<xref ref-type="bibr" rid="B16">Mars et al., 2019a</xref>). Both engaging in self-harm and being exposed to it are prominent predictors of suicide attempts (<xref ref-type="bibr" rid="B16">Mars et al., 2019a</xref>). In LMICs, the incidence of suicide planning and attempts among adolescents, especially girls aged 15&#x02013;17, is approximately 17% (<xref ref-type="bibr" rid="B30">Uddin et al., 2019</xref>). Given the profound individual, societal and household impact of child and adolescent deaths, it is imperative to investigate the factors leading to this condition.</p>
<p>Multiple machine learning (ML) models have been proposed to predict suicide (<xref ref-type="bibr" rid="B8">Harris et al., 2019a</xref>). However, predicting suicide is a challenge even for proficient psychiatrists and mental health specialists. Understanding the interplay between social and environmental factors and mental health is crucial, as social factors often contribute to risk (<xref ref-type="bibr" rid="B27">Robinson et al., 2018</xref>; <xref ref-type="bibr" rid="B25">Pollock, 2019</xref>; <xref ref-type="bibr" rid="B21">Navarro et al., 2021</xref>). This holds particular significance in countries such as Brazil, where inequality and social shortcomings can exacerbate psychiatric risks (<xref ref-type="bibr" rid="B7">Glenn et al., 2020</xref>; <xref ref-type="bibr" rid="B22">Orellana et al., 2020</xref>).</p>
<p>Robust predictors for suicide-related behaviors offer a pathway to intervene in individuals&#x00027; behavior or monitor specific variables. <xref ref-type="bibr" rid="B8">Harris et al. (2019a)</xref> conducted a systematic review of risk assessment tools for predicting adolescent suicide (<xref ref-type="bibr" rid="B9">Harris et al., 2019b</xref>). They evaluated ten risk assessment tools used in the US and the UK and found that none of them could effectively predict suicidal behaviors. This reveals the complexity of the task, a matter that warrants significant attention given its widespread impact (<xref ref-type="bibr" rid="B8">Harris et al., 2019a</xref>,<xref ref-type="bibr" rid="B9">b</xref>).</p>
<p>In a population-based longitudinal study of Scottish young adults aged 18&#x02013;34 (<xref ref-type="bibr" rid="B31">van Mens et al., 2020</xref>), suicidal behaviors were predicted using traditional ML techniques; algorithms based on decision trees outperformed regular logistic regression, achieving a sensitivity of 0.47 and a specificity of 0.91 for suicide attempt prediction. When comparing short- and long-term predictions of suicide risk using longitudinal data from structured electronic health records at the Connecticut Children&#x00027;s Medical Center, <xref ref-type="bibr" rid="B29">Su et al. (2020)</xref> developed a model with a sensitivity of 0.62 and a specificity of 0.90; their model exhibited superior performance for shorter prediction windows. A model derived from a Brazilian cohort revealed a heightened risk of depression among individuals who are female, socially isolated, non-white, involved in drug use and conflicts, experiencing academic difficulties, and victims of maltreatment (<xref ref-type="bibr" rid="B22">Orellana et al., 2020</xref>).</p>
<p>Here, we propose models to predict self-harm, suicidal ideation and suicide attempts using an enriched dataset from the regional emergency unit of the Psychiatric Emergency Center for Children and Adolescents (CEPAI-FHEMIG), in Brazil. This facility provides urgent psychiatric care, primarily assisting individuals reporting depression, substance use, and symptoms of agitation and aggressiveness, as detailed in <xref ref-type="bibr" rid="B14">Lobato Machado et al. (2022)</xref>. This sample had more frequent suicidal behaviors than the general population, which may facilitate the identification of risk factors for these outcomes (<xref ref-type="bibr" rid="B27">Robinson et al., 2018</xref>).</p></sec>
<sec id="s2">
<label>2</label>
<title>Methods</title>
<sec>
<label>2.1</label>
<title>Ethics approval</title>
<p>This study was approved by the institutional review board (IRB) of the participating institution (COEP Ci&#x000EA;ncias M&#x000E9;dicas). All procedures followed the ethical standards for human subjects research, and a waiver of informed consent was granted due to the retrospective design, in accordance with national regulations. The original data are subject to the rules governing medical record storage: records may be retrieved only for patient benefit and must be safely stored for 20 years. Data was anonymized by removing names, addresses, document IDs, and other sensitive information. We report only aggregated patient statistics to avoid any risk of reidentification.</p></sec>
<sec>
<label>2.2</label>
<title>Dataset</title>
<p>We conducted a retrospective observational study with children and adolescents receiving emergency psychiatric care. The dataset comprises 2,365 health records of patients admitted to CEPAI-FHEMIG, some with multiple admissions, resulting in 1,720 unique patients (<xref ref-type="bibr" rid="B14">Lobato Machado et al., 2022</xref>). The data was collected from June 2017 to May 2018, and the subjects&#x00027; ages range from 1 to 18 years. The dataset includes 27 sociodemographic features, such as race, gender, place of birth, household geographical location, school situation, living situation, and 123 clinical features, encompassing details such as reasons for seeking psychiatric assistance, family history of mental disorders, substance abuse information, psychiatric diagnoses received after treatment at the facility, neuro-psychomotor development delays, and previous traumatic events, among other relevant aspects.</p>
<p>We excluded 75 admissions where patients: (i) had no information at all (5); (ii) had only personal information (37); (iii) had no information about the motivations for looking for help or diagnoses (31); (iv) had not completed the screening stages at the center (1); or (v) had missing age information (1). Regarding the features, 12 of 110 contained textual information (e.g., a written reason for the patient leaving school). On average, more than 87% of the data in these 12 features were missing, and therefore these features were discarded. The original dataset also contained 21 features related to suicidal behaviors, which were, unfortunately, mostly missing (more than 80% of instances were missing) and were therefore excluded due to the high risk of data imputation in this context.</p>
<p>With the assistance of psychiatry professionals, out of the remaining 77 features, 57 were considered more informative for the tasks at hand. From the selected features, 33 were categorical. These categorical features were binarized, yielding 21 new binary features (e.g., whether the patient had depression, schizophrenia, or learning difficulties). The final dataset had 2,289 admissions for 1,687 unique patients (1,071 male and 616 female), with each admission described by 154 features.</p>
<p>Three target values&#x02014;self-harm, suicidal ideation, and suicide attempt&#x02014;were extracted from the patient&#x00027;s motivation for seeking help and served as the prediction targets. In this scenario, we had 337 out of 2,291 cases of self-harm (14.71%), 309 cases of suicide ideation (13.48%) and 323 positive suicide attempts (14.09%).</p>
<p>Self-harm was operationally defined as any non-suicidal manifestation of self-poisoning or self-injury lacking the explicit intent to induce mortality. Suicide ideation was identified in instances where individuals self-reported contemplation or strategic planning associated with suicidal tendencies. Concurrently, a suicide attempt was characterized as a deliberate act of self-poisoning or self-injury with the explicit aim of inducing mortality.</p></sec>
<sec>
<label>2.3</label>
<title>Methodology</title>
<p>To build prediction models for all outcomes, the classic methodology for handling data was followed. The first step was data preparation, as reported in the previous section. Next, the prepared datasets were used to train ML models, and oversampling was used to address class imbalance. As one of our main objectives is to interpret the contribution of each predictor to the model&#x00027;s decisions, we also employed SHapley Additive exPlanations (SHAP) (<xref ref-type="bibr" rid="B15">Lundberg and Lee, 2017</xref>) to understand predictions better. Each of these steps is detailed next.</p>
<p>The three ML models used in our experiments were Logistic Regression (LR), Random Forest (RF), and eXtreme Gradient Boosting (XGB) (<xref ref-type="bibr" rid="B36">Zaki and Meira, 2014</xref>). LR was chosen for its interpretability, whereas RF and XGB, as tree-based models, excel at capturing non-linear relationships and may facilitate the emergence of interpretable models. The experiments were conducted using the Scikit-learn (<xref ref-type="bibr" rid="B24">Pedregosa et al., 2011</xref>) and XGBoost libraries (<xref ref-type="bibr" rid="B5">Chen and Guestrin, 2016</xref>). A detailed description of these algorithms can be found in <xref ref-type="bibr" rid="B3">Bishop (2006)</xref>.</p>
<p>Given the imbalanced nature of the data, instances with suicidal behaviors were oversampled to compose 30% of the training set. Oversampling is a well-known technique that alters the data distribution in the training set to improve predictive performance by increasing the number of instances of the rarer class.</p>
<p>The models were trained on two distinct feature sets. The first set incorporates all available features and is denoted as &#x0201C;All Features&#x0201D; in the results table. The second set, referred to as &#x0201C;Feature Selection,&#x0201D; was generated using pre-selected features based on expert knowledge of the specialist who curated the dataset. It comprises features such as motivations for seeking help, diagnoses during medical hospitalization, whether it is the first-time admission to CEPAI-FHEMIG, and personal data, including gender, age, and the number of people in the household. We are aware that this type of selection can bias the model, and, for that reason, experiments with the full set of available features were also performed, and their results were compared with those obtained using only the features selected by the specialist.</p>
<p>During model training, the target variable of each task was excluded from its set of predictors. Considering the relationship between suicide ideation and suicide attempt, ideation was used as a predictor for suicide attempt. However, suicide attempt was removed from the data used for suicide ideation prediction. For the self-harm prediction task, both suicidal ideation and suicide attempts were used as predictors, in line with previous research (<xref ref-type="bibr" rid="B17">Mars et al., 2019b</xref>).</p>
<p>Each generated model provided feature importance scores for the predictors, enabling us to compare the most significant features across classification tasks. Additionally, SHAP values were generated (<xref ref-type="bibr" rid="B15">Lundberg and Lee, 2017</xref>). SHAP is an approach rooted in game theory and frequently used to explain the output of ML models. It reveals the extent to which each feature contributes to the target feature. The interpretation of SHAP is akin to feature importance, but SHAP goes further by indicating whether each feature has a positive or negative relationship with the predicted value. This provides a richer understanding of feature impact, enabling us to identify the most influential predictors associated with increased risk of suicide-related behaviors.</p></sec>
<sec>
<label>2.4</label>
<title>Experimental setup</title>
<p>To assess model performance, we used a stratified 10-fold cross-validation strategy, following the methodology detailed in <xref ref-type="bibr" rid="B3">Bishop (2006)</xref>. To prevent data leakage, we employed patient-level grouping: all admissions associated with a single individual were restricted to a single fold, ensuring the model was never tested on data from a patient it had already seen during training. For each iteration, the dataset was partitioned into training (eight folds), validation (one fold), and independent test sets (one fold). The validation set was used exclusively for hyperparameter optimization, whereas the test set was used only to assess model generalization. It is important to note that, in experiments using oversampling, the test set retained the original data distribution.</p>
<p>The performance of the models was assessed using four metrics:
<list list-type="order">
<list-item><p>Area under the receiver operating characteristic curve (AUC): assesses the model&#x00027;s performance across all classification thresholds of the true positive (TP) rate and false positive (FP) rate, providing a comprehensive view of the model&#x00027;s ability to discriminate between classes.</p></list-item>
<list-item><p>Positive predictive value (PPV): proportion of correctly predicted positive instances out of all predicted positive instances, offering insights into the accuracy of positive predictions.</p></list-item>
<list-item><p>Sensitivity: proportion of actual positive instances correctly identified by the classifier, indicating how well the model captures TP cases.</p></list-item>
<list-item><p>Specificity: proportion of actual negative instances correctly identified by the classifier, indicating how well the model captures true negative (TN) cases.</p></list-item>
</list></p>
<p>These metrics collectively provide a comprehensive evaluation of the model&#x00027;s performance on classification tasks. However, in the context of this paper, the sensitivity is considered more important than the other metrics, because the impact of not identifying a positive case of suicide attempt (or ideation, or self-harm) is considered more serious than misclassifying a negative case. This metric will be used to evaluate the models&#x00027; performance relative to one another.</p>
<p>Regarding hyperparameter tuning, for XGB, a grid search was performed to identify a near-optimal parameter combination. This search encompassed four parameters: (1) the number of boosting iterations, (2) the ratio of features used to train a tree, (3) the maximum tree depth, and (4) the ratio of training instances in a subsample.</p>
<p>For RF, five parameters were assessed: (1) number of trees in the forest, (2) minimum number of samples required to split an internal node, (3) maximum depth of the tree, (4) minimum number of samples required to be at a leaf node and (5) whether bootstrap samples are used when building trees. Due to the large number of possible parameter combinations, an initial random search was conducted over the hyperparameter space. Subsequently, the best values identified in this search were evaluated using a grid search to determine the best parameter configuration. <xref ref-type="table" rid="T1">Table 1</xref> presents the best parameter values found for Random Forest in the three scenarios investigated.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Best parameter configurations returned by the grid search for the Random Forest algorithm.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th valign="top" align="center" colspan="3"><bold>Model output</bold></th>
</tr>
<tr>
<th valign="top" align="left"><bold>Parameters</bold></th>
<th valign="top" align="center"><bold>Suicide attempt</bold></th>
<th valign="top" align="center"><bold>Suicide ideation</bold></th>
<th valign="top" align="center"><bold>Self-harm</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Number of trees</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">100</td>
</tr>
<tr>
<td valign="top" align="left">Max tree depth</td>
<td valign="top" align="center">None</td>
<td valign="top" align="center">None</td>
<td valign="top" align="center">None</td>
</tr>
<tr>
<td valign="top" align="left">Min. number of split samples</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">Min. number of leaf samples</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">Use of bootstrap</td>
<td valign="top" align="center">True</td>
<td valign="top" align="center">True</td>
<td valign="top" align="center">True</td>
</tr></tbody>
</table>
</table-wrap>
<p>Once the parameters for both RF and XGB models were determined, further tuning involved adjusting their classification thresholds, which determine whether an example is classified as positive or negative (default value is 0.5), using the validation set. This experiment was also performed for LR. In this scenario, we balanced PPV and sensitivity using the F1 score, which is the harmonic mean of these two metrics. After that, the models were evaluated on the test sets.</p>
<p>The three models underwent testing with both the complete set of attributes and the reduced set of features (&#x0201C;Feature Selection&#x0201D;). Both experiments were conducted with and without oversampling.</p></sec></sec>
<sec sec-type="results" id="s3">
<label>3</label>
<title>Results</title>
<sec>
<label>3.1</label>
<title>Descriptive results</title>
<p><xref ref-type="fig" rid="F1">Figure 1</xref> shows the basic statistics of the dataset. As observed in <xref ref-type="fig" rid="F1">Figure 1a</xref>, most patients (&#x0007E;62%) were between 13 and 18 years old. <xref ref-type="fig" rid="F1">Figure 1b</xref> shows the number of admissions to CEPAI-FHEMIG. Although most of the patients were admitted only once, 21% of the individuals were admitted at least twice in the studied period, revealing an incidence of repeated suicide behaviors, in line with the literature. <xref ref-type="fig" rid="F2">Figure 2</xref> illustrates the distribution of diagnoses given by the psychiatric professional (after assessment). Depression and general mood disorders were diagnosed in 21.69% of all admissions, making them the most common diagnosis.</p>
<fig position="float" id="F1">
<label>Figure 1</label>
<caption><p>Statistics of the dataset. <bold>(a)</bold> Frequency of children searching for care in child psychiatry facilities; <bold>(b)</bold> Frequency of admissions for the same patient.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frai-09-1662264-g0001.tif">
<alt-text content-type="machine-generated">Histogram labeled (a) illustrates the frequency of ages from 1 to 18 among children seeking child psychiatric emergency care, showing increasing frequency with age, peaking at age 17. Histogram labeled (b) displays the frequency of the number of admissions per patient, with most patients having only one admission and sharply declining frequencies for higher admission numbers. Both plots support analysis of patient age distribution and admission count.</alt-text>
</graphic>
</fig>
<fig position="float" id="F2">
<label>Figure 2</label>
<caption><p>Frequency of diagnoses at admission to the psychiatric facility.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frai-09-1662264-g0002.tif">
<alt-text content-type="machine-generated">Horizontal bar chart showing the frequency of various mental health diagnoses identified at admission to the facility (past and current), with depression or mood disorder being most common, followed by conduct disorders and psychosis; eating disorder is least frequent.</alt-text>
</graphic>
</fig>
<p><xref ref-type="table" rid="T2">Table 2</xref> presents descriptive statistics for a subset of features, including motives that led the family to seek help and other independent features considered relevant to the model, using suicide attempt as the dependent variable. The most common reasons were related to agitation, aggressiveness, irritability and learning difficulties, which are not traditionally associated with suicidal behaviors. Factors commonly related to suicidal behavior include depression, self-harm, anxiety, and self-aggressiveness, which were present in 19.07%, 14.7%, 14.36% and 5.28% of the admissions registered, respectively, and follow the distribution in the table.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Descriptive statistics of a subset of predictive variables, including motives to seek help, considering suicide attempt as the dependent variable.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left"><bold>Independent variable</bold></th>
<th valign="top" align="center"><bold>No suicide attempt (<italic>N</italic> = 1,966)</bold></th>
<th valign="top" align="center"><bold>Suicide attempt (<italic>N</italic> = 323)</bold></th>
<th valign="top" align="center"><bold><italic>p</italic>-value</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Gender (male)</td>
<td valign="top" align="center">1,309 (66.6%)</td>
<td valign="top" align="center">129 (39.9%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Gender (female)</td>
<td valign="top" align="center">657 (33.4%)</td>
<td valign="top" align="center">194 (60.1%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Was hospitalized?</td>
<td valign="top" align="center">193 (9.8%)</td>
<td valign="top" align="center">81 (25.1%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Age</td>
<td valign="top" align="center">12.6 &#x000B1; 3.9</td>
<td valign="top" align="center">15.1 &#x000B1; 1.9</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Depression</td>
<td valign="top" align="center">288 (14.6%)</td>
<td valign="top" align="center">149 (46.1%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Suicidal ideation</td>
<td valign="top" align="center">197 (10.0%)</td>
<td valign="top" align="center">112 (34.7%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Self-harm</td>
<td valign="top" align="center">230 (11.7%)</td>
<td valign="top" align="center">107 (33.1%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Substance abuse</td>
<td valign="top" align="center">324 (16.5%)</td>
<td valign="top" align="center">84 (26.0%)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Irritability</td>
<td valign="top" align="center">598 (30.4%)</td>
<td valign="top" align="center">74 (22.9%)</td>
<td valign="top" align="center">0.007</td>
</tr>
<tr>
<td valign="top" align="left">Aggressiveness</td>
<td valign="top" align="center">830 (42.2%)</td>
<td valign="top" align="center">69 (21.4%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Insomnia</td>
<td valign="top" align="center">288 (14.6%)</td>
<td valign="top" align="center">63 (19.5%)</td>
<td valign="top" align="center">0.031</td>
</tr>
<tr>
<td valign="top" align="left">Isolation</td>
<td valign="top" align="center">236 (12.0%)</td>
<td valign="top" align="center">59 (18.3%)</td>
<td valign="top" align="center">0.003</td>
</tr>
<tr>
<td valign="top" align="left">Agitation</td>
<td valign="top" align="center">905 (46.0%)</td>
<td valign="top" align="center">49 (15.2%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Anxiety</td>
<td valign="top" align="center">279 (14.2%)</td>
<td valign="top" align="center">47 (14.6%)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Hallucination</td>
<td valign="top" align="center">271 (13.8%)</td>
<td valign="top" align="center">46 (14.2%)</td>
<td valign="top" align="center">0.894</td>
</tr>
<tr>
<td valign="top" align="left">School difficulty</td>
<td valign="top" align="center">482 (24.5%)</td>
<td valign="top" align="center">40 (12.4%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Disobedience</td>
<td valign="top" align="center">414 (21.1%)</td>
<td valign="top" align="center">38 (11.8%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Mood swings</td>
<td valign="top" align="center">156 (7.9%)</td>
<td valign="top" align="center">21 (6.5%)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Attention difficulty</td>
<td valign="top" align="center">320 (16.3%)</td>
<td valign="top" align="center">15 (4.6%)</td>
<td valign="top" align="center">&#x0003C; 0.001</td>
</tr>
<tr>
<td valign="top" align="left">Delusion</td>
<td valign="top" align="center">182 (9.3%)</td>
<td valign="top" align="center">15 (4.6%)</td>
<td valign="top" align="center">0.008</td>
</tr>
<tr>
<td valign="top" align="left">Self-aggressiveness</td>
<td valign="top" align="center">108 (5.5%)</td>
<td valign="top" align="center">13 (4.0%)</td>
<td valign="top" align="center">0.338</td>
</tr>
<tr>
<td valign="top" align="left">Hypersexuality</td>
<td valign="top" align="center">47 (2.4%)</td>
<td valign="top" align="center">9 (2.8%)</td>
<td valign="top" align="center">0.816</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p><italic>p</italic>-values were obtained with a &#x003C7;<sup>2</sup> test for categorical attributes and a <italic>t</italic>-test for age, the only numerical attribute.</p>
</table-wrap-foot>
</table-wrap>
<p>Suicide-related behaviors were among the motivations given by patients or their guardians to seek psychiatric care. As previously reported, the motivations were used to define the model&#x00027;s outcome variables. The dataset had 337 out of 2,291 cases of self-harm (14.71%), 309 cases of suicide ideation (13.48%) and 323 positive suicide attempts (14.09%).</p></sec>
<sec>
<label>3.2</label>
<title>Suicide behavior prediction results</title>
<p><xref ref-type="table" rid="T3">Tables 3</xref>&#x02013;<xref ref-type="table" rid="T5">5</xref> present the results of the models for predicting suicide attempts, suicidal ideation, and self-harm, respectively. In the tables, the acronym OV denotes Oversampling, referring to models in which the data distribution was modified. The ratio of the outcome we want to predict corresponded to 30% of the training dataset. The RF model achieved the best overall performance across the four metrics for all three tasks. Oversampling does not affect the current sample&#x00027;s results, as the method&#x00027;s results with and without oversampling differ only in confidence intervals, which overlap. For suicide attempt and ideation prediction, the best-performing model used only the &#x0201C;Feature Selection&#x0201D; subset of features, achieving a sensitivity of 0.7118, specificity of 0.7592 and PPV of 0.3350 for suicide attempt prediction. For suicide ideation prediction, the method presented a sensitivity of 0.7804, specificity of 0.7763 and PPV of 0.3601. In the case of self-harm, the best model was trained using all available features, resulting in a sensitivity of 0.6937, specificity of 0.8177 and PPV of 0.4086.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Suicide attempt prediction results for the three classifiers tested with and without oversampling (OV).</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left"><bold>Features</bold></th>
<th valign="top" align="center"><bold>Models</bold></th>
<th valign="top" align="center"><bold>AUC</bold></th>
<th valign="top" align="center"><bold>PPV</bold></th>
<th valign="top" align="center"><bold>Sensitivity</bold></th>
<th valign="top" align="center"><bold>Specificity</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">All features</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">0.6582 &#x000B1; 0.0628</td>
<td valign="top" align="center">0.3841 &#x000B1; 0.0835</td>
<td valign="top" align="center">0.4350 &#x000B1; 0.1494</td>
<td valign="top" align="center">0.8814 &#x000B1; 0.0462</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">LR OV</td>
<td valign="top" align="center">0.6956 &#x000B1; 0.0678</td>
<td valign="top" align="center">0.3372 &#x000B1; 0.0542</td>
<td valign="top" align="center">0.5837 &#x000B1; 0.1614</td>
<td valign="top" align="center">0.8076 &#x000B1; 0.0577</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF</td>
<td valign="top" align="center">0.7338 &#x000B1; 0.0659</td>
<td valign="top" align="center">0.3719 &#x000B1; 0.0829</td>
<td valign="top" align="center">0.6583 &#x000B1; 0.1067</td>
<td valign="top" align="center">0.8092 &#x000B1; 0.0547</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF OV</td>
<td valign="top" align="center">0.7379 &#x000B1; 0.0543</td>
<td valign="top" align="center">0.3461 &#x000B1; 0.0701</td>
<td valign="top" align="center">0.7047 &#x000B1; 0.0990</td>
<td valign="top" align="center">0.7710 &#x000B1; 0.0637</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB</td>
<td valign="top" align="center">0.6769 &#x000B1; 0.0489</td>
<td valign="top" align="center">0.3256 &#x000B1; 0.0565</td>
<td valign="top" align="center">0.5406 &#x000B1; 0.1007</td>
<td valign="top" align="center">0.8132 &#x000B1; 0.0394</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB OV</td>
<td valign="top" align="center">0.6989 &#x000B1; 0.0786</td>
<td valign="top" align="center">0.3574 &#x000B1; 0.0734</td>
<td valign="top" align="center">0.5682 &#x000B1; 0.1610</td>
<td valign="top" align="center">0.8295 &#x000B1; 0.0434</td>
</tr>
<tr>
<td valign="top" align="left">Feat. selection</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">0.6808 &#x000B1; 0.0523</td>
<td valign="top" align="center">0.4380 &#x000B1; 0.0951</td>
<td valign="top" align="center">0.4665 &#x000B1; 0.1135</td>
<td valign="top" align="center">0.8951 &#x000B1; 0.0376</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">LR OV</td>
<td valign="top" align="center">0.7264 &#x000B1; 0.0644</td>
<td valign="top" align="center">0.3686 &#x000B1; 0.0661</td>
<td valign="top" align="center">0.6428 &#x000B1; 0.1504</td>
<td valign="top" align="center">0.8100 &#x000B1; 0.0627</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF</td>
<td valign="top" align="center">0.7225 &#x000B1; 0.0430</td>
<td valign="top" align="center">0.3151 &#x000B1; 0.0563</td>
<td valign="top" align="center">0.7055 &#x000B1; 0.0932</td>
<td valign="top" align="center">0.7395 &#x000B1; 0.0636</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF OV</td>
<td valign="top" align="center">0.7355 &#x000B1; 0.0430</td>
<td valign="top" align="center">0.3350 &#x000B1; 0.0514</td>
<td valign="top" align="center"><bold>0.7118 &#x000B1; 0.1079</bold></td>
<td valign="top" align="center">0.7592 &#x000B1; 0.0627</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB</td>
<td valign="top" align="center">0.6812 &#x000B1; 0.0553</td>
<td valign="top" align="center">0.3155 &#x000B1; 0.0502</td>
<td valign="top" align="center">0.5628 &#x000B1; 0.1272</td>
<td valign="top" align="center">0.7995 &#x000B1; 0.0391</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB OV</td>
<td valign="top" align="center">0.7132 &#x000B1; 0.0406</td>
<td valign="top" align="center">0.3012 &#x000B1; 0.0241</td>
<td valign="top" align="center">0.6899 &#x000B1; 0.0989</td>
<td valign="top" align="center">0.7364 &#x000B1; 0.0366</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>The best sensitivity across models and strategies is shown in bold.</p>
</table-wrap-foot>
</table-wrap>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Suicide ideation prediction results for the three classifiers tested with and without oversampling (OV).</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left"><bold>Features</bold></th>
<th valign="top" align="center"><bold>Models</bold></th>
<th valign="top" align="center"><bold>AUC</bold></th>
<th valign="top" align="center"><bold>PPV</bold></th>
<th valign="top" align="center"><bold>Sensitivity</bold></th>
<th valign="top" align="center"><bold>Specificity</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">All features</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">0.7053 &#x000B1; 0.0406</td>
<td valign="top" align="center">0.4640 &#x000B1; 0.0765</td>
<td valign="top" align="center">0.5075 &#x000B1; 0.1040</td>
<td valign="top" align="center">0.9031 &#x000B1; 0.0334</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">LR OV</td>
<td valign="top" align="center">0.7418 &#x000B1; 0.0445</td>
<td valign="top" align="center">0.4219 &#x000B1; 0.0861</td>
<td valign="top" align="center">0.6274 &#x000B1; 0.1252</td>
<td valign="top" align="center">0.8561 &#x000B1; 0.0492</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF</td>
<td valign="top" align="center">0.7599 &#x000B1; 0.0434</td>
<td valign="top" align="center">0.4324 &#x000B1; 0.0688</td>
<td valign="top" align="center">0.6625 &#x000B1; 0.1212</td>
<td valign="top" align="center">0.8572 &#x000B1; 0.0434</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF OV</td>
<td valign="top" align="center">0.7819 &#x000B1; 0.0540</td>
<td valign="top" align="center">0.4178 &#x000B1; 0.0751</td>
<td valign="top" align="center">0.7287 &#x000B1; 0.1373</td>
<td valign="top" align="center">0.8351 &#x000B1; 0.0467</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB</td>
<td valign="top" align="center">0.7265 &#x000B1; 0.0513</td>
<td valign="top" align="center">0.3596 &#x000B1; 0.0683</td>
<td valign="top" align="center">0.6321 &#x000B1; 0.1086</td>
<td valign="top" align="center">0.8210 &#x000B1; 0.0384</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB OV</td>
<td valign="top" align="center">0.7782 &#x000B1; 0.0304</td>
<td valign="top" align="center">0.3656 &#x000B1; 0.0667</td>
<td valign="top" align="center">0.7755 &#x000B1; 0.0896</td>
<td valign="top" align="center">0.7809 &#x000B1; 0.0573</td>
</tr>
<tr>
<td valign="top" align="left">Feat. selection</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">0.7250 &#x000B1; 0.0415</td>
<td valign="top" align="center">0.4952 &#x000B1; 0.1064</td>
<td valign="top" align="center">0.5449 &#x000B1; 0.1096</td>
<td valign="top" align="center">0.9051 &#x000B1; 0.0352</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">LR OV</td>
<td valign="top" align="center">0.7397 &#x000B1; 0.0364</td>
<td valign="top" align="center">0.4346 &#x000B1; 0.0696</td>
<td valign="top" align="center">0.6099 &#x000B1; 0.1046</td>
<td valign="top" align="center">0.8696 &#x000B1; 0.0397</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF</td>
<td valign="top" align="center">0.7557 &#x000B1; 0.0340</td>
<td valign="top" align="center">0.3999 &#x000B1; 0.0730</td>
<td valign="top" align="center">0.6781 &#x000B1; 0.1020</td>
<td valign="top" align="center">0.8334 &#x000B1; 0.0471</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF OV</td>
<td valign="top" align="center">0.7783 &#x000B1; 0.0363</td>
<td valign="top" align="center">0.3601 &#x000B1; 0.0615</td>
<td valign="top" align="center"><bold>0.7804 &#x000B1; 0.0954</bold></td>
<td valign="top" align="center">0.7763 &#x000B1; 0.0525</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB</td>
<td valign="top" align="center">0.6991 &#x000B1; 0.0466</td>
<td valign="top" align="center">0.3685 &#x000B1; 0.0615</td>
<td valign="top" align="center">0.5477 &#x000B1; 0.1001</td>
<td valign="top" align="center">0.8504 &#x000B1; 0.0362</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB OV</td>
<td valign="top" align="center">0.7514 &#x000B1; 0.0505</td>
<td valign="top" align="center">0.3929 &#x000B1; 0.0643</td>
<td valign="top" align="center">0.6703 &#x000B1; 0.1304</td>
<td valign="top" align="center">0.8324 &#x000B1; 0.0475</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>The best sensitivity across models and strategies is shown in bold.</p>
</table-wrap-foot>
</table-wrap>
<table-wrap position="float" id="T5">
<label>Table 5</label>
<caption><p>Self-harm prediction results for the three classifiers tested with and without oversampling (OV).</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left"><bold>Features</bold></th>
<th valign="top" align="center"><bold>Models</bold></th>
<th valign="top" align="center"><bold>AUC</bold></th>
<th valign="top" align="center"><bold>PPV</bold></th>
<th valign="top" align="center"><bold>Sensitivity</bold></th>
<th valign="top" align="center"><bold>Specificity</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">All features</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">0.6989 &#x000B1; 0.0511</td>
<td valign="top" align="center">0.4593 &#x000B1; 0.0702</td>
<td valign="top" align="center">0.5072 &#x000B1; 0.1348</td>
<td valign="top" align="center">0.8905 &#x000B1; 0.0481</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">LR OV</td>
<td valign="top" align="center">0.7315 &#x000B1; 0.0582</td>
<td valign="top" align="center">0.4045 &#x000B1; 0.0831</td>
<td valign="top" align="center">0.6348 &#x000B1; 0.1394</td>
<td valign="top" align="center">0.8281 &#x000B1; 0.0628</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF</td>
<td valign="top" align="center">0.7333 &#x000B1; 0.0367</td>
<td valign="top" align="center">0.4567 &#x000B1; 0.0678</td>
<td valign="top" align="center">0.5955 &#x000B1; 0.1039</td>
<td valign="top" align="center">0.8710 &#x000B1; 0.0490</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF OV</td>
<td valign="top" align="center">0.7557 &#x000B1; 0.0340</td>
<td valign="top" align="center">0.4086 &#x000B1; 0.0700</td>
<td valign="top" align="center"><bold>0.6937 &#x000B1; 0.1075</bold></td>
<td valign="top" align="center">0.8177 &#x000B1; 0.0600</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB</td>
<td valign="top" align="center">0.7198 &#x000B1; 0.0288</td>
<td valign="top" align="center">0.3690 &#x000B1; 0.0438</td>
<td valign="top" align="center">0.6305 &#x000B1; 0.0873</td>
<td valign="top" align="center">0.8091 &#x000B1; 0.0492</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB OV</td>
<td valign="top" align="center">0.7199 &#x000B1; 0.0571</td>
<td valign="top" align="center">0.4693 &#x000B1; 0.0692</td>
<td valign="top" align="center">0.5524 &#x000B1; 0.1425</td>
<td valign="top" align="center">0.8874 &#x000B1; 0.0447</td>
</tr>
<tr>
<td valign="top" align="left">Feat. selection</td>
<td valign="top" align="center">LR</td>
<td valign="top" align="center">0.7070 &#x000B1; 0.0492</td>
<td valign="top" align="center">0.4906 &#x000B1; 0.0809</td>
<td valign="top" align="center">0.5107 &#x000B1; 0.1155</td>
<td valign="top" align="center">0.9033 &#x000B1; 0.0391</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">LR OV</td>
<td valign="top" align="center">0.7398 &#x000B1; 0.0340</td>
<td valign="top" align="center">0.4112 &#x000B1; 0.0640</td>
<td valign="top" align="center">0.6469 &#x000B1; 0.0995</td>
<td valign="top" align="center">0.8327 &#x000B1; 0.0505</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF</td>
<td valign="top" align="center">0.7233 &#x000B1; 0.0409</td>
<td valign="top" align="center">0.4594 &#x000B1; 0.0817</td>
<td valign="top" align="center">0.5695 &#x000B1; 0.1094</td>
<td valign="top" align="center">0.8771 &#x000B1; 0.0483</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">RF OV</td>
<td valign="top" align="center">0.7362 &#x000B1; 0.0338</td>
<td valign="top" align="center">0.4065 &#x000B1; 0.0608</td>
<td valign="top" align="center">0.6404 &#x000B1; 0.0956</td>
<td valign="top" align="center">0.8321 &#x000B1; 0.0498</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB</td>
<td valign="top" align="center">0.7155 &#x000B1; 0.0405</td>
<td valign="top" align="center">0.3947 &#x000B1; 0.0395</td>
<td valign="top" align="center">0.5902 &#x000B1; 0.1084</td>
<td valign="top" align="center">0.8408 &#x000B1; 0.0427</td>
</tr>
<tr>
<td/>
<td valign="top" align="center">XGB OV</td>
<td valign="top" align="center">0.7049 &#x000B1; 0.0579</td>
<td valign="top" align="center">0.4877 &#x000B1; 0.0454</td>
<td valign="top" align="center">0.5025 &#x000B1; 0.1407</td>
<td valign="top" align="center">0.9073 &#x000B1; 0.0299</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>The model and strategy with the best sensitivity are shown in bold.</p>
</table-wrap-foot>
</table-wrap>
<p>In summary, a combination of sensitivity above 0.69 and specificity above 0.75 indicates accurate predictions, correctly identifying more than 69 out of 100 positive cases and more than 75 out of 100 negative cases. However, further studies are still needed to improve PPV. PPV indicates the likelihood that an individual with a positive suicide prediction is truly going to commit suicide. Although in this context false positives are more desirable than false negatives, more accurate models have better economic and social advantages and are more feasible. Improving the current model would require additional data, and we believe longitudinal data are key. We are pursuing efforts to obtain a more comprehensive dataset from CEPAI-FHEMIG. Given that we initially intend to use the system for triage, the burden of low PPV is smaller than that of a fully predictive system in operation. The worst-case scenario would prioritize an individual with low risk over one with higher risk.</p>
<p>Finally, it is important to say that we have analyzed the differences in the metrics regarding the training and test sets, and the model does not present any indication of overfitting. A cross-validation procedure was performed to obtain statistically meaningful results. However, we cannot guarantee the method will generalize to other contexts without further adaptation, and testing it in new scenarios is part of our future work.</p></sec>
<sec>
<label>3.3</label>
<title>SHAP values</title>
<p>As we are interested in identifying the factors that most influence the prediction of suicidal behaviors, the impact of each feature on the model&#x00027;s output was assessed using SHAP values. <xref ref-type="fig" rid="F3">Figures 3</xref>&#x02013;<xref ref-type="fig" rid="F5">5</xref> depict these values for the three tasks. In these plots, the horizontal axis indicates whether a particular value is associated with a higher or lower prediction value. The colors denote whether that attribute presents a high (red) or low (blue) value. For this analysis, the gender feature is coded as 0 for female and 1 for male.</p>
<fig position="float" id="F3">
<label>Figure 3</label>
<caption><p>SHAP values for suicide attempt prediction. Each line represents a feature in decreasing order of importance, and the violin plot shows the impact of each feature in the model output. Features concentrated on the right side of the graph (positive SHAP) increase the prediction of suicide attempt, while features on the negative side decrease the prediction. Colors indicate whether a high (red) or low (blue) value of the feature is responsible for the increase/decrease in the prediction.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frai-09-1662264-g0003.tif">
<alt-text content-type="machine-generated">Beeswarm plot displaying SHAP values for ten mental health-related features influencing a model&#x02019;s suicide attempt output, with Age, Agitation, depression, self-harm, previous hospitalization features and Suicidal ideation showing significant effects, but different contributions. Color scale from blue (low) to pink (high) feature values.</alt-text>
</graphic>
</fig>
<p>For example, higher values of &#x0201C;Agitation,&#x0201D; &#x0201C;Gender&#x0201D; (which means the patients are male), and &#x0201C;Learning difficulties&#x0201D; tend to produce lower predicted values for a suicide attempt (axis <italic>x</italic>), suggesting that male patients reporting agitation and learning difficulties are less likely to make a suicide attempt than the patients characterized by the opposite values of these binary variables (i.e., female patients, with no signs of agitation or learning difficulties). On the other hand, patients with depression, self-harm and suicidal ideation as motives for looking for help, who were hospitalized in CEPAI-FHEMIG and diagnosed with depression, are more likely to have a suicide attempt.</p>
<p>For suicide ideation (<xref ref-type="fig" rid="F4">Figure 4</xref>), intellectual disability is linked to decreased risk, while isolation and hallucinations are associated with increased risk. As for the self-harm model (<xref ref-type="fig" rid="F5">Figure 5</xref>), the relationships of gender and age with its prediction seem to be more regular, with older female patients being associated with a higher risk, while a patient with no trauma history using only CEPAI-FHEMIG&#x00027;s social services is linked to decreased risk, highlighting the distinct factors contributing to each outcome.</p>
<fig position="float" id="F4">
<label>Figure 4</label>
<caption><p>SHAP values for suicide ideation prediction. Each line represents a feature in decreasing order of importance, and the violin plot shows the impact of each feature in the model output. Features concentrated on the right side of the graph (positive SHAP) increase the prediction of suicide ideation, while features on the negative side decrease the prediction. Colors indicate whether a high (red) or low (blue) value of the feature is responsible for the increase/decrease in the prediction.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frai-09-1662264-g0004.tif">
<alt-text content-type="machine-generated">Violin plot visualizes SHAP values for features impacting a model&#x02019;s self-harm output related to suicide risk, including depression, suicidal ideation, gender, and age. Color gradient indicates feature value from low (blue) to high (pink). </alt-text>
</graphic>
</fig>
<fig position="float" id="F5">
<label>Figure 5</label>
<caption><p>SHAP values for self-harm prediction. Each line represents a feature in decreasing order of importance, and the violin plot shows the impact of each feature in the model output. Features concentrated on the right side of the graph (positive SHAP) increase the prediction of self-harm, while features on the negative side decrease the prediction. Colors indicate whether a high (red) or low (blue) value of the feature is responsible for the increase/decrease in the prediction.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="frai-09-1662264-g0005.tif">
<alt-text content-type="machine-generated">Violin plot summarizes the SHAP values of ten mental health-related features impacting a model&#x02019;s suicide ideation output, with higher feature values in pink and lower values in blue; depression-related features were the most influential in the model.</alt-text>
</graphic>
</fig>
</sec></sec>
<sec sec-type="discussion" id="s4">
<label>4</label>
<title>Discussion</title>
<p>The matter of children and adolescents requiring psychiatric care warrants attention. Roughly 1 in 5 children struggle with a mental, emotional, or behavioral disorder, yet fewer than 20% receive care from a mental health specialist (<xref ref-type="bibr" rid="B34">Vial and Almon, 2023</xref>). This lack of access to appropriate treatment is a pressing concern, particularly given that suicidal behavior, the most severe consequence of commonly untreated mental health issues, is a significant risk for this vulnerable population. In LMICs, accessing mental health services is even more difficult. Many individuals do not receive the care they need, and available services are often inefficient.</p>
<p>Suicidal behavior is a serious concern among adolescents, particularly during middle and late adolescence, with consequences that often persist into adulthood, especially for those who have previously attempted suicide. Research indicates that both short-term (6 months) and long-term (5 years) recurrence are common, increasing the risk among individuals who have been hospitalized for suicide attempts (<xref ref-type="bibr" rid="B28">Scoliers et al., 2009</xref>; <xref ref-type="bibr" rid="B1">Azc&#x000E1;rate-Jim&#x000E9;nez et al., 2019</xref>). Prevalence rates for suicidal ideation and attempts range from 14.3% to 22.6% and 4.6% to 15.8%, respectively (<xref ref-type="bibr" rid="B32">Van Meter et al., 2023</xref>). The transition from adolescence to young adulthood is associated with high healthcare costs and frequently results in interruptions in psychiatric care (<xref ref-type="bibr" rid="B4">Canaway et al., 2023</xref>). Late adolescence is the period of greatest risk for suicidal behavior, particularly during stressful times (<xref ref-type="bibr" rid="B35">Whalen et al., 2022</xref>; <xref ref-type="bibr" rid="B23">Orri et al., 2020</xref>). There is a pressing need to understand the predictors of suicidal behaviors to develop effective preventive interventions and ensure accessible, appropriate care for adolescents and young adults.</p>
<p>While ML excels at general classification and prediction tasks, predicting suicide behaviors remains a complex challenge. Suicide-related behaviors are influenced by numerous, interrelated factors that cannot be addressed with simple solutions. As noted earlier, a suicide attempt prediction model achieved a sensitivity of 0.47 and a specificity of 0.91 (<xref ref-type="bibr" rid="B31">van Mens et al., 2020</xref>). Although direct comparison is difficult due to differences in datasets, their study demonstrated higher specificity (0.91 vs. 0.76) but lower sensitivity (0.47 vs. 0.71) compared to ours. This underscores the critical importance of calibrating classifier thresholds. Adjusting these thresholds can significantly affect model performance, enabling tailored outcomes aligned with clinical priorities. Given the potential severity of missed cases, we prioritize increased sensitivity, while acknowledging that this often comes at the expense of specificity.</p>
<p>In sum, dealing with prediction tasks of suicidal behaviors is hard because (i) the data has an intrinsic bias&#x02014;all patients presenting at the emergency service had psychiatric symptoms; (ii) the suicide attempt outcome itself is imbalanced; (iii) the dataset is limited to a low number of patients; (iv) mispredicting a high-risk patient has more serious consequences, given that it is a cost-sensitive classification task. As with most health-related models, the one generated here would need to be adapted to a setting that resembles the prevalence of these events in the general population (<xref ref-type="bibr" rid="B26">Richter et al., 2025</xref>). We are currently looking for a new dataset to validate our findings.</p>
<p>Given the numerous predisposing conditions, the relatively low frequency of the tragic event, and the undesirable possibility of error, the models proposed in this study demonstrate acceptable accuracy and can serve as valuable screening tools. These models can aid health professionals by identifying patients at risk of suicidal behavior. They may function effectively as screening tools, prioritizing individuals with a high probability of suicide risk for prompt medical attention. Such measures that facilitate access could help minimize adverse outcomes. This approach is particularly crucial in middle-income scenarios where access to psychiatric facilities and treatment is insufficient for the multitude of people in deep need of care (<xref ref-type="bibr" rid="B6">Dalgalarrondo et al., 2023</xref>).</p>
<p>The unique context of addressing psychiatric cases in an emergency setting significantly differentiates our work. Patients in crisis alter the population-level expectation of rare events, making them more frequent. The emphasis put on identifying predictors of suicide-related behaviors allowed our models to pinpoint the most relevant factors for self-harm, suicidal ideation, and suicide attempts, permitting timely intervention. The potential of these predictor models lies in prioritizing higher-risk patients for immediate emergency care and identifying the risk factors involved in each case. Given the rarity of the outcome in high-risk populations (lower heterogeneity), there is a clear need to validate our model on data from other psychiatric centers to generalize the results (<xref ref-type="bibr" rid="B33">Varoquaux, 2018</xref>). Beyond the difficulties in predicting low-frequency events, another limitation of the study was the associative character of the risk features, which does not add causal knowledge; this gap should be addressed in future work.</p>
<p>The consistent identification of the 10 most relevant features across models for predicting self-harm, suicidal ideation, and suicide attempts highlights the strong interconnection among these outcomes. When assessment resources are limited, key indicators of suicidal behavior become increasingly prominent, especially those linked to lack of treatment, inadequate care, and repeated psychiatric service utilization. Social factors, such as household size, may also shed light on vulnerability, particularly in LMICs, where these dynamics differ. While emergency settings provide a valuable source of cases for model training, they also introduce limitations, as findings may not generalize readily to other clinical contexts.</p>
<p>Depression and its symptoms consistently stand out as major predictors of suicide-related behaviors, as supported by previous research (<xref ref-type="bibr" rid="B13">Li, 2023</xref>; <xref ref-type="bibr" rid="B10">Jiang et al., 2021</xref>; <xref ref-type="bibr" rid="B19">Mubasyiroh et al., 2018</xref>). Given its substantial predictive value, depression should be prioritized as a key target for intervention. Early detection and effective treatment of depression could substantially reduce the risk of suicide-related outcomes. In addition, self-harm and suicidal ideation are vital warning signs that may indicate the potential for more severe developments. Addressing modifiable social determinants, integrated into risk screening, can further enhance the comprehensiveness of suicide prevention strategies. Limited access to mental health care is also strongly associated with increased risk, as individuals often seek help in emergency settings due to inadequate prior psychiatric support. These findings highlight the urgent need to improve access to mental health services and initiate timely interventions to prevent escalation and severe outcomes.</p></sec>
<sec id="s5">
<label>5</label>
<title>Conclusions</title>
<p>This study introduces a machine learning framework designed to predict suicidal behaviors, including suicidal ideation, self-harm, and suicide attempts, within a pediatric psychiatric emergency context. By focusing on a middle-income population in Brazil, this research addresses a significant geographic gap. Although most global suicides occur in LMICs, these settings remain significantly underrepresented in predictive modeling literature.</p>
<p>Our findings lead to several key conclusions regarding the intersection of artificial intelligence and youth mental health: The Random Forest model with oversampling achieved sensitivities ranging from 69% to 78%, demonstrating its clinical utility for identifying at-risk individuals who might otherwise be missed in overstretched emergency services. By using SHAP values, we moved beyond &#x0201C;black-box&#x0201D; predictions, showing that social determinants are primary drivers of risk in middle-income contexts.</p>
<p>Ultimately, this study serves as a proof-of-concept for the deployment of AI-supported screening tools in psychiatric emergency departments. By integrating these models into triage workflows, we can shift from reactive crisis management to proactive, data-driven identification, potentially reducing suicide rates in vulnerable youth populations worldwide.</p></sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec sec-type="ethics-statement" id="s7">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Comite de Etica em Pesquisa da Ciencias Medicas. The studies were conducted in accordance with the local legislation and institutional requirements. The ethics committee/institutional review board waived the requirement of written informed consent for participation from the participants or the participants&#x00027; legal guardians/next of kin because it consists of a retrospective medical data evaluation.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>IC: Formal analysis, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. AC: Formal analysis, Supervision, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. AL: Formal analysis, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. WM: Conceptualization, Formal analysis, Investigation, Methodology, Project administration, Supervision, Visualization, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. DB: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. LM: Data curation, Formal analysis, Writing &#x02013; original draft. AS: Conceptualization, Investigation, Methodology, Project administration, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. MM: Data curation, Investigation, Resources, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. MR-S: Conceptualization, Investigation, Resources, Supervision, Funding acquisition, Project administration, Writing &#x02013; original draft. DM: Conceptualization, Investigation, Resources, Supervision, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. GP: Conceptualization, Data curation, Formal analysis, Funding acquisition, Investigation, Methodology, Project administration, Supervision, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s10">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was used in the creation of this manuscript. We used ChatGPT to improve readability and correct grammar issues.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="web"><person-group person-group-type="author"><name><surname>Azc&#x000E1;rate-Jim&#x000E9;nez</surname> <given-names>L.</given-names></name> <name><surname>L&#x000F3;pez-Go&#x000F1;i</surname> <given-names>J.</given-names></name> <name><surname>Go&#x000F1;i-Sarri&#x000E9;s</surname> <given-names>A.</given-names></name> <name><surname>Montes-Reula</surname> <given-names>L.</given-names></name> <name><surname>Portilla-Fern&#x000E1;ndez</surname> <given-names>A.</given-names></name> <name><surname>Elorza-Pardo</surname> <given-names>R.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Repeated suicide attempts: a follow-up study</article-title>. <source>Actas Esp. Psiquiatr</source>. <volume>47</volume>, <fpage>127</fpage>&#x02013;<lpage>136</lpage>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://actaspsiquiatria.es/index.php/actas/article/view/245">https://actaspsiquiatria.es/index.php/actas/article/view/245</ext-link> (Accessed January, 2026). <pub-id pub-id-type="pmid">31461152</pub-id></mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bersia</surname> <given-names>M.</given-names></name> <name><surname>Koumantakis</surname> <given-names>E.</given-names></name> <name><surname>Berchialla</surname> <given-names>P.</given-names></name> <name><surname>Charrier</surname> <given-names>L.</given-names></name> <name><surname>Ricotti</surname> <given-names>A.</given-names></name> <name><surname>Grimaldi</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Suicide spectrum among young people during the COVID-19 pandemic: a systematic review and meta-analysis</article-title>. <source>EClinicalMedicine</source> <volume>54</volume>:<fpage>101705</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.eclinm.2022.101705</pub-id><pub-id pub-id-type="pmid">36338787</pub-id></mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Bishop</surname> <given-names>C.</given-names></name></person-group> (<year>2006</year>). <source>Pattern Recognition and Machine Learning</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>.</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Canaway</surname> <given-names>A.</given-names></name> <name><surname>Appleton</surname> <given-names>R.</given-names></name> <name><surname>van Bodegom</surname> <given-names>L.</given-names></name> <name><surname>Dieleman</surname> <given-names>G.</given-names></name> <name><surname>Frani&#x00107;</surname> <given-names>T.</given-names></name> <name><surname>Gerritsen</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Healthcare costs for young people transitioning the boundary between child/adolescent and adult mental health services in seven European countries: results from the milestone study</article-title>. <source>BJPsych Open</source> <volume>9</volume>:<fpage>e175</fpage>. doi: <pub-id pub-id-type="doi">10.1192/bjo.2023.559</pub-id><pub-id pub-id-type="pmid">37749976</pub-id></mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>T.</given-names></name> <name><surname>Guestrin</surname> <given-names>C.</given-names></name></person-group> (<year>2016</year>). <article-title>&#x0201C;Xgboost: a scalable tree boosting system,&#x0201D;</article-title> in <source>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>785</fpage>&#x02013;<lpage>794</lpage>. doi: <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id></mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dalgalarrondo</surname> <given-names>P.</given-names></name> <name><surname>Oda</surname> <given-names>A.</given-names></name> <name><surname>Onocko-Campos</surname> <given-names>R.</given-names></name> <name><surname>Banzato</surname> <given-names>C.</given-names></name></person-group> (<year>2023</year>). <article-title>Challenges facing the psychiatric reform and mental health care in Brazil: critical unmet needs and prospects for better integrating the public and university sectors</article-title>. <source>SSM - Ment. Health</source> <volume>4</volume>:<fpage>100262</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ssmmh.2023.100262</pub-id></mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Glenn</surname> <given-names>C.</given-names></name> <name><surname>Kleiman</surname> <given-names>E.</given-names></name> <name><surname>Kellerman</surname> <given-names>J.</given-names></name> <name><surname>Pollak</surname> <given-names>O.</given-names></name> <name><surname>Cha</surname> <given-names>C.</given-names></name> <name><surname>Esposito</surname> <given-names>E.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Annual research review: a meta-analytic review of worldwide suicide rates in adolescents</article-title>. <source>J. Child Psychol. Psychiatry</source> <volume>61</volume>, <fpage>294</fpage>&#x02013;<lpage>308</lpage>. doi: <pub-id pub-id-type="doi">10.1111/jcpp.13106</pub-id><pub-id pub-id-type="pmid">31373003</pub-id></mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Harris</surname> <given-names>I.</given-names></name> <name><surname>Beese</surname> <given-names>S.</given-names></name> <name><surname>Moore</surname> <given-names>D.</given-names></name></person-group> (<year>2019a</year>). <article-title>Predicting future self-harm or suicide in adolescents: a systematic review of risk assessment scales/tools</article-title>. <source>BMJ Open</source> <volume>9</volume>:<fpage>e029311</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmjopen-2019-029311</pub-id><pub-id pub-id-type="pmid">31494608</pub-id></mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Harris</surname> <given-names>I.</given-names></name> <name><surname>Beese</surname> <given-names>S.</given-names></name> <name><surname>Moore</surname> <given-names>D.</given-names></name></person-group> (<year>2019b</year>). <article-title>Predicting repeated self-harm or suicide in adolescents and young adults using risk assessment scales/tools: a systematic review protocol</article-title>. <source>Syst. Rev</source>. <volume>8</volume>:<fpage>87</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13643-019-1007-7</pub-id><pub-id pub-id-type="pmid">30947743</pub-id></mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jiang</surname> <given-names>T.</given-names></name> <name><surname>Nagy</surname> <given-names>D.</given-names></name> <name><surname>Rosellini</surname> <given-names>A.</given-names></name> <name><surname>Horv&#x000E1;th-Puh&#x000F3;</surname> <given-names>E.</given-names></name> <name><surname>Keyes</surname> <given-names>K.</given-names></name> <name><surname>Lash</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Suicide prediction among men and women with depression: a population-based study</article-title>. <source>J. Psychiatr. Res</source>. <volume>142</volume>, <fpage>275</fpage>&#x02013;<lpage>282</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jpsychires.2021.08.003</pub-id><pub-id pub-id-type="pmid">34403969</pub-id></mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Klonsky</surname> <given-names>E.</given-names></name> <name><surname>May</surname> <given-names>A.</given-names></name> <name><surname>Saffer</surname> <given-names>B.</given-names></name></person-group> (<year>2016</year>). <article-title>Suicide, suicide attempts, and suicidal ideation</article-title>. <source>Annu. Rev. Clin. Psychol</source>. <volume>12</volume>, <fpage>307</fpage>&#x02013;<lpage>330</lpage>. doi: <pub-id pub-id-type="doi">10.1146/annurev-clinpsy-021815-093204</pub-id><pub-id pub-id-type="pmid">26772209</pub-id></mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Knipe</surname> <given-names>D.</given-names></name> <name><surname>Padmanathan</surname> <given-names>P.</given-names></name> <name><surname>Newton-Howes</surname> <given-names>G.</given-names></name> <name><surname>Chan</surname> <given-names>L.</given-names></name> <name><surname>Kapur</surname> <given-names>N.</given-names></name></person-group> (<year>2022</year>). <article-title>Suicide and self-harm</article-title>. <source>Lancet</source> <volume>399</volume>, <fpage>1903</fpage>&#x02013;<lpage>1916</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(22)00173-8</pub-id></mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>Y.</given-names></name></person-group> (<year>2023</year>). <article-title>Depression and suicide risk prediction based on machine learning models</article-title>. <source>J. Educ. Humanit. Soc. Sci</source>. <volume>15</volume>, <fpage>302</fpage>&#x02013;<lpage>307</lpage>. doi: <pub-id pub-id-type="doi">10.54097/ehss.v15i.9312</pub-id></mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lobato Machado</surname> <given-names>M.</given-names></name> <name><surname>Hibner</surname> <given-names>M.</given-names></name> <name><surname>Nogueira</surname> <given-names>D.</given-names></name> <name><surname>Rezende</surname> <given-names>M.</given-names></name> <name><surname>B&#x000F3;rem</surname> <given-names>I.</given-names></name> <name><surname>da Cunha</surname> <given-names>L.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Irritability in an open-door pediatric psychiatric emergency service in a middle-income country</article-title>. <source>Neuropsychiatr. Enfance Adolesc</source>. <volume>70</volume>, <fpage>336</fpage>&#x02013;<lpage>342</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neurenf.2022.05.007</pub-id></mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="confproc"><person-group person-group-type="author"><name><surname>Lundberg</surname> <given-names>S.</given-names></name> <name><surname>Lee</surname> <given-names>S.</given-names></name></person-group> (<year>2017</year>). &#x0201C;<article-title>A unified approach to interpreting model predictions</article-title>&#x0201D; in Paper Presented at the <conf-name>31st Conference on Neural Information Processing Systems (NIPS 2017)</conf-name> (<conf-loc>Long Beach, CA</conf-loc>).</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mars</surname> <given-names>B.</given-names></name> <name><surname>Heron</surname> <given-names>J.</given-names></name> <name><surname>Klonsky</surname> <given-names>E.</given-names></name> <name><surname>Moran</surname> <given-names>P.</given-names></name> <name><surname>O&#x00027;Connor</surname> <given-names>R.</given-names></name> <name><surname>Tilling</surname> <given-names>K.</given-names></name> <etal/></person-group>. (<year>2019a</year>). <article-title>Predictors of future suicide attempt among adolescents with suicidal thoughts or non-suicidal self-harm: a population-based birth cohort study</article-title>. <source>Lancet Psychiatry</source> <volume>6</volume>, <fpage>327</fpage>&#x02013;<lpage>337</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S2215-0366(19)30030-6</pub-id><pub-id pub-id-type="pmid">30879972</pub-id></mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mars</surname> <given-names>B.</given-names></name> <name><surname>Heron</surname> <given-names>J.</given-names></name> <name><surname>Klonsky</surname> <given-names>E.</given-names></name> <name><surname>Moran</surname> <given-names>P.</given-names></name> <name><surname>O&#x00027;Connor</surname> <given-names>R.</given-names></name> <name><surname>Tilling</surname> <given-names>K.</given-names></name> <etal/></person-group>. (<year>2019b</year>). <article-title>What distinguishes adolescents with suicidal thoughts from those who have attempted suicide? A population-based birth cohort study</article-title>. <source>J. Child Psychol. Psychiatry</source> <volume>60</volume>, <fpage>91</fpage>&#x02013;<lpage>99</lpage>. doi: <pub-id pub-id-type="doi">10.1111/jcpp.12878</pub-id><pub-id pub-id-type="pmid">29492978</pub-id></mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Miladinov</surname> <given-names>G.</given-names></name></person-group> (<year>2023</year>). <article-title>The economics of suicide: evidence from LMICs and HICs</article-title>. <source>J. Res. Soc. Sci. Humanit</source>. <volume>2</volume>, <fpage>9</fpage>&#x02013;<lpage>25</lpage>. doi: <pub-id pub-id-type="doi">10.56397/JRSSH.2023.06.02</pub-id></mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mubasyiroh</surname> <given-names>R.</given-names></name> <name><surname>Pradono</surname> <given-names>J.</given-names></name> <name><surname>Nurkhotimah</surname> <given-names>E.</given-names></name> <name><surname>Kusumawardani</surname> <given-names>N.</given-names></name> <name><surname>Idaiani</surname> <given-names>S.</given-names></name></person-group> (<year>2018</year>). <article-title>Depression as a strong prediction of suicide risk</article-title>. <source>Glob. J. Health Sci</source>. <volume>10</volume>:<fpage>52</fpage>. doi: <pub-id pub-id-type="doi">10.5539/gjhs.v10n12p52</pub-id></mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Naghavi</surname> <given-names>M.</given-names></name></person-group> (<year>2019</year>). <article-title>Global, regional, and national burden of suicide mortality 1990 to 2016: systematic analysis for the Global Burden of Disease Study 2016</article-title>. <source>BMJ</source> <volume>364</volume>:<fpage>l94</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj.l94</pub-id><pub-id pub-id-type="pmid">31339847</pub-id></mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Navarro</surname> <given-names>M.</given-names></name> <name><surname>Ouellet-Morin</surname> <given-names>I.</given-names></name> <name><surname>Geoffroy</surname> <given-names>M.</given-names></name> <name><surname>Boivin</surname> <given-names>M.</given-names></name> <name><surname>Tremblay</surname> <given-names>R.</given-names></name> <name><surname>C&#x000F4;t&#x000E9;</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Machine learning assessment of early life factors predicting suicide attempt in adolescence or young adulthood</article-title>. <source>JAMA Netw. Open</source> <volume>4</volume>:<fpage>e211450</fpage>. doi: <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2021.1450</pub-id><pub-id pub-id-type="pmid">33710292</pub-id></mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Orellana</surname> <given-names>J.</given-names></name> <name><surname>Ribeiro</surname> <given-names>M.</given-names></name> <name><surname>Barbieri</surname> <given-names>M.</given-names></name> <name><surname>Saraiva</surname> <given-names>M. C.</given-names></name> <name><surname>Cardoso</surname> <given-names>V.</given-names></name> <name><surname>Bettiol</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Mental disorders in adolescents, youth, and adults in the RPS birth cohort consortium (Ribeir&#x000E3;o Preto, Pelotas and S&#x000E3;o Lu&#x000ED;s), Brazil</article-title>. <source>Cad. Saude Publica</source> <volume>36</volume>:<fpage>e00154319</fpage>. doi: <pub-id pub-id-type="doi">10.1590/0102-311x00154319</pub-id><pub-id pub-id-type="pmid">32022176</pub-id></mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Orri</surname> <given-names>M.</given-names></name> <name><surname>Scardera</surname> <given-names>S.</given-names></name> <name><surname>Perret</surname> <given-names>L.</given-names></name> <name><surname>Bolanis</surname> <given-names>D.</given-names></name> <name><surname>Temcheff</surname> <given-names>C.</given-names></name> <name><surname>S&#x000E9;guin</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Mental health problems and risk of suicidal ideation and attempts in adolescents</article-title>. <source>Pediatrics</source> <volume>146</volume>:<fpage>e20193823</fpage>. doi: <pub-id pub-id-type="doi">10.1542/peds.2019-3823</pub-id><pub-id pub-id-type="pmid">32513840</pub-id></mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pedregosa</surname> <given-names>F.</given-names></name> <name><surname>Varoquaux</surname> <given-names>G.</given-names></name> <name><surname>Gramfort</surname> <given-names>A.</given-names></name> <name><surname>Michel</surname> <given-names>V.</given-names></name> <name><surname>Thirion</surname> <given-names>B.</given-names></name> <name><surname>Grisel</surname> <given-names>O.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Scikit-learn: machine learning in Python</article-title>. <source>J. Mach. Learn. Res</source>. <volume>12</volume>, <fpage>2825</fpage>&#x02013;<lpage>2830</lpage>. Available online at: <ext-link ext-link-type="uri" xlink:href="http://scikit-learn.sourceforge.net">http://scikit-learn.sourceforge.net</ext-link> (Accessed January, 2026).</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pollock</surname> <given-names>N.</given-names></name></person-group> (<year>2019</year>). <article-title>Place, the built environment, and means restriction in suicide prevention</article-title>. <source>Int. J. Environ. Res. Public Health</source> <volume>16</volume>:<fpage>4389</fpage>. doi: <pub-id pub-id-type="doi">10.3390/ijerph16224389</pub-id><pub-id pub-id-type="pmid">31717635</pub-id></mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Richter</surname> <given-names>M.</given-names></name> <name><surname>Emden</surname> <given-names>D.</given-names></name> <name><surname>Leenings</surname> <given-names>R.</given-names></name> <name><surname>Winter</surname> <given-names>N. R.</given-names></name> <name><surname>Mikolajczyk</surname> <given-names>R.</given-names></name> <name><surname>Massag</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Generalizability of clinical prediction models in mental health</article-title>. <source>Mol. Psychiatry</source> <volume>30</volume>, <fpage>3632</fpage>&#x02013;<lpage>3639</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41380-025-02950-0</pub-id><pub-id pub-id-type="pmid">40108256</pub-id></mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Robinson</surname> <given-names>J.</given-names></name> <name><surname>Bailey</surname> <given-names>E.</given-names></name> <name><surname>Witt</surname> <given-names>K.</given-names></name> <name><surname>Stefanac</surname> <given-names>N.</given-names></name> <name><surname>Milner</surname> <given-names>A.</given-names></name> <name><surname>Currier</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>What works in youth suicide prevention? A systematic review and meta-analysis</article-title>. <source>EClinicalMedicine</source> <volume>4&#x02013;5</volume>, <fpage>52</fpage>&#x02013;<lpage>91</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.eclinm.2018.10.004</pub-id><pub-id pub-id-type="pmid">31193651</pub-id></mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Scoliers</surname> <given-names>G.</given-names></name> <name><surname>Portzky</surname> <given-names>G.</given-names></name> <name><surname>van Heeringen</surname> <given-names>K.</given-names></name> <name><surname>Audenaert</surname> <given-names>K.</given-names></name></person-group> (<year>2009</year>). <article-title>Sociodemographic and psychopathological risk factors for repetition of attempted suicide: a 5-year follow-up study</article-title>. <source>Arch. Suicide Res</source>. <volume>13</volume>, <fpage>201</fpage>&#x02013;<lpage>213</lpage>. doi: <pub-id pub-id-type="doi">10.1080/13811110902835130</pub-id><pub-id pub-id-type="pmid">19590995</pub-id></mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Su</surname> <given-names>C.</given-names></name> <name><surname>Aseltine</surname> <given-names>R.</given-names></name> <name><surname>Doshi</surname> <given-names>R.</given-names></name> <name><surname>Chen</surname> <given-names>K.</given-names></name> <name><surname>Rogers</surname> <given-names>S.</given-names></name> <name><surname>Wang</surname> <given-names>F.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Machine learning for suicide risk prediction in children and adolescents with electronic health records</article-title>. <source>Transl. Psychiatry</source> <volume>10</volume>:<fpage>413</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41398-020-01100-0</pub-id><pub-id pub-id-type="pmid">33243979</pub-id></mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Uddin</surname> <given-names>R.</given-names></name> <name><surname>Burton</surname> <given-names>N.</given-names></name> <name><surname>Maple</surname> <given-names>M.</given-names></name> <name><surname>Khan</surname> <given-names>S.</given-names></name> <name><surname>Khan</surname> <given-names>A.</given-names></name></person-group> (<year>2019</year>). <article-title>Suicidal ideation, suicide planning, and suicide attempts among adolescents in 59 low-income and middle-income countries: a population-based study</article-title>. <source>Lancet Child Adolesc. Health</source> <volume>3</volume>, <fpage>223</fpage>&#x02013;<lpage>233</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S2352-4642(18)30403-6</pub-id><pub-id pub-id-type="pmid">30878117</pub-id></mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>van Mens</surname> <given-names>K.</given-names></name> <name><surname>de Schepper</surname> <given-names>C.</given-names></name> <name><surname>Wijnen</surname> <given-names>B.</given-names></name> <name><surname>Koldijk</surname> <given-names>S.</given-names></name> <name><surname>Schnack</surname> <given-names>H.</given-names></name> <name><surname>de Looff</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Predicting future suicidal behaviour in young adults, with different machine learning techniques: a population-based longitudinal study</article-title>. <source>J. Affect. Disord</source>. <volume>271</volume>, <fpage>169</fpage>&#x02013;<lpage>177</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jad.2020.03.081</pub-id><pub-id pub-id-type="pmid">32479313</pub-id></mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Van Meter</surname> <given-names>A.</given-names></name> <name><surname>Knowles</surname> <given-names>E.</given-names></name> <name><surname>Mintz</surname> <given-names>E.</given-names></name></person-group> (<year>2023</year>). <article-title>Systematic review and meta-analysis: international prevalence of suicidal ideation and attempt in youth</article-title>. <source>J. Am. Acad. Child Adolesc. Psychiatry</source> <volume>62</volume>, <fpage>973</fpage>&#x02013;<lpage>986</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jaac.2022.07.867</pub-id><pub-id pub-id-type="pmid">36563876</pub-id></mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Varoquaux</surname> <given-names>G.</given-names></name></person-group> (<year>2018</year>). <article-title>Cross-validation failure: small sample sizes lead to large error bars</article-title>. <source>Neuroimage</source> <volume>180</volume>, <fpage>68</fpage>&#x02013;<lpage>77</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neuroimage.2017.06.061</pub-id><pub-id pub-id-type="pmid">28655633</pub-id></mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vial</surname> <given-names>T.</given-names></name> <name><surname>Almon</surname> <given-names>A.</given-names></name></person-group> (<year>2023</year>). <article-title>Artificial intelligence in mental health therapy for children and adolescents</article-title>. <source>JAMA Pediatr</source>. <volume>177</volume>, <fpage>1251</fpage>&#x02013;<lpage>1252</lpage>. doi: <pub-id pub-id-type="doi">10.1001/jamapediatrics.2023.4212</pub-id><pub-id pub-id-type="pmid">37843842</pub-id></mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Whalen</surname> <given-names>D.</given-names></name> <name><surname>Hennefield</surname> <given-names>L.</given-names></name> <name><surname>Elsayed</surname> <given-names>N.</given-names></name> <name><surname>Tillman</surname> <given-names>R.</given-names></name> <name><surname>Barch</surname> <given-names>D.</given-names></name> <name><surname>Luby</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Trajectories of suicidal thoughts and behaviors from preschool through late adolescence</article-title>. <source>J. Am. Acad. Child Adolesc. Psychiatry</source> <volume>61</volume>, <fpage>676</fpage>&#x02013;<lpage>685</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jaac.2021.08.020</pub-id><pub-id pub-id-type="pmid">34506928</pub-id></mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Zaki</surname> <given-names>M.</given-names></name> <name><surname>Meira</surname> <given-names>W.</given-names></name></person-group> (<year>2014</year>). <source>Data Mining and Analysis: Fundamental Concepts and Algorithms</source>. <publisher-loc>Cambridge</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>. doi: <pub-id pub-id-type="doi">10.1017/CBO9780511810114</pub-id></mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/532820/overview">Gregory R. Hart</ext-link>, Institute for Disease Modeling (IDM), United States</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3041906/overview">Soomin Shin</ext-link>, Korea National University of Transportation, Republic of Korea</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3134685/overview">Kyungwon Kim</ext-link>, Incheon National University, Republic of Korea</p>
</fn>
</fn-group>
</back>
</article>
