<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychiatry</journal-id>
<journal-title>Frontiers in Psychiatry</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychiatry</abbrev-journal-title>
<issn pub-type="epub">1664-0640</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyt.2023.1208856</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Psychiatry</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Validation of natural language processing methods capturing semantic incoherence in the speech of patients with non-affective psychosis</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Just</surname>
<given-names>Sandra Anna</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<xref rid="c001" ref-type="corresp"><sup>&#x002A;</sup></xref>
<xref rid="fn0001" ref-type="author-notes"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/987886/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Br&#x00F6;cker</surname>
<given-names>Anna-Lena</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<xref rid="fn0001" ref-type="author-notes"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/838985/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ryazanskaya</surname>
<given-names>Galina</given-names>
</name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Nenchev</surname>
<given-names>Ivan</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Schneider</surname>
<given-names>Maria</given-names>
</name>
<xref rid="aff3" ref-type="aff"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bermpohl</surname>
<given-names>Felix</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1579668/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Heinz</surname>
<given-names>Andreas</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/5872/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Montag</surname>
<given-names>Christiane</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/53384/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Psychiatry and Neurosciences, Campus Charit&#x00E9; Mitte, Charit&#x00E9; &#x2013; Universit&#x00E4;tsmedizin Berlin, Corporate Member of Freie Universit&#x00E4;t Berlin and Humboldt Universit&#x00E4;t zu Berlin</institution>, <addr-line>Berlin</addr-line>, <country>Germany</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Linguistics, University of Potsdam</institution>, <addr-line>Potsdam</addr-line>, <country>Germany</country></aff>
<aff id="aff3"><sup>3</sup><institution>IPB Institut f&#x00FC;r Integrative Psychotherapieausbildung Berlin, MSB Medical School Berlin, GmbH</institution>, <addr-line>Berlin</addr-line>, <country>Germany</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0002"><p>Edited by: Olivier Dufor, Yncr&#x00E9;a Hauts-de-France, France</p></fn>
<fn fn-type="edited-by" id="fn0003"><p>Reviewed by: Alban Voppel, University Medical Center Groningen, Netherlands; Marta Bosia, Vita-Salute San Raffaele University, Italy; Peter F. Liddle, University of Nottingham, United Kingdom</p></fn>
<corresp id="c001">&#x002A;Correspondence: Sandra Anna Just, <email>sandra-anna.just@charite.de</email></corresp>
<fn fn-type="equal" id="fn0001"><p><sup>&#x2020;</sup>These authors have contributed equally to this work and share first authorship</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>25</day>
<month>07</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1208856</elocation-id>
<history>
<date date-type="received">
<day>19</day>
<month>04</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>07</day>
<month>07</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2023 Just, Br&#x00F6;cker, Ryazanskaya, Nenchev, Schneider, Bermpohl, Heinz and Montag.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Just, Br&#x00F6;cker, Ryazanskaya, Nenchev, Schneider, Bermpohl, Heinz and Montag</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec id="sec1">
<title>Background</title>
<p>Impairments in speech production are a core symptom of non-affective psychosis (NAP). While traditional clinical ratings of patients&#x2019; speech involve a subjective human factor, modern methods of natural language processing (NLP) promise an automatic and objective way of analyzing patients&#x2019; speech. This study aimed to validate NLP methods for analyzing speech production in NAP patients.</p>
</sec>
<sec id="sec2">
<title>Methods</title>
<p>Speech samples from patients with a diagnosis of schizophrenia or schizoaffective disorder were obtained at two measurement points, 6&#x2009;months apart. Out of <italic>N</italic>&#x2009;=&#x2009;71 patients at T<sub>1</sub>, speech samples were also available for <italic>N</italic>&#x2009;=&#x2009;54 patients at T<sub>2</sub>. Global and local models of semantic coherence as well as different word embeddings (word2vec vs. GloVe) were applied to the transcribed speech samples. They were tested and compared regarding their correlation with clinical ratings and external criteria from cross-sectional and longitudinal measurements.</p>
</sec>
<sec id="sec3">
<title>Results</title>
<p>Results did not show differences for global vs. local coherence models and found more significant correlations between word2vec models and clinically relevant outcome variables than for GloVe models. Exploratory analysis of longitudinal data did not yield significant correlation with coherence scores.</p>
</sec>
<sec id="sec4">
<title>Conclusion</title>
<p>These results indicate that natural language processing methods need to be critically validated in more studies and carefully selected before clinical application.</p>
</sec>
</abstract>
<kwd-group>
<kwd>coherence</kwd>
<kwd>speech analysis</kwd>
<kwd>automated analysis</kwd>
<kwd>natural language processing</kwd>
<kwd>artificial intelligence</kwd>
<kwd>psychosis</kwd>
<kwd>schizophrenia</kwd>
<kwd>formal thought disorder</kwd>
</kwd-group>
<contract-num rid="cn1">BIH_PRO_279</contract-num>
<contract-num rid="cn2">S112/10211/16</contract-num>
<contract-sponsor id="cn1">Berlin Institute of Health</contract-sponsor>
<contract-sponsor id="cn2">Deutsche Gesellschaft f&#x00FC;r Psychoanalyse, Psychotherapie, Psychosomatik und Tiefenpsychologie (DGPT e.V.) and by K&#x00F6;hler Stiftung</contract-sponsor>
<counts>
<fig-count count="0"/>
<table-count count="3"/>
<equation-count count="2"/>
<ref-count count="44"/>
<page-count count="8"/>
<word-count count="6799"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Schizophrenia</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="sec5" sec-type="intro">
<label>1.</label>
<title>Introduction</title>
<p>Patients with non-affective psychosis (NAP), such as schizophrenia and schizoaffective disorder, can show limited function in a range of cognitive, emotional, and social abilities, including speech comprehension and speech production, affecting vocabulary, semantics, pragmatics, cohesion, and coherence (<xref ref-type="bibr" rid="ref1">1</xref>). Incoherence, one of the most frequently examined features of speech in patients with NAP, is a type of formal thought disorder (FTD) and defined in psychiatry as the loss of meaningful associations in patients&#x2019; speech (<xref ref-type="bibr" rid="ref2 ref3 ref4">2&#x2013;4</xref>). Jaspers (<xref ref-type="bibr" rid="ref5">5</xref>) and Bleuler (<xref ref-type="bibr" rid="ref6">6</xref>) already described incoherence as an essential aspect of the altered self-experience in schizophrenia, which is considered a core feature of the disorder. Incoherent speech can entail severe impairments of functioning and impede societal inclusion as well as complicate therapeutic interventions (<xref ref-type="bibr" rid="ref2">2</xref>, <xref ref-type="bibr" rid="ref7">7</xref>). In linguistics, discourse coherence refers to the connectedness of speech beyond the level of individual sentences, which involves topicality, reference, and thematic structure of a text (<xref ref-type="bibr" rid="ref8">8</xref>). Discourse coherence is maintained on many different levels &#x2013; intonational, lexical, syntactic, logical. It is present as local coherence, connecting sentences and their parts, as well as global coherence, as the overall topic of speech. Incoherence in the speech of patients with a NAP diagnosis can be evaluated by clinical experts, in expert-rating scales such as the Thought, Language and Communication Scale (TLC, <xref ref-type="bibr" rid="ref4">4</xref>), or the Scale for the Assessment of Positive Symptoms (SAPS, <xref ref-type="bibr" rid="ref9">9</xref>). However, clinical ratings of coherence are naturally prone to bias because they depend on the clinician&#x2019;s intuition and ability to comprehend patients, i.e., on their mental representation of patients&#x2019; speech (<xref ref-type="bibr" rid="ref10">10</xref>). In contrast, modern methods of Natural Language Processing (NLP), a field in Machine Learning, offer means of analyzing speech automatically and consistently &#x2013; and they could potentially be more objective than clinical assessments. NLP methods may find subtle changes in patients&#x2019; speech that are not confounded by the listener&#x2019;s interpretation of what they hear or read and potentially not detectable by human listeners, even when they are trained clinicians. This is what makes NLP and machine learning methods in general powerful: possibly detecting patterns that are not noticeable to humans, going beyond clinical impressions and making NLP methods potentially useful in early detection of psychosis onset and exacerbation.</p>
<p>By now, many studies have reported evidence for the association between coherence scores and patient status: Coherence scores were shown to differentiate between NAP patients or people at clinical high risk (CHR) for psychosis versus healthy controls (<xref ref-type="bibr" rid="ref11 ref12 ref13 ref14 ref15 ref16">11&#x2013;16</xref>), and predict psychosis onset in CHR populations (<xref ref-type="bibr" rid="ref17">17</xref>, <xref ref-type="bibr" rid="ref18">18</xref>). Moreover, multiple studies have found that coherence measures were significantly correlated with clinical ratings of FTD in NAP patients (<xref ref-type="bibr" rid="ref15">15</xref>, <xref ref-type="bibr" rid="ref16">16</xref>) and people at CHR for psychosis (<xref ref-type="bibr" rid="ref19">19</xref>). Some researchers have suggested that incoherence may be a promising biomarker for NAP and could be linked to other biomarkers in genetic or neuroscientific research in the future (<xref ref-type="bibr" rid="ref20">20</xref>, <xref ref-type="bibr" rid="ref21">21</xref>). However, the clinical relevance and therapeutic value of NLP methods in psychiatry still needs to be proven &#x2013; especially against the background that a prognostic assessment may significantly affect or even stigmatize individuals (<xref ref-type="bibr" rid="ref22">22</xref>) and that patients may be triggered by stressful situations including clinical settings (<xref ref-type="bibr" rid="ref23">23</xref>).</p>
<p>Moreover, there is a need for more NLP studies with non-English speaking patients since current coherence models appear to have limited generalizability across different languages (<xref ref-type="bibr" rid="ref24">24</xref>). In addition, studies on coherence in NAP have used a large variety of different models, embeddings and training data, raising the question which approach may promise the highest predictive value. Approaches to discourse coherence that have been successfully automated are global and local coherence as well as tangentiality (i.e., modeling how relevant a response is to a question). Elvev&#x00E5;g et al. were the first to introduce an automated approach to measuring global coherence and tangentiality, while the incoherence model by Bedi et al. automated local coherence. The found association between tangentiality and clinical ratings of FTD could not be replicated (<xref ref-type="bibr" rid="ref16">16</xref>, <xref ref-type="bibr" rid="ref25">25</xref>, <xref ref-type="bibr" rid="ref26">26</xref>). Iter et al. (<xref ref-type="bibr" rid="ref27">27</xref>) used tangentiality and local coherence methods with various embeddings and sentence-averaging methods &#x2013; only four out of the 20 models tested were able to differentiate patients from controls. Similarly in another study (<xref ref-type="bibr" rid="ref25">25</xref>), three out of 13 coherence scores showed group differences between CHR individuals and controls, and none were significant after correcting for multiple testing. To this end, NLP methods need to be further validated.</p>
<p>The general aim of this primarily methodological, exploratory study was to further validate NLP methods for coherence analysis in NAP, namely local and global coherence, adapted from Bedi et al. and Elvev&#x00E5;g et al., as well as to compare two different word embeddings [GloVe (<xref ref-type="bibr" rid="ref28">28</xref>) vs. word2vec (<xref ref-type="bibr" rid="ref29">29</xref>)]. We chose coherence over tangentiality since coherence scores have outperformed tangentiality in former research (<xref ref-type="bibr" rid="ref16">16</xref>). Since coherence scores may represent different patterns in patients&#x2019; speech compared to clinical ratings, they should not only be validated against clinical ratings, but also against external criteria which are associated with functioning and psychopathology and may represent important events such as exacerbation. And as the potential clinical and therapeutic value of algorithms lies in their predictive power, we aim to include data both from cross-sectional and longitudinal measurements. If NLP methods can predict the aspects of psychotic disorders beyond clinical ratings, this could further prove their usability in psychiatry, potentially help to identify individuals at high risk and at best prevent exacerbation or hospital admission. In summary, the specific aims of this study were first, comparison of coherence scores derived from different NLP methods of coherence analysis (global vs. local), second, comparison of different word embeddings (GloVe vs. word2vec), and third, validation against clinical ratings and external criteria from cross-sectional and longitudinal measurement points. Our analysis is exploratory, aiming to pave the way for future validation studies.</p>
</sec>
<sec id="sec6" sec-type="methods">
<label>2.</label>
<title>Method</title>
<sec id="sec7">
<label>2.1.</label>
<title>Participants</title>
<p>The study is based on a sub-sample of the MPP-S study (<ext-link xlink:href="http://ClinicalTrials.gov" ext-link-type="uri">ClinicalTrials.gov</ext-link>-ID: NCT02576613), a randomized controlled trial called: &#x201C;Modified Psychodynamic Psychotherapy for Patients with Schizophrenia.&#x201D; It was conducted from December 2015 to December 2021 in cooperation with the International Psychoanalytic University (IPU) at the Charit&#x00E9; Universit&#x00E4;tsmedizin in Berlin, Germany &#x2013; including a baseline and further measurements after 6 months, one, two, and 6 years. A sub-sample was taken from the 6 months follow-up, defined as time one (T<sub>1</sub>), as this was the first time that speech samples were collected in the study.</p>
<p><italic>N</italic>&#x2009;=&#x2009;71 patients were included with a diagnosis of schizophrenia (<italic>n</italic>&#x2009;=&#x2009;51) or schizoaffective disorder (<italic>n</italic>&#x2009;=&#x2009;20), according to Diagnostic and Statistical Manual of Mental Disorders, Fourth Edition, Text Revision (DSM-IV-TR, <xref ref-type="bibr" rid="ref30">30</xref>), confirmed by trained clinicians. For this study, transcribed speech samples were only available from T<sub>1</sub>. Clinical data for the sample were taken from T<sub>1</sub> and, in order to include longitudinal data, from a one-year follow-up measurement after baseline, time two (T<sub>2</sub>). Not all patients had participated at T<sub>2</sub>, so that longitudinal data were available for <italic>n</italic>&#x2009;=&#x2009;54 out of the initial 71 patients. Inclusion criteria beyond diagnosis were age between 18 and 65&#x2009;years and native proficiency in German language. Exclusion criteria were organic brain diseases, other relevant somatic diseases, active substance dependence, or acute suicidality. Sociodemographic data and characteristics of illness are presented in <xref rid="tab1" ref-type="table">Table 1</xref>. The study was approved by the ethics committee of the Charit&#x00E9; Universit&#x00E4;tsmedizin Berlin (approval number: EA1/200/15). All participants provided written informed consent.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Characteristics of the sample.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th align="center" valign="top">T<sub>1</sub> (<italic>N</italic> =&#x2009;71)</th>
<th align="center" valign="top">T<sub>2</sub> (<italic>N</italic> =&#x2009;54)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Age (years)</td>
<td align="char" valign="top" char="(">38.83 (&#x00B1;10.44)<xref rid="tfn1" ref-type="table-fn"><sup>a</sup></xref></td>
<td align="char" valign="top" char="(">39.19 (&#x00B1;10.39)</td>
</tr>
<tr>
<td align="left" valign="top">Sex (male)</td>
<td align="char" valign="top" char="(">45 (63.4%)<xref rid="tfn2" ref-type="table-fn"><sup>b</sup></xref></td>
<td align="char" valign="top" char="(">33 (61.1%)</td>
</tr>
<tr>
<td align="left" valign="top">Verbal IQ</td>
<td align="char" valign="top" char="(">105.35 (&#x00B1;12.15)</td>
<td align="char" valign="top" char="(">105.54 (&#x00B1;12.28)</td>
</tr>
<tr>
<td align="left" valign="top">Education years</td>
<td align="char" valign="top" char="(">15.32 (&#x00B1;3.42)</td>
<td align="char" valign="top" char="(">15.98 (&#x00B1;3.48)</td>
</tr>
<tr>
<td align="left" valign="top" colspan="3">Main diagnosis</td>
</tr>
<tr>
<td align="left" valign="top">F20.x</td>
<td align="char" valign="top" char="(">51 (71.8%)</td>
<td align="char" valign="top" char="(">38 (70.4%)</td>
</tr>
<tr>
<td align="left" valign="top">F25.x</td>
<td align="char" valign="top" char="(">20 (28.2.%)</td>
<td align="char" valign="top" char="(">16 (29.6%)</td>
</tr>
<tr>
<td align="left" valign="top">Patients with comorbid psychiatric disorder</td>
<td align="char" valign="top" char="(">15 (21.1%)</td>
<td align="char" valign="top" char="(">12 (22.2%)</td>
</tr>
<tr>
<td align="left" valign="top">Patients with comorbid somatic disorder</td>
<td align="char" valign="top" char="(">29 (40.8%)</td>
<td align="char" valign="top" char="(">24 (44.4%)</td>
</tr>
<tr>
<td align="left" valign="top">Patients with current antipsychotic medication</td>
<td align="char" valign="top" char="(">62 (87.3%)</td>
<td align="char" valign="top" char="(">47 (87.0%)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="tfn1">
<label>a</label>
<p>Mean (standard deviation).</p>
</fn>
<fn id="tfn2">
<label>b</label>
<p>Frequency (percent).</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec8">
<label>2.2.</label>
<title>Measures</title>
<sec id="sec9">
<label>2.2.1.</label>
<title>Natural language processing</title>
<sec id="sec10">
<label>2.2.1.1.</label>
<title>Speech samples</title>
<p>We used the Narrative of Emotions Task (NET, <xref ref-type="bibr" rid="ref31">31</xref>) to collect speech samples, a short semi-structured interview, originally developed to assess social cognition, at T<sub>1</sub>. We used a short version of the NET, translated into German, including three questions about four basic emotions: sadness, fear, anger, and happiness: (1) What does this emotion mean to you? (2) Describe a situation where you felt this emotion, and (3) Why do you think you felt this emotion in this situation? All interviews were conducted by trained clinicians (including SJ, A-LB, CM), recorded and manually transcribed by two authors (SJ, MS), following defined rules for transcription. Collecting speech samples from answers to (semi-)structured questions is a frequent and economic method in NLP studies (<xref ref-type="bibr" rid="ref11">11</xref>, <xref ref-type="bibr" rid="ref15">15</xref>, <xref ref-type="bibr" rid="ref16">16</xref>, <xref ref-type="bibr" rid="ref18">18</xref>, <xref ref-type="bibr" rid="ref27">27</xref>), increases comparability, and has been shown to outperform analysis of free conversational speech (<xref ref-type="bibr" rid="ref14">14</xref>).</p>
</sec>
<sec id="sec11">
<label>2.2.1.2.</label>
<title>Annotation</title>
<p>The data consisted of 71 recorded and transcribed NET interviews. Transcripts underwent systematic preprocessing to reduce bias in analysis (<xref ref-type="bibr" rid="ref15">15</xref>, <xref ref-type="bibr" rid="ref16">16</xref>, <xref ref-type="bibr" rid="ref27">27</xref>). Uniform sentence annotation guidelines were established for manual coding of sentence boundaries based on syntax, as has been done elsewhere (<xref ref-type="bibr" rid="ref24">24</xref>). Clear annotation guidelines for sentence separation are crucial as automated coherence metrics are calculated over sentences and thus, can be influenced by sentence boundary decisions (<xref ref-type="bibr" rid="ref32">32</xref>, <xref ref-type="bibr" rid="ref33">33</xref>). A sentence was defined as at least containing a subject and verb (e.g., &#x201C;John eats.&#x201D;). The main and the corresponding side clauses were grouped together as one sentence (e.g., &#x201C;John eats when he is hungry.&#x201D;). Incomplete main clauses were ended on a period (&#x201C;John eats when. No, I wanted to say something else.&#x201D;), main clauses connected by conjunctions were separated (&#x201C;John eats when he is hungry. And he laughs when he is happy. And he sleeps when he is tired.&#x201D;).</p>
</sec>
<sec id="sec12">
<label>2.2.1.3.</label>
<title>Preprocessing</title>
<p>The interviews were split into questions on each emotion, and the questions themselves were left out of the analysis. Verbal fillers (such as &#x201C;ehm&#x201D;) and German stopwords were removed from the transcripts. The words were lemmatized (e. i. put to their dictionary form). The resulting transcripts had an average length of 243 words (range 57&#x2013;824) with 140 unique words (range 48&#x2013;358). The interviews were split into sentences using nltk.sent_tokenize.</p>
</sec>
<sec id="sec13">
<label>2.2.1.4.</label>
<title>Vector-based coherence metrics</title>
<p>One of the key NLP methods is word embeddings. In this method, words in a text are mathematically represented as vectors. Different word embeddings utilize different methods of vectorization (see Almeida and Xex&#x00E9;o (<xref ref-type="bibr" rid="ref34">34</xref>) for an overview). Semantic coherence can be approximated with a mathematical function on these vectors so that semantically similar words have vectors that are closer together (<xref ref-type="bibr" rid="ref17">17</xref>). This definition does not try to reflect whether the discourse is intelligible but focuses on how semantically similar the words or sentences are to each other.</p>
<p>Word2vec (<xref ref-type="bibr" rid="ref29">29</xref>) and GloVe (<xref ref-type="bibr" rid="ref28">28</xref>) are traditional word embedding models which represent words as vectors and have been most widely used in NLP research with NAP patients. To ensure comparability with former research (<xref ref-type="bibr" rid="ref12">12</xref>, <xref ref-type="bibr" rid="ref14 ref15 ref16">14&#x2013;16</xref>, <xref ref-type="bibr" rid="ref20">20</xref>, <xref ref-type="bibr" rid="ref27">27</xref>, <xref ref-type="bibr" rid="ref35">35</xref>), we decided to use word2vec and GloVe models in this study. Moreover, more advanced word embeddings such as BERT and ELMo appear to yield similar coherence scores as compared to word2vec and GloVe (<xref ref-type="bibr" rid="ref25">25</xref>).</p>
<p>Two open source vectorization models were used to compare their task-sensitivity. The first model used was the Spacy&#x2019;s (<xref ref-type="bibr" rid="ref36">36</xref>) tok2vec model (de_core_news_lg, specifically) trained on OSCAR Common Crawl and German Wikipedia. The second model was a GloVe model trained on German Wikipedia provided by deepset (<xref ref-type="bibr" rid="ref37">37</xref>). The words absent from the models&#x2019; vocabularies (out-of-vocabulary words) were left out of the analysis. The word vectors were averaged across the sentence to obtain a sentence vector.</p>
<p>Two cosine similarity-based metrics were used to assess the coherence of the interviews. Cosine similarity is a measure of vector proximity used to assess semantic and grammatical similarity of words or sentences encoded by the vectors.</p>
<p>The first metric is local coherence (or first-order coherence), defined as the cosine similarities between adjacent sentences (<xref ref-type="bibr" rid="ref17">17</xref>). This coherence metric has been the most widely used metric in NLP research with schizophrenia patients (<xref ref-type="bibr" rid="ref24">24</xref>). The similarity is averaged across all sentence pairs in the text.</p>
<disp-formula id="E1">
<mml:math id="M1">
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi mathvariant="normal"> </mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>h</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>S</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>N</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mi>cos</mml:mi>
<mml:mspace width="thickmathspace"/>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mi mathvariant="normal">,</mml:mi>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mi>N</mml:mi>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>S</italic> is a list of sentences from <inline-formula>
<mml:math id="M2">
<mml:mrow>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> to <inline-formula>
<mml:math id="M3">
<mml:mrow>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mi>N</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
<p>The second metric is global coherence, defined as the cosine similarity between each sentence and the average of all sentences [adapted from Elvev&#x00E5;g et al. (<xref ref-type="bibr" rid="ref11">11</xref>)]. The similarity is averaged across all sentences in the text.</p>
<disp-formula id="E2">
<mml:math id="M4">
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>b</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi mathvariant="normal"> </mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>h</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>S</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>N</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mi>cos</mml:mi>
<mml:mspace width="thickmathspace"/>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mi mathvariant="normal">,</mml:mi>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mi>N</mml:mi>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M5">
<mml:mrow>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi mathvariant="normal">i=1</mml:mi>
</mml:mrow>
<mml:mi mathvariant="normal">N</mml:mi>
</mml:msubsup>
<mml:msub>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mi mathvariant="normal">N</mml:mi>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula>, and <italic>S</italic> is a list of sentences from <inline-formula>
<mml:math id="M6">
<mml:mrow>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>to <inline-formula>
<mml:math id="M7">
<mml:mrow>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mi>N</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
<p>Both metrics were calculated for each question for each participant twice, based on the two different vectorization models. The metrics were then averaged across the emotion questions to obtain four metrics of coherence per participant, two local and two global coherence scores, one for each model.</p>
<p>The code used for the analysis is available on request.</p>
</sec>
</sec>
<sec id="sec14">
<label>2.2.2.</label>
<title>Clinical measures</title>
<p>The expert-rated Positive and Negative Syndrome Scale was used to assess psychopathology. The scale contains 30 items, rated on a 7-point Likert scale (from 1&#x2009;=&#x2009;absent to 7&#x2009;=&#x2009;extreme). In further analysis, we applied a five-factor solution derived from van der Gaag et al. (<xref ref-type="bibr" rid="ref38">38</xref>, <xref ref-type="bibr" rid="ref39">39</xref>) to the data, namely: positive and negative symptoms, disorganization, excitement, and emotional distress.</p>
<p>The MINI-ICF is a short version of the WHO International Classification of Functioning, Disability and Health where experts rate 13 subdimensions of functioning on a 5-point Likert scale (from 0&#x2009;=&#x2009;no impairment to 4&#x2009;=&#x2009;total disability). The rating requires a comparison between the actual and the premorbid state, so that disease-related changes in functioning are represented. A sum score was built for further analyses.</p>
<p>We selected external criteria of illness which are associated with functioning and psychopathology and may represent severity of illness beyond clinical ratings. External criteria we included were days of inpatient psychiatric treatment during the last 2.5&#x2009;years and 0.5&#x2009;years before T<sub>1</sub> as well as 0.5&#x2009;years after T<sub>1</sub>, and two characteristics of illness (age at psychosis onset, duration of illness). These variables were assessed as part of an interview regarding sociodemographic and medical characteristics.</p>
<p>The German vocabulary test Wortschatztest (WST, <xref ref-type="bibr" rid="ref40">40</xref>) was used to control for verbal IQ.</p>
</sec>
</sec>
<sec id="sec15">
<label>2.3.</label>
<title>Statistics</title>
<p>Statistical analysis was performed using IBM SPSS Statistics for Windows (version 29.0, SPSS Inc., Armonk, NY, United States). Pearson correlations were computed to examine the relationship between coherence scores and continuous outcome variables at T<sub>1</sub>. For categorial variables (sex, antipsychotic medication), independent <italic>t</italic>-tests were computed to analyze mean differences in coherence scores. Partial correlations were computed to examine the relationship between the coherence scores at T<sub>1</sub> and the outcome variables at T<sub>2</sub> while controlling for expression of the outcome variables at T<sub>1</sub>. The correlational analyses are exploratory. Thus, <italic>p</italic>-values are only given for descriptive reasons.</p>
</sec>
</sec>
<sec id="sec16" sec-type="results">
<label>3.</label>
<title>Results</title>
<sec id="sec17">
<label>3.1.</label>
<title>Cross-sectional data: correlations at T<sub>1</sub></title>
<p><xref rid="tab2" ref-type="table">Table 2</xref> shows the mean coherence scores and expression of outcome variables of participants, <xref rid="tab3" ref-type="table">Table 3</xref> shows all exploratory correlations at T<sub>1</sub>. The four coherence scores were highly correlated with each other. Comparison of local vs. global coherence scores did not yield divergent results. Except for one case, where the global coherence score of the GloVe model was significantly correlated with the sum score of the MINI-ICF and its local coherence score was not, all global and local coherence scores of the GloVe and word2vec model showed the same significant correlations.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Coherence scores and clinical outcome variables.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th align="center" valign="top">Participants&#x2019; (<italic>N</italic> =&#x2009;71) scores at T<sub>1</sub> <italic>M</italic> (<italic>SD</italic>)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Local coherence GloVe</td>
<td align="char" valign="top" char="(">0.77 (&#x00B1;0.07)</td>
</tr>
<tr>
<td align="left" valign="top">Global coherence GloVe</td>
<td align="char" valign="top" char="(">0.86 (&#x00B1;0.05)</td>
</tr>
<tr>
<td align="left" valign="top">Local coherence word2vec</td>
<td align="char" valign="top" char="(">0.57 (&#x00B1;0.07)</td>
</tr>
<tr>
<td align="left" valign="top">Global coherence word2vec</td>
<td align="char" valign="top" char="(">0.72 (&#x00B1;0.05)</td>
</tr>
<tr>
<td align="left" valign="top">PANSS positive symptoms</td>
<td align="char" valign="top" char="(">13.34 (&#x00B1;6.25)</td>
</tr>
<tr>
<td align="left" valign="top">PANSS negative symptoms</td>
<td align="char" valign="top" char="(">15.66 (&#x00B1;6.86)</td>
</tr>
<tr>
<td align="left" valign="top">PANSS disorganized symptoms</td>
<td align="char" valign="top" char="(">16.87 (&#x00B1;5.91)</td>
</tr>
<tr>
<td align="left" valign="top">PANSS excitement</td>
<td align="char" valign="top" char="(">12.62 (&#x00B1;3.97)</td>
</tr>
<tr>
<td align="left" valign="top">PANSS emotional distress</td>
<td align="char" valign="top" char="(">17.32 (&#x00B1;5.85)</td>
</tr>
<tr>
<td align="left" valign="top">Mini-ICF sum score</td>
<td align="char" valign="top" char="(">16.3 (&#x00B1;9.34)</td>
</tr>
<tr>
<td align="left" valign="top">Age at psychosis onset</td>
<td align="char" valign="top" char="(">25.36 (&#x00B1;7.63)</td>
</tr>
<tr>
<td align="left" valign="top">Duration of illness (years)</td>
<td align="char" valign="top" char="(">13.47 (&#x00B1;9.05)</td>
</tr>
<tr>
<td align="left" valign="top">Days of inpatient care 2.5&#x2009;years before T<sub>1</sub></td>
<td align="char" valign="top" char="(">39.84 (&#x00B1;68.43)</td>
</tr>
<tr>
<td align="left" valign="top">Days of inpatient care 6&#x2009;months before T<sub>1</sub></td>
<td align="char" valign="top" char="(">10.07 (&#x00B1;34.39)</td>
</tr>
<tr>
<td align="left" valign="top">Days of inpatient care 6&#x2009;months after T<sub>1</sub><xref rid="tfn3" ref-type="table-fn"><sup>a</sup></xref></td>
<td align="char" valign="top" char="(">5.74 (&#x00B1;16.16)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>PANSS, Positive and Negative Syndrome Scale, five-factor solution of van der Gaag et al. (<xref ref-type="bibr" rid="ref38">38</xref>, <xref ref-type="bibr" rid="ref39">39</xref>); MINI-ICF, International Classification of Functioning, Disability and Health (short version) (<xref ref-type="bibr" rid="ref41">41</xref>).</p>
<fn id="tfn3">
<label>a</label>
<p>Days of inpatient care 6&#x2009;months after T<sub>1</sub> was assessed at T<sub>2</sub> with <italic>N</italic>&#x2009;=&#x2009;54 patients.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Exploratory correlational analysis: Pearson correlations between coherence scores and clinical outcome variables at T<sub>1</sub> (<italic>N</italic>&#x2009;=&#x2009;71).</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th align="center" valign="top">Local coherence GloVe</th>
<th align="center" valign="top">Global coherence GloVe</th>
<th align="center" valign="top">Local coherence word2vec</th>
<th align="center" valign="top">Global coherence word2vec</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Local coherence GloVe</td>
<td align="char" valign="top" char=".">&#x2013;</td>
<td align="char" valign="top" char=".">0.969<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">0.576<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">0.487<sup>&#x002A;&#x002A;</sup></td>
</tr>
<tr>
<td align="left" valign="top">Global coherence GloVe</td>
<td align="char" valign="top" char=".">0.969<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">&#x2013;</td>
<td align="char" valign="top" char=".">0.569<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">0.533<sup>&#x002A;&#x002A;</sup></td>
</tr>
<tr>
<td align="left" valign="top">Local coherence word2vec</td>
<td align="char" valign="top" char=".">0.576<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">0.569<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">&#x2013;</td>
<td align="char" valign="top" char=".">0.923<sup>&#x002A;&#x002A;</sup></td>
</tr>
<tr>
<td align="left" valign="top">Global coherence word2vec</td>
<td align="char" valign="top" char=".">0.487<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">0.533<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">0.923<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">Duration of illness</td>
<td align="char" valign="top" char=".">0.087</td>
<td align="char" valign="top" char=".">0.059</td>
<td align="char" valign="top" char=".">0.056</td>
<td align="char" valign="top" char=".">&#x2212;0.012</td>
</tr>
<tr>
<td align="left" valign="top">Age at psychosis onset</td>
<td align="char" valign="top" char=".">0.037</td>
<td align="char" valign="top" char=".">0.128</td>
<td align="char" valign="top" char=".">&#x2212;0.090</td>
<td align="char" valign="top" char=".">0.008</td>
</tr>
<tr>
<td align="left" valign="top">Days of inpatient care 2.5&#x2009;years before T<sub>1</sub></td>
<td align="char" valign="top" char=".">&#x2212;0.163</td>
<td align="char" valign="top" char=".">&#x2212;0.165</td>
<td align="char" valign="top" char=".">&#x2212;0.078</td>
<td align="char" valign="top" char=".">&#x2212;0.094</td>
</tr>
<tr>
<td align="left" valign="top">Days of inpatient care 6&#x2009;months before T<sub>1</sub></td>
<td align="char" valign="top" char=".">&#x2212;0.190</td>
<td align="char" valign="top" char=".">&#x2212;0.193</td>
<td align="char" valign="top" char=".">&#x2212;0.253<sup>&#x002A;</sup></td>
<td align="char" valign="top" char=".">&#x2212;0.257<sup>&#x002A;</sup></td>
</tr>
<tr>
<td align="left" valign="top">Days of inpatient care 6&#x2009;months after T<sub>1</sub></td>
<td align="char" valign="top" char=".">&#x2212;0.081</td>
<td align="char" valign="top" char=".">&#x2212;0.107</td>
<td align="char" valign="top" char=".">0.107</td>
<td align="char" valign="top" char=".">0.117</td>
</tr>
<tr>
<td align="left" valign="top">PANSS positive symptoms</td>
<td align="char" valign="top" char=".">&#x2212;0.018</td>
<td align="char" valign="top" char=".">&#x2212;0.047</td>
<td align="char" valign="top" char=".">&#x2212;0.153</td>
<td align="char" valign="top" char=".">&#x2212;0.223</td>
</tr>
<tr>
<td align="left" valign="top">PANSS negative symptoms</td>
<td align="char" valign="top" char=".">&#x2212;0.279<sup>&#x002A;</sup></td>
<td align="char" valign="top" char=".">&#x2212;0.269<sup>&#x002A;</sup></td>
<td align="char" valign="top" char=".">&#x2212;0.310<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">&#x2212;0.264<sup>&#x002A;</sup></td>
</tr>
<tr>
<td align="left" valign="top">PANSS disorganized symptoms</td>
<td align="char" valign="top" char=".">&#x2212;0.175</td>
<td align="char" valign="top" char=".">&#x2212;0.199</td>
<td align="char" valign="top" char=".">&#x2212;0.311<sup>&#x002A;&#x002A;</sup></td>
<td align="char" valign="top" char=".">&#x2212;0.359<sup>&#x002A;&#x002A;</sup></td>
</tr>
<tr>
<td align="left" valign="top">PANSS excitement</td>
<td align="char" valign="top" char=".">&#x2212;0.054</td>
<td align="char" valign="top" char=".">&#x2212;0.093</td>
<td align="char" valign="top" char=".">&#x2212;0.278<sup>&#x002A;</sup></td>
<td align="char" valign="top" char=".">&#x2212;0.331<sup>&#x002A;&#x002A;</sup></td>
</tr>
<tr>
<td align="left" valign="top">PANSS emotional distress</td>
<td align="char" valign="top" char=".">&#x2212;0.135</td>
<td align="char" valign="top" char=".">&#x2212;0.143</td>
<td align="char" valign="top" char=".">&#x2212;0.129</td>
<td align="char" valign="top" char=".">&#x2212;0.160</td>
</tr>
<tr>
<td align="left" valign="top">Mini-ICF sum score</td>
<td align="char" valign="top" char=".">&#x2212;0.227</td>
<td align="char" valign="top" char=".">&#x2212;0.266<sup>&#x002A;</sup></td>
<td align="char" valign="top" char=".">&#x2212;0.164</td>
<td align="char" valign="top" char=".">&#x2212;0.209</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>PANSS, Positive and Negative Syndrome Scale, five-factor solution of van der Gaag and colleagues (<xref ref-type="bibr" rid="ref38">38</xref>); MINI-ICF, International Classification of Functioning, Disability and Health (short version) (<xref ref-type="bibr" rid="ref41">41</xref>). <italic>p</italic>-values are reported for descriptive reasons: <sup>&#x002A;</sup><italic>p</italic>&#x2009;&#x003C;&#x2009;0.05; <sup>&#x002A;&#x002A;</sup><italic>p</italic>&#x2009;&#x003C;&#x2009;0.01.</p>
</table-wrap-foot>
</table-wrap>
<p>Examining correlations of the GloVe and word2vec model showed that the GloVe model yielded three significant correlations with outcome variables while there were eight significant correlations with the word2vec model.</p>
<p>Regarding exploratory validation against clinical ratings, all coherence scores showed significant negative correlations with the PANSS factor for negative symptoms. In addition, local and global coherence scores of the word2vec model showed significant negative correlations with the PANSS factor for disorganized symptoms and excitement. None of the four coherence scores were significantly correlated with the PANSS factors for positive symptoms and emotional distress. Global coherence scores of the GloVe model were significantly negatively correlated with the sum score of the MINI-ICF.</p>
<p>Regarding external criteria, there was a significant negative correlation between local and global coherence scores of the word2vec model and the days in inpatient treatment 6 months before T<sub>1</sub>. There was no significant correlation between coherence scores and days in inpatient treatment 2.5 before or 0.5&#x2009;years after T<sub>1</sub> or characteristics of illness (age at psychosis onset, duration of illness).</p>
<p>When controlling for psychopathology in a partial correlation by including the five PANSS factors as control, the correlations with the MINI-ICF and days of inpatient care did not remain significant.</p>
<p>Coherence scores were not significantly correlated with the control variables age, education years, verbal IQ, length of transcripts in words, nor did they differ significantly between patients with schizophrenia or schizoaffective disorder, or between patients who did or did not take antipsychotic medication. However, the global coherence score of the GloVe model was significantly negatively correlated with transcript length. Also, female patients&#x2019; coherence scores of the global word2vec model were significantly higher than those of men. Closer examination of sex differences in the sample through independent <italic>t</italic>-tests revealed that men had significantly higher mean values in four PANNS factors as compared to women: positive and negative symptoms, disorganization, excitement.</p>
</sec>
<sec id="sec18">
<label>3.2.</label>
<title>Longitudinal data: correlations at T<sub>2</sub></title>
<p>None of the partial correlations between coherence scores at T<sub>1</sub> and outcome variables at T<sub>2</sub> were significant. The partial correlations as well as Pearson correlations between all variables at T<sub>1</sub> and T<sub>2</sub> are provided in the <xref ref-type="supplementary-material" rid="SM1">Supplementary Tables S1</xref>, <xref ref-type="supplementary-material" rid="SM1">S2</xref>.</p>
</sec>
</sec>
<sec id="sec19" sec-type="discussions">
<label>4.</label>
<title>Discussion</title>
<p>The overall aim of this study was an exploratory analysis of correlations between coherence scores and clinical outcome variables to carve out a potential direction for future NLP validation studies. The specific aims of the study were, first, to compare different NLP methods of coherence analysis, second, to compare different word embeddings, and third, to validate them against clinical ratings and external criteria &#x2013; using both cross-sectional and longitudinal clinical data.</p>
<p>Comparison of different NLP methods and word embeddings revealed that the word2vec models (both global and local coherence) were significantly correlated with four clinical outcome variables while the GloVe models were significantly associated with only one and two outcomes, respectively. The global GloVe model was also sensitive to transcript length &#x2013; a potential confounding factor in its coherence scores. Furthermore, coherence scores generated with the global word2vec model showed significant sex differences. One could argue that the global word2vec model was the only model to represent that male patients had significantly higher ratings of psychopathology than female patients in this sample. While these results should be interpreted with caution, it might imply that the word2vec models outperformed the GloVe models in calculating coherence scores that were associated with clinically relevant outcomes in this study. This corresponds to findings by Iter et al. (<xref ref-type="bibr" rid="ref27">27</xref>) who found significant group differences between patients and controls for the word2vec incoherence model, not GloVe, but contrasts our own previous study that found a superiority of the GloVe model in prediction of psychopathology in NAP (<xref ref-type="bibr" rid="ref16">16</xref>). These results indicate that the choice of NLP model should not be arbitrary. It has to be taken into account that different models, that is models with different architecture (e.g., GloVe vs. word2vec) as well as models trained on different corpora, produce different word vectors &#x2013; this could explain the different results between this current and the previous study (<xref ref-type="bibr" rid="ref16">16</xref>), having used different training data as well as different preprocessing and a more sophisticated sentence annotation. A concern would be that the chosen model has a stronger effect on the coherence scores than the difference between groups or coherence metric used (e.g., local vs. global). In this study, all coherence scores were still highly correlated with each other (see <xref rid="tab2" ref-type="table">Table 2</xref>). The reason for this is, probably, the fact that the two models are both trained on the same material, that is German Wikipedia. If models are trained on different material, correlation between them can be low. This might be one of the key challenges of cross-linguistic application of NLP methods (<xref ref-type="bibr" rid="ref24">24</xref>) and the reason for limited replicability of the results within one language across models (<xref ref-type="bibr" rid="ref25">25</xref>) and studies (<xref ref-type="bibr" rid="ref16">16</xref>, <xref ref-type="bibr" rid="ref25">25</xref>, <xref ref-type="bibr" rid="ref26">26</xref>). Nevertheless, our results show that models trained on the same material can still yield different results. The effect of different embedding models both intra- and cross-linguistically therefore requires further investigation.</p>
<p>It should be noted that the number of significant correlation coefficients should not be the only criterion for choosing a model. As Holmlund et al. (<xref ref-type="bibr" rid="ref42">42</xref>) put it, &#x201C;There is no &#x2018;one size fits all&#x2019; approach to choosing the right operationalization of disorganization in speech&#x201D; (p. 3). While there is more need for validation studies of different embeddings, future studies should also aim to understand better which coherence metrics represent which specific impairments in patients&#x2019; speech (<xref ref-type="bibr" rid="ref42">42</xref>).</p>
<p>Concerning validation against clinical ratings, one might expect to find most reliable correlations between coherence scores and ratings of incoherence, in this study represented in the PANSS factor for disorganization. After all, the embeddings are supposed to model speech (in)coherence and have been found to be correlated with ratings of positive FTD and incoherence in former studies (<xref ref-type="bibr" rid="ref15">15</xref>, <xref ref-type="bibr" rid="ref16">16</xref>, <xref ref-type="bibr" rid="ref19">19</xref>). However, we found the most consistent correlation between coherence scores and the PANSS factor for negative symptoms. A significant correlation with the factor for disorganization was only found for the word2vec models. This may support the assumption that word2vec models outperformed GloVe models in our sample. From an application perspective, other questions arise: On the one hand, one could argue that coherence scores could be useful as long as they are correlated with any relevant characteristics of the illness &#x2013; positive FTD or not. Identification and treatment of psychosis may sometimes focus too much on productive symptomatology. Clinical application and usefulness of NLP methods would rely on their ability to predict illness &#x2013; our results suggest that we should focus more on negative symptoms in this context. These often represent the first sign of the onset of psychosis and occur before the onset of positive symptoms (<xref ref-type="bibr" rid="ref43">43</xref>). If NLP coherence scores are significantly correlated with clinical appearance of negative symptoms, this might explain their effectiveness in prediction of psychosis onset (<xref ref-type="bibr" rid="ref17">17</xref>, <xref ref-type="bibr" rid="ref18">18</xref>). On the other hand, not all characteristics of illness are a sign of psychosis onset or exacerbation and require urgent intervention. As mentioned in the introduction, early labeling can also lead to stigmatization (<xref ref-type="bibr" rid="ref22">22</xref>). While negative symptoms may be a predictor of psychosis onset, they are not a sign of acute exacerbation characterized more by positive symptoms. One may conclude that correlation with clinical ratings of psychopathology appears to be a necessary but not sufficient condition for the predictive power of NLP coherence models in NAP. Their application may also depend on the prediction of subtle changes in patients&#x2019; life that are not recognized easily or early enough by clinicians for appropriate intervention.</p>
<p>To this end, we attempted an exploratory validation of NLP methods against external criteria and longitudinal data. This analysis revealed only one significant correlation between the word2vec models and days of inpatient care 6 months before the speech samples were collected. However, this correlation did not remain significant after controlling for psychopathology. This result may question the potential usefulness of NLP coherence analysis to predict relapse. If NLP analyses cannot outperform clinical ratings to predict exacerbation, a clinically relevant benefit for patients seems uncertain. On the other hand, NLP methods have been proven powerful in the prediction of psychosis onset in the past (<xref ref-type="bibr" rid="ref17">17</xref>, <xref ref-type="bibr" rid="ref18">18</xref>). Also, this is the first study to validate coherence scores against external criteria and longitudinal data. Selection of variables might not have been appropriate to operationalize exacerbation beyond clinical ratings. We recommend further attempts to validate NLP methods against external and longitudinal data in future research.</p>
<sec id="sec20">
<label>4.1.</label>
<title>Limitations</title>
<p>There are some limitations that should be taken into account. As results did not have any predictive value with respect to outcomes, future research should include &#x201C;harder&#x201D; external criteria and more data on patients&#x2019; course of illness. For instance, medical health records about hospitalization and medication could be examined to utilize more objective data on exacerbation. As mentioned above, the consequences and risks of stigmatization due to false predictions for the individual should always be critically reflected upon and results interpreted with appropriate caution. The results should be replicated with larger sample sizes, other diagnostic groups, healthy controls as well as CHR individuals. Moreover, in this study we decided to focus solely on NLP coherence scores. Past NLP research has shown that inclusion of other characteristics of patients&#x2019; speech can improve predictive value of coherence models (<xref ref-type="bibr" rid="ref15">15</xref>, <xref ref-type="bibr" rid="ref17">17</xref>, <xref ref-type="bibr" rid="ref18">18</xref>, <xref ref-type="bibr" rid="ref27">27</xref>, <xref ref-type="bibr" rid="ref35">35</xref>) &#x2013; for instance, syntactic features, referential ambiguities, neologisms, cohesion scores, perseverations, and acoustic features. Since different patterns of linguistic impairment appear to be associated with different levels of psychopathology and functioning (<xref ref-type="bibr" rid="ref44">44</xref>), future studies should consider developing and validating speech models of NAP containing more features of speech than coherence. Psychometric evaluation of coherence scores should also examine reliability, e.g., by intra-individual correlation of coherence scores across multiple measurement time points.</p>
<p>A statistical limitation is the large number of different output parameters, which could have led to an overestimation of significance.</p>
</sec>
<sec id="sec21">
<label>4.2.</label>
<title>Implications and conclusion</title>
<p>The study showed that coherence scores derived with NLP methods are correlated with clinical ratings of psychopathology, but not with external or longitudinal data. The word2vec model was significantly correlated with more variables than the GloVe model while there were no major differences between local and global coherence models. While the results support construct validity of NLP models of coherence, they raise questions about the usefulness of their application in the clinical context. As results for the used models differed, we recommend careful selection of model and training data.</p>
<p>It remains an important task for clinical researchers to engage in the debates and studies revolving around machine learning in psychiatry. Clinical experts&#x2019; considerations about the ethics, feasibility and usefulness of machine learning and NLP methods in the field need to always accompany this research.</p>
</sec>
</sec>
<sec id="sec22" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="sec23">
<title>Ethics statement</title>
<p>The studies involving human participants were reviewed and approved by Ethikkommission der Charit&#x00E9; &#x2013; Universit&#x00E4;tsmedizin Berlin. The patients/participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="sec24">
<title>Author contributions</title>
<p>SJ and A-LB contributed equally to the manuscript by developing and testing the hypotheses and writing the first draft. GR conducted the NLP analysis and made an essential contribution to the draft. MS completed the annotation of all transcripts. CM was responsible for and conceptually involved in the conduct of the study. SJ, A-LB, GR, IN, MS, FB, AH, and CM critically read and revised the manuscript. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec sec-type="funding-information" id="sec25">
<title>Funding</title>
<p>CM received personal funding (Berlin Institute of Health BIH_PRO_279). The MPP-S study is supported by Deutsche Gesellschaft f&#x00FC;r Psychoanalyse, Psychotherapie, Psychosomatik und Tiefenpsychologie (DGPT e.V.) and by K&#x00F6;hler Stiftung (Grant number: S112/10211/16). We acknowledge financial support from the Open Access Publication Fund of Charit&#x00E9; &#x2013; Universit&#x00E4;tsmedizin Berlin and the German Research Foundation (DFG).</p>
</sec>
<sec sec-type="COI-statement" id="sec26">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="sec100" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<ack>
<p>The authors thank the participants of the MPP-S study. Moreover, they thank N. Ko&#x0159;&#x00E1;nov&#x00E1; for the transcription of part of the interviews, and M. Stede for his advice. Last but not least they thank their research colleagues who were involved in conducting the interviews, namely: S. Bayer, G. Bertram, M. B&#x00FC;ttner, J. Funcke, F. Stuke, and C. Thiele-Winkler (in alphabetic order).</p>
</ack>
<sec id="sec27" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fpsyt.2023.1208856/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fpsyt.2023.1208856/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_2.xlsx" id="SM2" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><label>1.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Covington</surname><given-names>MA</given-names></name> <name><surname>He</surname><given-names>C</given-names></name> <name><surname>Brown</surname><given-names>C</given-names></name> <name><surname>Na&#x00E7;i</surname><given-names>L</given-names></name> <name><surname>McClain</surname><given-names>JT</given-names></name> <name><surname>Fjordbak</surname><given-names>BS</given-names></name> <etal/></person-group>. <article-title>Schizophrenia and the structure of language: the linguist's view</article-title>. <source>Schizophr Res</source>. (<year>2005</year>) <volume>77</volume>:<fpage>85</fpage>&#x2013;<lpage>98</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.schres.2005.01.016</pub-id>, PMID: <pub-id pub-id-type="pmid">16005388</pub-id></citation></ref>
<ref id="ref2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Roche</surname><given-names>E</given-names></name> <name><surname>Creed</surname><given-names>L</given-names></name> <name><surname>MacMahon</surname><given-names>D</given-names></name> <name><surname>Brennan</surname><given-names>D</given-names></name> <name><surname>Clarke</surname><given-names>M</given-names></name></person-group>. <article-title>The epidemiology and associated phenomenology of formal thought disorder: a systematic review</article-title>. <source>Schizophr Bull</source>. (<year>2015</year>) <volume>41</volume>:<fpage>951</fpage>&#x2013;<lpage>62</lpage>. doi: <pub-id pub-id-type="doi">10.1093/schbul/sbu129</pub-id>, PMID: <pub-id pub-id-type="pmid">25180313</pub-id></citation></ref>
<ref id="ref3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mercado</surname><given-names>CL</given-names></name> <name><surname>Johannesen</surname><given-names>JK</given-names></name> <name><surname>Bell</surname><given-names>MD</given-names></name></person-group>. <article-title>Thought disorder severity in compromised, deteriorated, and preserved intellectual course of schizophrenia</article-title>. <source>J Nerv Ment Dis</source>. (<year>2011</year>) <volume>199</volume>:<fpage>111</fpage>&#x2013;<lpage>6</lpage>. doi: <pub-id pub-id-type="doi">10.1097/NMD.0b013e3182083bae</pub-id>, PMID: <pub-id pub-id-type="pmid">21278540</pub-id></citation></ref>
<ref id="ref4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Andreasen</surname><given-names>NC</given-names></name> <name><surname>Grove</surname><given-names>WM</given-names></name></person-group>. <article-title>Thought, language, and communication in schizophrenia: diagnosis and prognosis</article-title>. <source>Schizophr Bull</source>. (<year>1986</year>) <volume>12</volume>:<fpage>348</fpage>&#x2013;<lpage>59</lpage>. doi: <pub-id pub-id-type="doi">10.1093/schbul/12.3.348</pub-id>, PMID: <pub-id pub-id-type="pmid">3764356</pub-id></citation></ref>
<ref id="ref5"><label>5.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Jaspers</surname><given-names>K</given-names></name></person-group>. <source>Allgemeine Psychopathologie</source>. <edition>9 (based on the unchanged 4th edition of 1946)</edition> ed. <publisher-loc>Berlin</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>1973</year>).</citation></ref>
<ref id="ref6"><label>6.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Bleuler</surname><given-names>E</given-names></name></person-group>. <source>Dementia praecox oder Gruppe der Schizophrenien</source>. <publisher-loc>Wien</publisher-loc>: <publisher-name>Leipzig</publisher-name> (<year>1911</year>).</citation></ref>
<ref id="ref7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kuperberg</surname><given-names>GR</given-names></name></person-group>. <article-title>Language in schizophrenia part 1: an introduction</article-title>. <source>Lang Linguist Compass</source>. (<year>2010</year>) <volume>4</volume>:<fpage>576</fpage>&#x2013;<lpage>89</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1749-818X.2010.00216.x</pub-id>, PMID: <pub-id pub-id-type="pmid">20936080</pub-id></citation></ref>
<ref id="ref8"><label>8.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jucker</surname><given-names>AH</given-names></name></person-group>. <article-title>The discourse marker well in the history of English</article-title>. <source>Engl Lang Linguist</source>. (<year>1997</year>) <volume>1</volume>:<fpage>91</fpage>&#x2013;<lpage>110</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S136067430000037X</pub-id></citation></ref>
<ref id="ref9"><label>9.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Andreasen</surname><given-names>NC</given-names></name></person-group>. <source>Scale for the assessment of positive symptoms</source>. <publisher-loc>Iowa City</publisher-loc>: <publisher-name>IA University of Iowa</publisher-name> (<year>1984</year>).</citation></ref>
<ref id="ref10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Graesser Arthur</surname><given-names>C</given-names></name> <name><surname>McNamara Danielle</surname><given-names>S</given-names></name> <name><surname>Louwerse Max</surname><given-names>M</given-names></name> <name><surname>Cai</surname><given-names>Z</given-names></name></person-group>. <article-title>Coh-Metrix: analysis of text on cohesion and language</article-title>. <source>Behav Res Methods Instrum Comput</source>. (<year>2004</year>) <volume>36</volume>:<fpage>193</fpage>&#x2013;<lpage>202</lpage>. doi: <pub-id pub-id-type="doi">10.3758/BF03195564</pub-id></citation></ref>
<ref id="ref11"><label>11.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Elvev&#x00E5;g</surname><given-names>B</given-names></name> <name><surname>Foltz</surname><given-names>PW</given-names></name> <name><surname>Weinberger</surname><given-names>DR</given-names></name> <name><surname>Goldberg</surname><given-names>TE</given-names></name></person-group>. <article-title>Quantifying incoherence in speech: an automated methodology and novel application to schizophrenia</article-title>. <source>Schizophr Res</source>. (<year>2007</year>) <volume>93</volume>:<fpage>304</fpage>&#x2013;<lpage>16</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.schres.2007.03.001</pub-id>, PMID: <pub-id pub-id-type="pmid">17433866</pub-id></citation></ref>
<ref id="ref12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sarzynska-Wawer</surname><given-names>J</given-names></name> <name><surname>Wawer</surname><given-names>A</given-names></name> <name><surname>Pawlak</surname><given-names>A</given-names></name> <name><surname>Szymanowska</surname><given-names>J</given-names></name> <name><surname>Stefaniak</surname><given-names>I</given-names></name> <name><surname>Jarkiewicz</surname><given-names>M</given-names></name> <etal/></person-group>. <article-title>Detecting formal thought disorder by deep contextualized word representations</article-title>. <source>Psychiatry Res</source>. (<year>2021</year>) <volume>304</volume>:<fpage>114135</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.psychres.2021.114135</pub-id>, PMID: <pub-id pub-id-type="pmid">34343877</pub-id></citation></ref>
<ref id="ref13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname><given-names>SX</given-names></name> <name><surname>Kriz</surname><given-names>R</given-names></name> <name><surname>Cho</surname><given-names>S</given-names></name> <name><surname>Park</surname><given-names>SJ</given-names></name> <name><surname>Harowitz</surname><given-names>J</given-names></name> <name><surname>Gur</surname><given-names>RE</given-names></name> <etal/></person-group>. <article-title>Natural language processing methods are sensitive to sub-clinical linguistic differences in schizophrenia spectrum disorders</article-title>. <source>NPJ Schizophr</source>. (<year>2021</year>) <volume>7</volume>:<fpage>25</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41537-021-00154-3</pub-id></citation></ref>
<ref id="ref14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morgan</surname><given-names>SE</given-names></name> <name><surname>Diederen</surname><given-names>K</given-names></name> <name><surname>V&#x00E9;rtes</surname><given-names>PE</given-names></name> <name><surname>Ip</surname><given-names>SH</given-names></name> <name><surname>Wang</surname><given-names>B</given-names></name> <name><surname>Thompson</surname><given-names>B</given-names></name> <etal/></person-group>. <article-title>Natural language processing markers in first episode psychosis and people at clinical high-risk</article-title>. <source>Transl Psychiatry</source>. (<year>2021</year>) <volume>11</volume>:<fpage>630</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41398-021-01722-y</pub-id>, PMID: <pub-id pub-id-type="pmid">34903724</pub-id></citation></ref>
<ref id="ref15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Just</surname><given-names>SA</given-names></name> <name><surname>Haegert</surname><given-names>E</given-names></name> <name><surname>Ko&#x0159;&#x00E1;nov&#x00E1;</surname><given-names>N</given-names></name> <name><surname>Br&#x00F6;cker</surname><given-names>A-L</given-names></name> <name><surname>Nenchev</surname><given-names>I</given-names></name> <name><surname>Funcke</surname><given-names>J</given-names></name> <etal/></person-group>. <article-title>Modeling incoherent discourse in non-affective psychosis</article-title>. <source>Front Psych</source>. (<year>2020</year>) <volume>11</volume>:<fpage>846</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyt.2020.00846</pub-id>, PMID: <pub-id pub-id-type="pmid">32973586</pub-id></citation></ref>
<ref id="ref16"><label>16.</label><citation citation-type="other"><person-group person-group-type="editor"><name><surname>Just</surname> <given-names>SA</given-names></name> <name><surname>Haegert</surname> <given-names>E</given-names></name> <name><surname>Ko&#x0159;&#x00E1;nov&#x00E1;</surname> <given-names>N</given-names></name> <name><surname>Br&#x00F6;cker</surname> <given-names>A-L</given-names></name> <name><surname>Nenchev</surname> <given-names>I</given-names></name> <name><surname>Funcke</surname> <given-names>J</given-names></name> <etal/></person-group>., editors. (<year>2019</year>). Coherence models in schizophrenia. Proceedings of the sixth workshop on computational linguistics and clinical psychology. <publisher-loc>Minneapolis, MN</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name>.</citation></ref>
<ref id="ref17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bedi</surname><given-names>G</given-names></name> <name><surname>Carrillo</surname><given-names>F</given-names></name> <name><surname>Cecchi</surname><given-names>GA</given-names></name> <name><surname>Slezak</surname><given-names>DF</given-names></name> <name><surname>Sigman</surname><given-names>M</given-names></name> <name><surname>Mota</surname><given-names>NB</given-names></name> <etal/></person-group>. <article-title>Automated analysis of free speech predicts psychosis onset in high-risk youths</article-title>. <source>NPJ Schizophr</source>. (<year>2015</year>) <volume>1</volume>:<fpage>15030</fpage>&#x2013;<lpage>7</lpage>. doi: <pub-id pub-id-type="doi">10.1038/npjschz.2015.30</pub-id>, PMID: <pub-id pub-id-type="pmid">27336038</pub-id></citation></ref>
<ref id="ref18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Corcoran</surname><given-names>CM</given-names></name> <name><surname>Carrillo</surname><given-names>F</given-names></name> <name><surname>Fern&#x00E1;ndez-Slezak</surname><given-names>D</given-names></name> <name><surname>Bedi</surname><given-names>G</given-names></name> <name><surname>Klim</surname><given-names>C</given-names></name> <name><surname>Javitt</surname><given-names>DC</given-names></name> <etal/></person-group>. <article-title>Prediction of psychosis across protocols and risk cohorts using automated language analysis</article-title>. <source>World Psychiatry</source>. (<year>2018</year>) <volume>17</volume>:<fpage>67</fpage>&#x2013;<lpage>75</lpage>. doi: <pub-id pub-id-type="doi">10.1002/wps.20491</pub-id>, PMID: <pub-id pub-id-type="pmid">29352548</pub-id></citation></ref>
<ref id="ref19"><label>19.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bilgrami</surname><given-names>ZR</given-names></name> <name><surname>Sarac</surname><given-names>C</given-names></name> <name><surname>Srivastava</surname><given-names>A</given-names></name> <name><surname>Herrera</surname><given-names>SN</given-names></name> <name><surname>Azis</surname><given-names>M</given-names></name> <name><surname>Haas</surname><given-names>SS</given-names></name> <etal/></person-group>. <article-title>Construct validity for computational linguistic metrics in individuals at clinical risk for psychosis: associations with clinical ratings</article-title>. <source>Schizophr Res</source>. (<year>2022</year>) <volume>245</volume>:<fpage>90</fpage>&#x2013;<lpage>6</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.schres.2022.01.019</pub-id>, PMID: <pub-id pub-id-type="pmid">35094918</pub-id></citation></ref>
<ref id="ref20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Corcoran</surname><given-names>CM</given-names></name> <name><surname>Mittal</surname><given-names>VA</given-names></name> <name><surname>Bearden</surname><given-names>CE</given-names></name> <name><surname>Gur</surname><given-names>RE</given-names></name> <name><surname>Hitczenko</surname><given-names>K</given-names></name> <name><surname>Bilgrami</surname><given-names>Z</given-names></name> <etal/></person-group>. <article-title>Language as a biomarker for psychosis: a natural language processing approach</article-title>. <source>Schizophr Res</source>. (<year>2020</year>) <volume>226</volume>:<fpage>158</fpage>&#x2013;<lpage>66</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.schres.2020.04.032</pub-id>, PMID: <pub-id pub-id-type="pmid">32499162</pub-id></citation></ref>
<ref id="ref21"><label>21.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Palaniyappan</surname><given-names>L</given-names></name></person-group>. <article-title>More than a biomarker: could language be a biosocial marker of psychosis?</article-title> <source>NPJ Schizophr</source>. (<year>2021</year>) <volume>7</volume>:<fpage>42</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41537-021-00172-1</pub-id>, PMID: <pub-id pub-id-type="pmid">34465778</pub-id></citation></ref>
<ref id="ref22"><label>22.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moritz</surname><given-names>S</given-names></name> <name><surname>Gaw&#x0119;da</surname><given-names>&#x0141;</given-names></name> <name><surname>Heinz</surname><given-names>A</given-names></name> <name><surname>Gallinat</surname><given-names>J</given-names></name></person-group>. <article-title>Four reasons why early detection centers for psychosis should be renamed and their treatment targets reconsidered: we should not catastrophize a future we can neither reliably predict nor change</article-title>. <source>Psychol Med</source>. (<year>2019</year>) <volume>49</volume>:<fpage>2134</fpage>&#x2013;<lpage>40</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S0033291719001740</pub-id></citation></ref>
<ref id="ref23"><label>23.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Heinz</surname><given-names>A</given-names></name></person-group>. <source>A new understanding of mental disorders</source>. <publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>Computational Models for dimensional Psychiatry</publisher-name> (<year>2017</year>).</citation></ref>
<ref id="ref24"><label>24.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Parola</surname><given-names>A</given-names></name> <name><surname>Lin</surname><given-names>JM</given-names></name> <name><surname>Simonsen</surname><given-names>A</given-names></name> <name><surname>Bliksted</surname><given-names>V</given-names></name> <name><surname>Zhou</surname><given-names>Y</given-names></name> <name><surname>Wang</surname><given-names>H</given-names></name> <etal/></person-group>. <article-title>Speech disturbances in schizophrenia: assessing cross-linguistic generalizability of NLP automated measures of coherence</article-title>. <source>Schizophr Res</source>. (<year>2022</year>). doi: <pub-id pub-id-type="doi">10.1016/j.schres.2022.07.002</pub-id>, PMID: <pub-id pub-id-type="pmid">35927097</pub-id></citation></ref>
<ref id="ref25"><label>25.</label><citation citation-type="other"><person-group person-group-type="editor"><name><surname>Hitczenko</surname> <given-names>K</given-names></name> <name><surname>Cowan</surname> <given-names>H</given-names></name> <name><surname>Mittal</surname> <given-names>V</given-names></name> <name><surname>Goldrick</surname> <given-names>M</given-names></name></person-group>, editors. (<year>2021</year>). Automated coherence measures fail to index thought disorder in individuals at risk for psychosis. Proceedings of the seventh workshop on computational linguistics and clinical psychology: improving access. <publisher-name>Association for Computational Linguistics</publisher-name>.</citation></ref>
<ref id="ref26"><label>26.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>Panicheva</surname><given-names>P</given-names></name> <name><surname>Litvinova</surname><given-names>T</given-names></name></person-group>, editors. (<year>2019</year>). Semantic coherence in schizophrenia in Russian written texts. 2019 25th Conference of Open Innovations Association (FRUCT). <publisher-loc>Helsinki</publisher-loc>: IEEE.</citation></ref>
<ref id="ref27"><label>27.</label><citation citation-type="other"><person-group person-group-type="editor"><name><surname>Iter</surname> <given-names>D</given-names></name> <name><surname>Yoon</surname> <given-names>J</given-names></name> <name><surname>Jurafsky</surname> <given-names>D</given-names></name></person-group>, editors. (<year>2018</year>). Automatic detection of incoherent speech for diagnosing schizophrenia. Proceedings of the fifth workshop on computational linguistics and clinical psychology: from keyboard to clinic. <publisher-loc>Minneapolis, MN</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name>.</citation></ref>
<ref id="ref28"><label>28.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>Pennington</surname><given-names>J</given-names></name> <name><surname>Socher</surname><given-names>R</given-names></name> <name><surname>Manning</surname><given-names>C</given-names></name></person-group>. (<year>2014</year>). Glove: global vectors for word representation. Conference on empirical methods in natural language processing (EMNLP). <publisher-loc>Doha</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name>.</citation></ref>
<ref id="ref29"><label>29.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mikolov</surname><given-names>T</given-names></name> <name><surname>Chen</surname><given-names>K</given-names></name> <name><surname>Corrado</surname><given-names>G</given-names></name> <name><surname>Dean</surname><given-names>J</given-names></name></person-group>. <article-title>Efficient estimation of word representations in vector space</article-title>. <source>arXiv preprint arXiv</source>. (<year>2013</year>):<fpage>13013781</fpage>. doi: <pub-id pub-id-type="doi">10.48550/arXiv.1301.3781</pub-id></citation></ref>
<ref id="ref30"><label>30.</label><citation citation-type="book"><person-group person-group-type="author"><collab id="coll2">APA</collab></person-group>. <source>Diagnostisches und Statistisches Manual Psychischer St&#x00F6;rungen &#x2013; Textrevision &#x2013; DSM-IV-TR</source>. <publisher-loc>G&#x00F6;ttingen</publisher-loc>: <publisher-name>Hogrefe</publisher-name> (<year>2003</year>).</citation></ref>
<ref id="ref31"><label>31.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Buck</surname><given-names>B</given-names></name> <name><surname>Ludwig</surname><given-names>K</given-names></name> <name><surname>Meyer</surname><given-names>PS</given-names></name> <name><surname>Penn</surname><given-names>DL</given-names></name></person-group>. <article-title>The use of narrative sampling in the assessment of social cognition: the narrative of emotions task (NET)</article-title>. <source>Psychiatry Res</source>. (<year>2014</year>) <volume>217</volume>:<fpage>233</fpage>&#x2013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.psychres.2014.03.014</pub-id>, PMID: <pub-id pub-id-type="pmid">24726270</pub-id></citation></ref>
<ref id="ref32"><label>32.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>Wicks</surname><given-names>R</given-names></name> <name><surname>Post</surname><given-names>M</given-names></name></person-group>. (<year>2021</year>). A unified approach to sentence segmentation of punctuated text in many languages. <publisher-name>Association for Computational Linguistics</publisher-name>. <fpage>3995</fpage>&#x2013;<lpage>4007</lpage> p.</citation></ref>
<ref id="ref33"><label>33.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Palmer</surname><given-names>DD</given-names></name></person-group>. <article-title>Tokenisation and sentence segmentation</article-title> In: <person-group person-group-type="editor"><name><surname>Dale</surname> <given-names>R</given-names></name> <name><surname>Moisl</surname> <given-names>H</given-names></name> <name><surname>Somers</surname> <given-names>H</given-names></name></person-group>, editors. <source>Handbook of natural language processing</source>. <publisher-loc>New York</publisher-loc>: <publisher-name>Marcel Dekker Inc</publisher-name> (<year>2000</year>). <fpage>11</fpage>&#x2013;<lpage>35</lpage>.</citation></ref>
<ref id="ref34"><label>34.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Almeida</surname><given-names>F</given-names></name> <name><surname>Xex&#x00E9;o</surname><given-names>G</given-names></name></person-group>. <article-title>Word embeddings: a survey</article-title>. <source>arXiv preprint arXiv</source>. (<year>2019</year>):<fpage>190109069</fpage>. doi: <pub-id pub-id-type="doi">10.48550/arXiv.1901.09069</pub-id></citation></ref>
<ref id="ref35"><label>35.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Voppel</surname><given-names>AE</given-names></name> <name><surname>de Boer</surname><given-names>JN</given-names></name> <name><surname>Brederoo</surname><given-names>SG</given-names></name> <name><surname>Schnack</surname><given-names>HG</given-names></name> <name><surname>Sommer</surname><given-names>IEC</given-names></name></person-group>. <article-title>Semantic and acoustic markers in schizophrenia-Spectrum disorders: a combinatory machine learning approach</article-title>. <source>Schizophr Bull</source>. (<year>2022</year>) <volume>49</volume>:<fpage>S163</fpage>&#x2013;<lpage>71</lpage>. doi: <pub-id pub-id-type="doi">10.1093/schbul/sbac142</pub-id>, PMID: <pub-id pub-id-type="pmid">36305054</pub-id></citation></ref>
<ref id="ref36"><label>36.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>Honnibal</surname><given-names>M</given-names></name> <name><surname>Montani</surname><given-names>I</given-names></name></person-group>. (<year>2023</year>). spaCy. Industrial-strength natural language processing. Available at: <ext-link xlink:href="https://spacy.io/api/tok2vec/" ext-link-type="uri">https://spacy.io/api/tok2vec/</ext-link>.</citation></ref>
<ref id="ref37"><label>37.</label><citation citation-type="book"><person-group person-group-type="author"><collab id="coll1">Deepset</collab></person-group>. <source>German word Embeddings</source>. <publisher-loc>Berlin</publisher-loc>: <publisher-name>deepest GmbH</publisher-name> (<year>2023</year>) <comment>Available at: </comment><ext-link xlink:href="https://www.deepset.ai/german-word-embeddings" ext-link-type="uri">https://www.deepset.ai/german-word-embeddings</ext-link>.</citation></ref>
<ref id="ref38"><label>38.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>van der Gaag</surname><given-names>M</given-names></name> <name><surname>Hoffman</surname><given-names>T</given-names></name> <name><surname>Remijsen</surname><given-names>M</given-names></name> <name><surname>Hijman</surname><given-names>R</given-names></name> <name><surname>de Haan</surname><given-names>L</given-names></name> <name><surname>van Meijel</surname><given-names>B</given-names></name> <etal/></person-group>. <article-title>The five-factor model of the positive and negative syndrome scale II: a ten-fold cross-validation of a revised model</article-title>. <source>Schizophr Res</source>. (<year>2006</year>) <volume>85</volume>:<fpage>280</fpage>&#x2013;<lpage>7</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.schres.2006.03.021</pub-id></citation></ref>
<ref id="ref39"><label>39.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Woodward</surname><given-names>TS</given-names></name> <name><surname>Jung</surname><given-names>K</given-names></name> <name><surname>Smith</surname><given-names>GN</given-names></name> <name><surname>Hwang</surname><given-names>H</given-names></name> <name><surname>Barr</surname><given-names>AM</given-names></name> <name><surname>Procyshyn</surname><given-names>RM</given-names></name> <etal/></person-group>. <article-title>Symptom changes in five dimensions of the positive and negative syndrome scale in refractory psychosis</article-title>. <source>Eur Arch Psychiatry Clin Neurosci</source>. (<year>2014</year>) <volume>264</volume>:<fpage>673</fpage>&#x2013;<lpage>82</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00406-013-0460-x</pub-id>, PMID: <pub-id pub-id-type="pmid">24126470</pub-id></citation></ref>
<ref id="ref40"><label>40.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>Schmidt</surname><given-names>K-H</given-names></name> <name><surname>Metzler</surname><given-names>P</given-names></name></person-group>. (<year>1992</year>). <source>Wortschatztest [vocabulary test (WST)]</source>. <publisher-loc>Beltz</publisher-loc>: <publisher-name>Weinheim</publisher-name>.</citation></ref>
<ref id="ref41"><label>41.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Linden</surname><given-names>M</given-names></name> <name><surname>Baron</surname><given-names>S</given-names></name></person-group>. <article-title>Das Mini-ICF-Rating f&#x00FC;r psychische St&#x00F6;rungen (Mini-ICF-P). Ein Kurzinstrument zur Beurteilung von F&#x00E4;higkeitsst&#x00F6;rungen bei psychischen Erkrankungen</article-title>. <source>Rehabilitation</source>. (<year>2005</year>) <volume>44</volume>:<fpage>144</fpage>&#x2013;<lpage>51</lpage>. doi: <pub-id pub-id-type="doi">10.1055/s-2004-834786</pub-id>, PMID: <pub-id pub-id-type="pmid">15933950</pub-id></citation></ref>
<ref id="ref42"><label>42.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Holmlund</surname><given-names>TB</given-names></name> <name><surname>Chandler</surname><given-names>C</given-names></name> <name><surname>Foltz</surname><given-names>PW</given-names></name> <name><surname>Diaz-Asper</surname><given-names>C</given-names></name> <name><surname>Cohen</surname><given-names>AS</given-names></name> <name><surname>Rodriguez</surname><given-names>Z</given-names></name> <etal/></person-group>. <article-title>Towards a temporospatial framework for measurements of disorganization in speech using semantic vectors</article-title>. <source>Schizophr Res</source>. (<year>2022</year>). doi: <pub-id pub-id-type="doi">10.1016/j.schres.2022.09.020</pub-id>, PMID: <pub-id pub-id-type="pmid">36372683</pub-id></citation></ref>
<ref id="ref43"><label>43.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Correll</surname><given-names>CU</given-names></name> <name><surname>Schooler</surname><given-names>NR</given-names></name></person-group>. <article-title>Negative symptoms in schizophrenia: a review and clinical guide for recognition, assessment, and treatment</article-title>. <source>Neuropsychiatr Dis Treat</source>. (<year>2020</year>) <volume>16</volume>:<fpage>519</fpage>&#x2013;<lpage>34</lpage>. doi: <pub-id pub-id-type="doi">10.2147/NDT.S225643</pub-id>, PMID: <pub-id pub-id-type="pmid">32110026</pub-id></citation></ref>
<ref id="ref44"><label>44.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bambini</surname><given-names>V</given-names></name> <name><surname>Frau</surname><given-names>F</given-names></name> <name><surname>Bischetti</surname><given-names>L</given-names></name> <name><surname>Cuoco</surname><given-names>F</given-names></name> <name><surname>Bechi</surname><given-names>M</given-names></name> <name><surname>Buonocore</surname><given-names>M</given-names></name> <etal/></person-group>. <article-title>Deconstructing heterogeneity in schizophrenia through language: a semi-automated linguistic analysis and data-driven clustering approach</article-title>. <source>Schizophrenia (Heidelb)</source>. (<year>2022</year>) <volume>8</volume>:<fpage>102</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41537-022-00306-z</pub-id>, PMID: <pub-id pub-id-type="pmid">36446789</pub-id></citation></ref>
</ref-list>
</back>
</article>