<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychiatry</journal-id>
<journal-title>Frontiers in Psychiatry</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychiatry</abbrev-journal-title>
<issn pub-type="epub">1664-0640</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyt.2025.1504306</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Psychiatry</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Employing large language models for emotion detection in psychotherapy transcripts</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Lalk</surname>
<given-names>Christopher</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2834550/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Targan</surname>
<given-names>Kim</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2856869/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Steinbrenner</surname>
<given-names>Tobias</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Schaffrath</surname>
<given-names>Jana</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Eberhardt</surname>
<given-names>Steffen</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Schwartz</surname>
<given-names>Brian</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/997501/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Vehlen</surname>
<given-names>Antonia</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1384645/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lutz</surname>
<given-names>Wolfgang</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Rubel</surname>
<given-names>Julian</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Psychology, Osnabr&#xfc;ck University</institution>, <addr-line>Osnabr&#xfc;ck</addr-line>, <country>Germany</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Psychology, University of Trier</institution>, <addr-line>Trier</addr-line>, <country>Germany</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Kerstin Denecke, Bern University of Applied Sciences, Switzerland</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Mark Melnykowycz, IDUN Technologies AG, Switzerland</p>
<p>Ebrahim Ghaderpour, Sapienza University of Rome, Italy</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Christopher Lalk, <email xlink:href="mailto:christopher.lalk@uni-osnabrueck.de">christopher.lalk@uni-osnabrueck.de</email>
</p>
</fn>
<fn fn-type="other" id="fn003">
<p>&#x2020;ORCID: Christopher Lalk, <uri xlink:href="https://orcid.org/0000-0002-1793-3507">orcid.org/0000-0002-1793-3507</uri>; Kim Targan, <uri xlink:href="https://orcid.org/0009-0003-5935-1649">orcid.org/0009-0003-5935-1649</uri>; Tobias Steinbrenner, <uri xlink:href="https://orcid.org/0009-0005-0434-2870">orcid.org/0009-0005-0434-2870</uri>; Jana Schaffrath, <uri xlink:href="https://orcid.org/0000-0003-0106-0243">orcid.org/0000-0003-0106-0243</uri>; Steffen Eberhardt, <uri xlink:href="https://orcid.org/0000-0002-9900-4671">orcid.org/0000-0002-9900-4671</uri>; Brian Schwartz, <uri xlink:href="https://orcid.org/0000-0003-4695-4953">orcid.org/0000-0003-4695-4953</uri>; Antonia Vehlen, <uri xlink:href="https://orcid.org/0000-0002-6019-3161">orcid.org/0000-0002-6019-3161</uri>; Wolfgang Lutz, <uri xlink:href="https://orcid.org/0000-0002-5141-3847">orcid.org/0000-0002-5141-3847</uri>; Julian Rubel, <uri xlink:href="https://orcid.org/0000-0002-9625-6611">orcid.org/0000-0002-9625-6611</uri>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>09</day>
<month>05</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1504306</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>09</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>14</day>
<month>04</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Lalk, Targan, Steinbrenner, Schaffrath, Eberhardt, Schwartz, Vehlen, Lutz and Rubel</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Lalk, Targan, Steinbrenner, Schaffrath, Eberhardt, Schwartz, Vehlen, Lutz and Rubel</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Purpose</title>
<p>In the context of psychotherapy, emotions play an important role both through their association with symptom severity, as well as their effects on the therapeutic relationship. In this analysis, we aim to train a large language model (LLM) for the detection of emotions in German speech. We want to apply this model on a corpus of psychotherapy transcripts to predict symptom severity and alliance aiming to identify the most important emotions for the prediction of symptom severity and therapeutic alliance.</p>
</sec>
<sec>
<title>Methods</title>
<p>We employed a public labeled dataset of 28 emotions and translated the dataset into German. A pre-trained LLM was then fine-tuned on this dataset for emotion classification. We applied the fine-tuned model to a dataset containing 553 psychotherapy sessions of 124 patients. Using machine learning (ML) and explainable artificial intelligence (AI), we predicted symptom severity and alliance by the detected emotions.</p>
</sec>
<sec>
<title>Results</title>
<p>Our fine-tuned model achieved modest classification performance (<italic>F1<sub>macro</sub>
</italic> =0.45, <italic>Accuracy</italic>=0.41, <italic>Kappa</italic>=0.42) across the 28 emotions. Incorporating all emotions, our ML model showed satisfying performance for the prediction of symptom severity (<italic>r</italic> = .50; 95%-CI:.42,.57) and moderate performance for the prediction of alliance scores (<italic>r</italic> = .20; 95%-CI:.06,.32). The most important emotions for the prediction of symptom severity were <italic>approval, anger</italic>, and <italic>fear</italic>. The most important emotions for the prediction of alliance were <italic>curiosity, confusion</italic>, and <italic>surprise</italic>.</p>
</sec>
<sec>
<title>Conclusions</title>
<p>Even though the classification results were only moderate, our model achieved a good performance especially for prediction of symptom severity. The results confirm the role of negative emotions in the prediction of symptom severity, while they also highlight the role of positive emotions in fostering a good alliance. Future directions entail the improvement of the labeled dataset, especially with regards to domain-specificity and incorporating context information. Additionally, other modalities and Natural Language Processsing (NLP)-based alliance assessment could be integrated.</p>
</sec>
</abstract>
<kwd-group>
<kwd>natural language processing</kwd>
<kwd>computational psychotherapy research</kwd>
<kwd>machine learning</kwd>
<kwd>explainable artificial intelligence</kwd>
<kwd>symptom severity</kwd>
<kwd>alliance</kwd>
<kwd>process-outcome-research</kwd>
</kwd-group>
<contract-num rid="cn001">LU 660/16-1, LU 660/20-1, LU 660/10-1</contract-num>
<contract-sponsor id="cn001">Deutsche Forschungsgemeinschaft<named-content content-type="fundref-id">10.13039/501100001659</named-content>
</contract-sponsor>
<counts>
<fig-count count="3"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="98"/>
<page-count count="13"/>
<word-count count="6533"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Digital Mental Health</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Emotions can be conceptualized as &#x201c;biologically based reactions that coordinate adaptive responding to important opportunities and challenges&#x201d; (<xref ref-type="bibr" rid="B1">1</xref>, p. 152). There are qualitative differences between emotions based on the opportunity or challenge that the emotion has been evolved to address, as well as its expression (<xref ref-type="bibr" rid="B2">2</xref>). Further, emotions can immediately impact behavior, quickly regulating one&#x2019;s behavior based on the situation (<xref ref-type="bibr" rid="B3">3</xref>). For instance, anger may be an adaptive reaction to an unfair treatment (<xref ref-type="bibr" rid="B4">4</xref>), prompting the person at which it is targeted to change their behavior according to the demand. Simultaneously, anger comes with specific facial features (<xref ref-type="bibr" rid="B5">5</xref>) and associated behaviors, such as speaking forcefully or even yelling.</p>
<p>Since emotions are an essential part of daily functioning, it is important that individuals are able to regulate them, that is, modulate the emotional experience and its expression (<xref ref-type="bibr" rid="B1">1</xref>). People who lack this ability, may be compromised in several domains of life, which could negatively affect mental health (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B6">6</xref>). Therefore, it comes as no surprise that many mental health disorders are associated with emotion regulation deficits (<xref ref-type="bibr" rid="B7">7</xref>).</p>
<p>Because of the importance of emotion regulation processes across various mental health disorders, emotions play an essential role in psychotherapy (<xref ref-type="bibr" rid="B8">8</xref>). Most importantly, they are associated with symptom severity in mood and anxiety disorders (<xref ref-type="bibr" rid="B9">9</xref>&#x2013;<xref ref-type="bibr" rid="B11">11</xref>). Even though, emotions and affect can be differentiated (e.g., affect is longer in duration, is less intentional, tends to have unknown causes, and has lower intensity), there is substantial overlap between both constructs (<xref ref-type="bibr" rid="B9">9</xref>). For instance, the correlation between fear (emotion) and anxiety (affect) was calculated as <italic>r</italic> = .72, amounting to more than 50% of shared variance (<xref ref-type="bibr" rid="B10">10</xref>). Therefore, the measurement of someone&#x2019;s emotions can provide an estimate of their affect. Simultaneously, dysregulated affect is an important feature in anxiety and depression (<xref ref-type="bibr" rid="B11">11</xref>), which are characterized by excessive negative (NA) and a lack of positive affect (PA). Generally, affect is sensitive to change: In a meta-analysis, psychotherapy for depression has been shown to decrease NA and increase PA (<xref ref-type="bibr" rid="B12">12</xref>).</p>
<p>According to the broaden-and-built theory, PA helps to strengthen and build resources by extending one&#x2019;s thought-action repertoire (<xref ref-type="bibr" rid="B13">13</xref>). For instance, PA comes with the urge to play, explore, savor, and connect, all of which can foster resources through the creation of new opportunities and strengthening of relationships. This, in turn, raises wellbeing and PA (<xref ref-type="bibr" rid="B13">13</xref>). Consequently, it is not surprising that PA can protect against depression (<xref ref-type="bibr" rid="B14">14</xref>), may mediate depression recovery (<xref ref-type="bibr" rid="B15">15</xref>), and that lack of PA is associated with typical depression symptoms, such as sadness, loss of interest, little energy, and apathy (<xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B17">17</xref>). Conversely, NA is linked with stress levels (<xref ref-type="bibr" rid="B18">18</xref>) and depressive symptoms (<xref ref-type="bibr" rid="B19">19</xref>). NA is a better predictor of depression deterioration than PA, differentiates better between depressed and healthy individuals (<xref ref-type="bibr" rid="B20">20</xref>), and predicts future depression onset while PA does not (<xref ref-type="bibr" rid="B21">21</xref>). Therefore, NA is likely a better marker for symptom severity than PA.</p>
<p>Beyond their association with symptom severity, emotions play another crucial role in the context of psychotherapy through their impact on the therapeutic alliance, which is one of the best predictors of successful treatment (<xref ref-type="bibr" rid="B22">22</xref>). Human beings are fundamentally social creatures and emotions are an essential mechanism for the regulation of social relationships (<xref ref-type="bibr" rid="B23">23</xref>). Much of the adaptive strength of emotions is mediated by their effects on interpersonal functioning so that they can be described as intrinsically interpersonal (<xref ref-type="bibr" rid="B24">24</xref>): Emotion expression helps people to recognize our needs and wishes, allowing them to support us and strengthening the mutual bond. However, positive interpersonal effects of emotion expression are not automatically given, but depend on several crucial factors (<xref ref-type="bibr" rid="B23">23</xref>). In particular, emotion regulation plays an important role: For instance, individuals with high levels of NA report more difficult and less satisfying romantic relationships (<xref ref-type="bibr" rid="B25">25</xref>). Though negative emotions can play an adaptive role as well, the excessive expression of NA can be devastating for romantic relationships, because it perpetuates a reciprocal spiral, from which it is difficult to disengage (<xref ref-type="bibr" rid="B26">26</xref>). Similarly, the expression of negative sentiment towards the therapist or the therapeutic situation is associated with lower levels of alliance (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B28">28</xref>). Depressed mood is associated with lower levels of emotion regulation, which can lead to anger management difficulties, reduced trust and forgiveness, heightened levels of social comparison, as well as social withdrawal, all of which can impair social functioning and therefore harm the therapeutic relationship (<xref ref-type="bibr" rid="B29">29</xref>). In summary, patient emotions associated with either withdrawal or confrontation and criticism may be particular harmful to the alliance (<xref ref-type="bibr" rid="B30">30</xref>). For example, patients with a lot of shame tend to withdraw, which leads to negative effects on the alliance (<xref ref-type="bibr" rid="B31">31</xref>), while anger, hostility, and frustration can impair the alliance via confrontation and criticism (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B28">28</xref>).</p>
<p>Contrary, positive emotions serve important social functions, which can improve the therapeutic alliance (<xref ref-type="bibr" rid="B32">32</xref>&#x2013;<xref ref-type="bibr" rid="B35">35</xref>). Most importantly, they can increase intimacy and emotional bond, as well as enhance motivation to achieve shared goals (<xref ref-type="bibr" rid="B35">35</xref>), both of which are pillars of the working alliance (<xref ref-type="bibr" rid="B36">36</xref>). These considerations are confirmed through longitudinal studies, that have shown bidirectional effects between positive emotions and alliance (<xref ref-type="bibr" rid="B32">32</xref>, <xref ref-type="bibr" rid="B34">34</xref>). Though we did not find results regarding the relative strength of negative and positive emotions on the therapeutic relationship, it is likely that negative emotions may have the greater impact, since negative events tend to have greater effects on most areas of life, including interpersonal relations (<xref ref-type="bibr" rid="B37">37</xref>).</p>
<p>Emotions can be assessed via many different means, including video, audio, electroencephalography (for an overview see <xref ref-type="bibr" rid="B38">38</xref>), electromyography, various other physiological measures (e.g., heart rate, blood pressure), or a combination of several modalities (<xref ref-type="bibr" rid="B39">39</xref>&#x2013;<xref ref-type="bibr" rid="B41">41</xref>). Different methods have been successfully employed depending on the data source. For electroencephalography (see <xref ref-type="bibr" rid="B38">38</xref>), features can be employed for machine learning from different domains, such as the time, frequency, or both. Additionally, employing deep learning, the raw data can be used without feature engineering. For instance, using frequency features, good accuracy (&gt;80%) has been achieved both for the classification of valence and arousal (<xref ref-type="bibr" rid="B42">42</xref>). Similar approaches are possible for other physiological data (<xref ref-type="bibr" rid="B39">39</xref>). For video emotion classification, deep learning models show competitive performance with a convolutional neural network achieving 66% accuracy in a facial classification (<xref ref-type="bibr" rid="B43">43</xref>). In the voice domain, a combination of convolutional neural networks and a transformer architectures (wav2vec 2.0; <xref ref-type="bibr" rid="B44">44</xref>) shows state-of-the-art performance across various tasks (<xref ref-type="bibr" rid="B45">45</xref>). For text data, current models successfully employ a transformer architecture (e.g., <xref ref-type="bibr" rid="B46">46</xref>).</p>
<p>However, better results can be achieved for multimodal models. For instance, automatic classification of basic emotions based on text, speech, and video in a hidden Markov model achieved good accuracy in an experimental setting (<xref ref-type="bibr" rid="B47">47</xref>). Regarding a naturalistic psychotherapy setting, emotions were mainly assessed via questionnaire measures (<xref ref-type="bibr" rid="B48">48</xref>) with notable exceptions, where emotions were judged by human raters (e.g., <xref ref-type="bibr" rid="B49">49</xref>, <xref ref-type="bibr" rid="B50">50</xref>). However, both of these approaches have drawbacks: Questionnaire measures can be burdensome for patients and are unable to track emotions over the course of a session. While human raters can indeed track emotions over the session, this is very time-consuming, so that it is difficult to apply to large session datasets. With the emergence of artificial intelligence (AI) and natural language processing (NLP), new approaches for the automatic analyses of large language corpora are available (<xref ref-type="bibr" rid="B51">51</xref>). NLP has already shown promising success in the identification of therapist skills (<xref ref-type="bibr" rid="B52">52</xref>), motivational interview adherence (<xref ref-type="bibr" rid="B53">53</xref>), or relevant session themes (<xref ref-type="bibr" rid="B54">54</xref>, <xref ref-type="bibr" rid="B55">55</xref>). In the context of emotion detection, M. Tanana et&#xa0;al. (<xref ref-type="bibr" rid="B56">56</xref>) trained uni-, bi-, and trigram<xref ref-type="fn" rid="fn1">
<sup>1</sup>
</xref> models on the detection of sentiment on 100,000 rated utterances from psychotherapy transcripts. This work was later extended by the inclusion of the transformer model Bidirectional Encoder Representations and Transformations (BERT; <xref ref-type="bibr" rid="B57">57</xref>) and a model based on positive and negative affective words from the Linguistic Inquiry and Word Count (LIWC; <xref ref-type="bibr" rid="B58">58</xref>). In this analysis, the BERT model showed the best performance (<xref ref-type="bibr" rid="B59">59</xref>). More recently, Eberhardt et&#xa0;al. (<xref ref-type="bibr" rid="B60">60</xref>) validated the performance of another transformer model on a set of 85 transcripts. They found significant correlations between automatically calculated sentiment and patient- and therapist-reported emotions. Further, symptom severity was significantly associated with negative sentiment.</p>
<p>While these results provide evidence for the reliability and validity of sentiment analysis, they are restricted to the valence dimension, classifying all utterance on a single dimension from negative to positive. Though the valence dimension is highly relevant in this context, at least six basic emotions can be distinguished with additional affect states (<xref ref-type="bibr" rid="B2">2</xref>), that can be organized across multiple dimensions (e.g., valence, intensity, intentionality, duration) and multiple categories (e.g., causes, function, mimic, behavior).</p>
<sec id="s1_1">
<title>Objectives</title>
<p>Therefore, we aim to fine-tune a large language model (LLM) for a more fine-grained analysis of emotions in the German language. We want to show the clinical utility of this approach by applying this model to a dataset of psychotherapy sessions to predict symptom severity and alliance, employing explainable AI to identify the most important emotions for the prediction of both.</p>
</sec>
<sec id="s1_2">
<title>Hypotheses</title>
<p>We expect our fine-tuned German model to accurately capture emotions in the transcript, allowing for a prediction of patient symptom severity. Regarding symptom severity, we expect negative emotions to predict higher symptom severity and positive emotions to predict lower symptom severity. Further, we expect negative emotions to have a higher impact on the prediction of symptom severity than positive emotions. Regarding the alliance, we expect positive emotions to predict better alliance. For negative emotions, we expect lower levels of alliance in general, though particularly for emotions associated with withdrawal (such as embarrassment and confusion) or confrontation (such as anger and disapproval). Again, we expected negative emotions to have a higher impact on the alliance scores.</p>
</sec>
</sec>
<sec id="s2">
<title>Methods</title>
<sec id="s2_1">
<title>Patients and therapists</title>
<p>Our dataset contained 124 patients (65.8% female) who had received treatment at an university outpatient clinic in Trier, Germany. On average, patients were 38.8 years (<italic>SD</italic> = 12.7) old. Regarding the socioeconomic status, almost all had either finished a secondary school certificate (51.6%) or their A-levels (42.1%). Most had finished an apprenticeship (41.3%), while 18.2% were currently in training or studying and 11.6% had a university degree. All patients underwent a diagnostic interview employing the Structured Clinical Interview for Axis I DSM-IV Disorders-Patient Edition (SCID-I; <xref ref-type="bibr" rid="B61">61</xref>). They were mostly diagnosed with primary diagnoses of affective disorders (<italic>n</italic> = 56), anxiety disorders (<italic>n</italic> = 24), and trauma and adjustment disorders (<italic>n</italic> = 16). On average, they received 2.3 (<italic>SD</italic> = 1.3, <italic>min</italic> = 1, <italic>max</italic> = 5) comorbid diagnoses.</p>
<p>The treatment was conducted by 47 therapists with a psychology master degree. All therapists had at least one year of prior treatment experience and were either already licensed CBT therapists or currently enrolled in training. They received supervision regularly.</p>
</sec>
<sec id="s2_2">
<title>Treatment</title>
<p>The treatment consisted of weekly CBT sessions. While the first two sessions served diagnostic purposes (initial assessment in session 1 and SCID-I interview in session 2), the treatment began in the third session. On average, patients received 35.7 (<italic>SD</italic> = 19.7) sessions.</p>
</sec>
<sec id="s2_3">
<title>Instruments and measures</title>
<sec id="s2_3_1">
<title>Symptom severity</title>
<p>Prior to each session, symptom severity was assessed via the Hopkins Symptom Checklist-11 (HSCL-11; <xref ref-type="bibr" rid="B62">62</xref>). The HSCL-11 is an 11-item self-report scale about general psychological distress. Patients rated a list of 11 symptoms (fearfulness, anxiousness, agitation, panic, sleep problems, hopelessness, loneliness, low mood, lack of interest, suicidal ideation, and worthlessness) on a Likert-type scale from 1 (<italic>not at all</italic>) to 4 (<italic>extremely</italic>). Symptom severity was then calculated as the mean score on these items. The HSCL-11 contains a depression and anxiety subscale and is highly correlated with various other anxiety and depression questionnaires (<xref ref-type="bibr" rid="B63">63</xref>). For instance, high associations have been found for the Brief Symptom Inventory (BSI; <xref ref-type="bibr" rid="B64">64</xref>; <italic>r</italic> = .91) and its subscales for anxiety (<italic>r</italic> = .82) and depression (<italic>r</italic> = .91). Regarding depression, high correlations have also been found for the Patient Health Questionnaire-9 (PHQ-9; <xref ref-type="bibr" rid="B65">65</xref>; <italic>r</italic> = .81). For worry symptoms, high correlations exist with the Generalized Anxiety Disorder 7 (GAD-7; <xref ref-type="bibr" rid="B66">66</xref>; <italic>r</italic> = .72). The HSCL-11 has shown good sensitivity to change (<xref ref-type="bibr" rid="B67">67</xref>). Assessing the third session of each patient in this sample, we also found good internal consistency (&#x3c9; = .92) according to McDonald&#x2019;s omega (<xref ref-type="bibr" rid="B68">68</xref>). Across all sessions in our dataset, average symptom severity was at 2.2 (<italic>SD</italic> = 0.79) on a scale from 1 to 4.</p>
</sec>
<sec id="s2_3_2">
<title>Alliance</title>
<p>Therapeutic alliance was assessed by the patient via the Session Rating Scale (SRS; <xref ref-type="bibr" rid="B69">69</xref>). The patients filled the questionnaire after each session. The SRS contains the conceptualization by Bordin (<xref ref-type="bibr" rid="B36">36</xref>) of three alliance components: 1. Affective bond, 2. Goal agreement, 3. Task agreement, which are assessed by three items. The SRS contains an additional fourth item, which reflects the overall alliance. The final score is calculated as a mean across all four items. The SRS has shown generally satisfying reliability, ranging from <italic>&#x3b1;</italic> = .70 to.97 and a test-retest reliability between <italic>r</italic> = .54 and.70 (<xref ref-type="bibr" rid="B70">70</xref>). In our sample, the SRS showed a good internal consistency in the third session (<italic>&#x3c9;</italic> = .83). Correlations with other alliance measures have been moderate (HAQ-II; <italic>r</italic> = .48; <xref ref-type="bibr" rid="B69">69</xref>; WAI; <italic>r</italic> = .57 &#x2013;.65; <xref ref-type="bibr" rid="B71">71</xref>).</p>
</sec>
</sec>
<sec id="s2_4">
<title>Transcripts</title>
<p>The transcripts corpus consisted of 553 transcripts of psychotherapy sessions. On average, there were 4.5 (<italic>SD</italic> = 4.9) transcripts per patient, generally starting with session 3 and continuing with every fifth session (e.g., 3, 5, 10, &#x2026;).</p>
<p>Transcription was conducted without the use of transcription software by psychology students based on the session recordings. Names of persons or places were removed to reduce identifiable information. The transcripts contained sparse annotations about nonverbal behavior or interruption in parentheses. Each transcript was organized as a table of consecutive speech turns by therapist and patient. The transcripts were not labelled for emotions. For our analysis, we retained only the patients&#x2019; speech turns, leaving 104,557 speech turns. We further split these speech turns into sentences for the model inference and retained all sentences with at least three words, leaving 233,648 sentences. Average sentence length was 12.7 (<italic>SD</italic> = 10.4) words. Per session, patients spoke on average 422.5 (<italic>SD</italic> = 174.1) sentences, amounting to 5,362.6 (<italic>SD</italic> = 2,089.3) words.</p>
</sec>
<sec id="s2_5">
<title>GoEmotions dataset</title>
<p>We used the <italic>GoEmotions</italic> dataset (<xref ref-type="bibr" rid="B72">72</xref>) as our labeled training data. The dataset consists of 54k labeled comments. All comments were taken from Reddit, while excluding offensive, vulgar, religion, and identity words. Comments had a length between 3 and 30 words and were balanced across the sentiment, different emotions, and subreddits. The comments were annotated by three raters across a list of 28 emotions (or respectively 27 emotions and a &#x2018;neutral&#x2019; category). If reasonable, multiple labels could be given to a single comment. Interrater agreement was assessed via Cohen&#x2019;s kappa by Demszky et&#xa0;al. (<xref ref-type="bibr" rid="B72">72</xref>), ranging between 0.331 (<italic>grief</italic>) and 0.468 (<italic>admiration</italic>). As is shown in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>, the posts were not well balanced across all emotions with especially neutral and admiration and approval being the most prevalent ones, while relief, pride and grief were very rare.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Barplot of the emotion frequency in the train set of GoEmotions.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1504306-g001.tif"/>
</fig>
</sec>
<sec id="s2_6">
<title>XLM-RoBERTa-base language model</title>
<p>We employed the <italic>XLM-RoBERTa-base</italic> model (<xref ref-type="bibr" rid="B73">73</xref>) as our base LLM, which we fine-tuned on the dataset. The <italic>XLM-RoBERTa-base</italic> model was trained on a masked multilingual dataset of over 2 terabyte (of which 66.6 gigabyte were in German), which allows the model to perform in over 100 languages. The model has an embedding size of 1024 tokens, corresponding to a maximal input context length of about 600&#x2013;800 words. The <italic>XLM-RoBERTa-base</italic> model was pretrained with a Masked Language Modeling objective by predicting 15% of randomly masked words to learn a bidirectional representation of the sentence. Since it was only trained on raw texts without human labeling, it is intended to be fine-tuned on a downstream task, such as the classification task that is contained in this paper.</p>
</sec>
<sec id="s2_7">
<title>Data analytic strategy</title>
<p>The analyses were conducted with Python 3.9. The complete workflow is shown in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref> and is elaborated below.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Complete workflow for the data analysis (blue represents data and yellow the LLMs). The GoEmotions dataset is translated into German and used to fine-tune the XLM-RoBERTa LLM. The LLM is then employed to infer the emotions from the therapy transcripts to predict the Routine Outcome Monitoring (ROM) data.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1504306-g002.tif"/>
</fig>
<sec id="s2_7_1">
<title>Pre-processing and large language model fine-tuning</title>
<p>We selected the 54k labeled comments from the raw <italic>GoEmotions</italic> dataset and used automatic translation to German via DeepL (<xref ref-type="bibr" rid="B74">74</xref>). The dataset was split into 80% training set, 10% validation set, and 10% test set. Emotions were classified to a comment via one-hot encoding<xref ref-type="fn" rid="fn2">
<sup>2</sup>
</xref>. We then fine-tuned the <italic>XLM-RoBERTa-base</italic> model on the data in a multilabel classification task (i.e., several emotions could be classified to one sentence) with a batch size of 16, learning rate of 3e&#x2013;5, and weight decay of 0.01. The complete training code can be accessed via the OSF repository (<xref ref-type="bibr" rid="B75">75</xref>). Training was conducted for 10 epochs in the dataset format, which allows for faster processing speed (<xref ref-type="bibr" rid="B76">76</xref>). The loss function was Binary Cross-Entropy (BCE) with logits because of the multilabel implementation.</p>
<p>The final model showed similar metrics in the test set (<italic>F1<sub>macro</sub>
</italic> = 0.45, <italic>Kappa<sub>macro</sub>
</italic> = 0.42, <italic>Accuracy</italic> = 0.41) as the original model (<italic>F1<sub>macro</sub>
</italic> = 0.46) by Demszky et&#xa0;al. (<xref ref-type="bibr" rid="B72">72</xref>). Cohen&#x2019;s Kappa calculated between predicted emotions and labeled emotions ranged between 0.15 and 0.88 with a mean of 0.42, indicating moderate agreement (<xref ref-type="bibr" rid="B77">77</xref>). The confusion matrix in the final test set is shown in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Confusion matrix in the final test set. The color grading is exponentially scaled.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1504306-g003.tif"/>
</fig>
</sec>
<sec id="s2_7_2">
<title>Large language model inference</title>
<p>After the fine-tuning was completed, we applied the model for the emotion classification in our dataset. As the labeled data had a length of 3 to 30 words, we decided to conduct the classification on a sentence level. Each sentence by a patient was then run through the model pipeline and was classified across the 28 different emotions by assigning each emotion a probability between 0 and 1 for each sentence. For example, if a sentence was given a probability of 0.8 for <italic>admiration</italic>, this could be interpreted as the predicted probability for the presence of <italic>admiration</italic> in the sentence. Therefore, higher values correspond to a higher probability for the presence of a given emotion.</p>
</sec>
<sec id="s2_7_3">
<title>Evaluation strategy for the prediction of outcome</title>
<p>For the prediction of outcome (i.e., alliance and symptom severity), the automatically classified emotion probabilities were aggregated at a session level by calculating the mean for each emotion per session. Since the symptom severity measure contained a depression and an anxiety subscale, we conducted two sensitivity analyses, predicting the respective subscale. The 28 aggregated emotion probabilities were the features for the prediction. Employing nested cross-validation, several machine learning algorithms competed against each other in an internal five-fold cross-validation, while only the best performing algorithm was selected as the algorithm of choice for the respective test set in the external ten-fold cross-validation via the python library XRAI (<xref ref-type="bibr" rid="B78">78</xref>). We evaluated the model performance via correlation (<italic>r;</italic> <xref ref-type="bibr" rid="B79">79</xref>), normalized root mean squared error (NRMSE; <xref ref-type="bibr" rid="B80">80</xref>), and mean absolute error (MAE; <xref ref-type="bibr" rid="B81">81</xref>). For the NRMSE, normalization was conducted by dividing through the standard deviation of the target variable. Confidence intervals were calculated by bootstrapping across the ten test folds.</p>
</sec>
<sec id="s2_7_4">
<title>Machine learning algorithms</title>
<p>In order to achieve good prediction metrics, we chose a diverse set of ML algorithms to account for feature interactions, nonlinear effects and collinearity. The following machine learning algorithms competed against each other in the internal cross-validation: 1. Least Absolute Shrinkage and Selection Operator (Lasso; <xref ref-type="bibr" rid="B82">82</xref>), 2. Elastic net regularization and variable selection (Elastic Net; <xref ref-type="bibr" rid="B83">83</xref>), 3. eXtreme Gradient Boosting (XGBoost; <xref ref-type="bibr" rid="B84">84</xref>), 4. Random Forest (RF; <xref ref-type="bibr" rid="B85">85</xref>), 5. Support Vector Regression (SVR; <xref ref-type="bibr" rid="B86">86</xref>), and 6. SuperLearner (<xref ref-type="bibr" rid="B87">87</xref>). The SuperLearner integrates the ensemble of previous learners (i.e., Lasso, Elastic Net, XGBoost, RF, and SVR), using their predicted scores as features for an SVR meta-learner.</p>
<p>Out of these six different algorithms, the machine learning algorithm with the best mean correlation in the internal five-fold cross-validation was selected as the algorithm for the external test fold. Therefore, it could be possible that different algorithms were selected across the ten test folds, e.g., five times XGBoost, three times RF, and two times SVR.</p>
</sec>
<sec id="s2_7_5">
<title>Model explanation</title>
<p>In general, machine-learning models are not very well explainable due to their complex and nonlinear modeling (<xref ref-type="bibr" rid="B88">88</xref>). However, one proposed solution has been the use of Shapley values (<xref ref-type="bibr" rid="B89">89</xref>), which allow for an estimation of feature impact. To this end, we employed the python package <italic>SHAP</italic> (SHapley Additive exPlanations; <xref ref-type="bibr" rid="B90">90</xref>, <xref ref-type="bibr" rid="B91">91</xref>). <italic>SHAP</italic> allows for the assessment of the individual feature impact (i.e., how much are the predicted values influenced by this feature)?, as well as the impact of groups of features. Further, <italic>SHAP</italic> can be used to assess the direction of a feature impact (e.g., do higher feature values predict higher outcome values)?, as well as interactions between features.</p>
</sec>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Descriptive statistics</title>
<p>The mean probability of all emotions and their reliability is presented in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. In addition, the valence of each emotion is indicated (positive/negative/neutral). Altogether, the model classified 14 positive emotions, 12 negative emotions and 2 neutral emotions. The most probable emotions in the transcript corpus were (with the exception of <italic>neutral</italic>) <italic>approval</italic> (12.98%)<italic>, disapproval</italic> (6.11%)<italic>, confusion</italic> (4.32%), and <italic>realization</italic> (4.14%). The least probable emotions were <italic>grief</italic> (0.11%), <italic>remorse</italic> (0.27%), <italic>amusement</italic> (0.73%), and <italic>relief</italic> (0.58%). Regarding the reliability of the assessment, we provided the F1 metric and Cohen&#x2019;s Kappa (<xref ref-type="bibr" rid="B77">77</xref>) from the test set in the <italic>GoEmotions</italic> dataset. F1 is the harmonic mean between precision (how often is the model correct when it predicts the emotion)? and recall (how often does the model detect the emotion when it actually occurs)?. Kappa can be interpreted according to (<xref ref-type="bibr" rid="B77">77</xref>) as fair agreement (&gt;.2), moderate agreement (&gt;.4), substantial agreement (&gt;.6), and almost perfect agreement (&gt;.8). Reliability was substantially high for some positive emotions (e.g., <italic>admiration, amusement, gratitude</italic>, and <italic>love</italic>), while the negative emotions showed moderate agreement at best (e.g., <italic>fear</italic>, <italic>remorse</italic>, and <italic>sadness</italic>).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Mean probability and standard deviations, as well as F1 and kappa values for each emotion.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Emotion (pos./neg./neutral)</th>
<th valign="top" align="center">M</th>
<th valign="top" align="center">SD</th>
<th valign="top" align="center">F1</th>
<th valign="top" align="center">Cohen&#x2019;s Kappa</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">admiration (pos.)</td>
<td valign="top" align="center">2.35%</td>
<td valign="top" align="center">1.41%</td>
<td valign="top" align="left">.64</td>
<td valign="middle" align="left">.601</td>
</tr>
<tr>
<td valign="top" align="left">amusement (pos.)</td>
<td valign="top" align="center">0.73%</td>
<td valign="top" align="center">0.66%</td>
<td valign="top" align="left">.78</td>
<td valign="middle" align="left">.767</td>
</tr>
<tr>
<td valign="top" align="left">anger (neg.)</td>
<td valign="top" align="center">0.88%</td>
<td valign="top" align="center">0.67%</td>
<td valign="top" align="left">.38</td>
<td valign="middle" align="left">.358</td>
</tr>
<tr>
<td valign="top" align="left">annoyance (neg.)</td>
<td valign="top" align="center">3.17%</td>
<td valign="top" align="center">1.32%</td>
<td valign="top" align="left">.27</td>
<td valign="middle" align="left">.229</td>
</tr>
<tr>
<td valign="top" align="left">approval (pos.)</td>
<td valign="top" align="center">12.98%</td>
<td valign="top" align="center">4.40%</td>
<td valign="top" align="left">.34</td>
<td valign="middle" align="left">.293</td>
</tr>
<tr>
<td valign="top" align="left">caring (pos.)</td>
<td valign="top" align="center">0.79%</td>
<td valign="top" align="center">0.51%</td>
<td valign="top" align="left">.38</td>
<td valign="middle" align="left">.365</td>
</tr>
<tr>
<td valign="top" align="left">confusion (neg.)</td>
<td valign="top" align="center">4.32%</td>
<td valign="top" align="center">2.06%</td>
<td valign="top" align="left">.40</td>
<td valign="middle" align="left">.378</td>
</tr>
<tr>
<td valign="top" align="left">curiosity (pos.)</td>
<td valign="top" align="center">2.10%</td>
<td valign="top" align="center">1.42%</td>
<td valign="top" align="left">.51</td>
<td valign="middle" align="left">.486</td>
</tr>
<tr>
<td valign="top" align="left">desire (pos.)</td>
<td valign="top" align="center">0.58%</td>
<td valign="top" align="center">0.49%</td>
<td valign="top" align="left">.39</td>
<td valign="middle" align="left">.387</td>
</tr>
<tr>
<td valign="top" align="left">disappointment (neg.)</td>
<td valign="top" align="center">2.31%</td>
<td valign="top" align="center">1.03%</td>
<td valign="top" align="left">.19</td>
<td valign="middle" align="left">.170</td>
</tr>
<tr>
<td valign="top" align="left">disapproval (neg.)</td>
<td valign="top" align="center">6.11%</td>
<td valign="top" align="center">2.02%</td>
<td valign="top" align="left">.32</td>
<td valign="middle" align="left">.286</td>
</tr>
<tr>
<td valign="top" align="left">disgust (neg.)</td>
<td valign="top" align="center">0.65%</td>
<td valign="top" align="center">0.45%</td>
<td valign="top" align="left">.41</td>
<td valign="middle" align="left">.395</td>
</tr>
<tr>
<td valign="top" align="left">embarrassment (neg.)</td>
<td valign="top" align="center">0.43%</td>
<td valign="top" align="center">0.41%</td>
<td valign="top" align="left">.37</td>
<td valign="middle" align="left">.367</td>
</tr>
<tr>
<td valign="top" align="left">excitement (pos.)</td>
<td valign="top" align="center">0.87%</td>
<td valign="top" align="center">0.55%</td>
<td valign="top" align="left">.35</td>
<td valign="middle" align="left">.339</td>
</tr>
<tr>
<td valign="top" align="left">fear (neg.)</td>
<td valign="top" align="center">1.23%</td>
<td valign="top" align="center">1.09%</td>
<td valign="top" align="left">.59</td>
<td valign="middle" align="left">.584</td>
</tr>
<tr>
<td valign="top" align="left">gratitude (pos.)</td>
<td valign="top" align="center">0.40%</td>
<td valign="top" align="center">0.34%</td>
<td valign="top" align="left">.89</td>
<td valign="middle" align="left">.882</td>
</tr>
<tr>
<td valign="top" align="left">grief (neg.)</td>
<td valign="top" align="center">0.11%</td>
<td valign="top" align="center">0.19%</td>
<td valign="top" align="left">.31</td>
<td valign="middle" align="left">.307</td>
</tr>
<tr>
<td valign="top" align="left">joy (pos.)</td>
<td valign="top" align="center">1.68%</td>
<td valign="top" align="center">0.97%</td>
<td valign="top" align="left">.51</td>
<td valign="middle" align="left">.499</td>
</tr>
<tr>
<td valign="top" align="left">love (pos.)</td>
<td valign="top" align="center">0.75%</td>
<td valign="top" align="center">0.69%</td>
<td valign="top" align="left">.73</td>
<td valign="middle" align="left">.721</td>
</tr>
<tr>
<td valign="top" align="left">nervousness (neg.)</td>
<td valign="top" align="center">0.91%</td>
<td valign="top" align="center">0.73%</td>
<td valign="top" align="left">.28</td>
<td valign="middle" align="left">.276</td>
</tr>
<tr>
<td valign="top" align="left">optimism (pos.)</td>
<td valign="top" align="center">1.43%</td>
<td valign="top" align="center">0.72%</td>
<td valign="top" align="left">.53</td>
<td valign="middle" align="left">.512</td>
</tr>
<tr>
<td valign="top" align="left">pride (pos.)</td>
<td valign="top" align="center">0.24%</td>
<td valign="top" align="center">0.28%</td>
<td valign="top" align="left">.30</td>
<td valign="middle" align="left">.299</td>
</tr>
<tr>
<td valign="top" align="left">realization (pos.)</td>
<td valign="top" align="center">4.14%</td>
<td valign="top" align="center">1.66%</td>
<td valign="top" align="left">.17</td>
<td valign="middle" align="left">.150</td>
</tr>
<tr>
<td valign="top" align="left">relief (pos.)</td>
<td valign="top" align="center">0.58%</td>
<td valign="top" align="center">0.36%</td>
<td valign="top" align="left">.27</td>
<td valign="middle" align="left">.266</td>
</tr>
<tr>
<td valign="top" align="left">remorse (neg.)</td>
<td valign="top" align="center">0.27%</td>
<td valign="top" align="center">0.25%</td>
<td valign="top" align="left">.55</td>
<td valign="middle" align="left">.545</td>
</tr>
<tr>
<td valign="top" align="left">sadness (neg.)</td>
<td valign="top" align="center">1.92%</td>
<td valign="top" align="center">1.18%</td>
<td valign="top" align="left">.50</td>
<td valign="middle" align="left">.488</td>
</tr>
<tr>
<td valign="top" align="left">surprise (neutral)</td>
<td valign="top" align="center">0.50%</td>
<td valign="top" align="center">0.40%</td>
<td valign="top" align="left">.53</td>
<td valign="middle" align="left">.514</td>
</tr>
<tr>
<td valign="top" align="left">neutral (neutral)</td>
<td valign="top" align="center">62.59%</td>
<td valign="top" align="center">6.13%</td>
<td valign="top" align="left">.60</td>
<td valign="middle" align="left">.410</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>pos<italic>.,</italic> positive; neg<italic>.,</italic> negative<italic>; M</italic>, mean; <italic>SD</italic>, standard deviation. <italic>F1</italic>, harmonic mean between precision (ratio between correct and total predictions of the emotion) and recall (ratio between correct predictions and total occurrence of the emotion); <italic>Cohen&#x2019;s Kappa</italic>, measure of model-rater-reliability. <italic>Mean</italic> and <italic>SD</italic> values are reported from the transcript corpus, while <italic>F1</italic> and <italic>Cohen&#x2019;s Kappa</italic> were calculated in the <italic>GoEmotions</italic> dataset.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>To give some impression about the labeled statements from psychotherapy transcripts, we compared some patient statements that were classified by the LLM with original comments from the GoEmotions dataset for different emotions (see <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). Due to confidentiality, the psychotherapy statements are from publicly available transcripts. We have provided a full list containing each emotion in our OSF (<xref ref-type="bibr" rid="B75">75</xref>).</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Example phrases from GoEmotions and from psychotherapy transcripts for different emotions.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Label</th>
<th valign="top" align="left">GoEmotions</th>
<th valign="top" align="left">Transcript</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">admiration</td>
<td valign="top" align="left">
<italic>aw, thanks! I appreciate that!</italic>
</td>
<td valign="top" align="left">
<italic>Yes, I moved them from one wall to the other and it looks really good.</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">anger</td>
<td valign="top" align="left">
<italic>Ok, then what the actual f** is your plan?</italic>
</td>
<td valign="top" align="left">
<italic>He then comes up and tries to open them and I&#x2019;m so angry I don&#x2019;t want to talk.</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">embarrassment</td>
<td valign="top" align="left">
<italic>Oooooffff. That&#x2019;s real awkward, but I mean that somehow still ended better than I expected so. Kudos ig??</italic>
</td>
<td valign="top" align="left">
<italic>I mean, but I&#x2019;m so ashamed of it.</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">fear</td>
<td valign="top" align="left">
<italic>I am afraid to look, but my morbid curiosity draws me to ask.</italic>
</td>
<td valign="top" align="left">
<italic>I said, &#x2018;We&#x2019;re all scared.&#x2019; But to my brother, I said, &#x2018;I&#x2019;m scared.&#x2019;</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">realization</td>
<td valign="top" align="left">
<italic>It&#x2019;s like you didn&#x2019;t even read the comment you&#x2019;re responding to.</italic>
</td>
<td valign="top" align="left">
<italic>I really do notice a difference.</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">sadness</td>
<td valign="top" align="left">
<italic>so painful to watch</italic>
</td>
<td valign="top" align="left">
<italic>But that was hard to hear too, because when I was told that I was losing a tooth, I just started crying.</italic>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Sample statements were provided by publicly available transcript at <ext-link ext-link-type="uri" xlink:href="http://www.alexanderstreet.com">alexanderstreet.com</ext-link>.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_2">
<title>Prediction of symptom severity</title>
<p>The machine learning model containing the 28 emotions as features showed a good performance with (<italic>r</italic> = .50 (95%-CI:.42,.57), NRMSE = 0.87 (95%-CI:.83,.91) and MAE = .57 (95%-CI:.55,.59). The selected learners for the external cross-validation were RF (6x) and SVR (4x). The most important predictors (see <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>) as calculated according to the relative <italic>SHAP</italic> value were <italic>approval</italic> (9.2%), <italic>sadness</italic> (8.7%), <italic>fear</italic> (7.8%), <italic>disappointment</italic> (6.4%), <italic>desire</italic> (6.3%), and <italic>sadness</italic> (6.2%). We expected negative emotions to predict higher symptom severity and positive emotions to predict lower symptom severity. This was generally accurate, though some positive emotions were associated with higher symptom severity, namely <italic>desire, pride, caring, amusement</italic>, and <italic>love.</italic> Simultaneously, no negative emotion was associated with less symptom severity. Further, we expected negative emotions to have a stronger impact on symptom severity than positive emotions. Altogether, <italic>approval, admiration, optimism, realization, excitement, gratitude</italic>, and <italic>relief</italic> were positive emotions significantly associated with lower symptom severity, pertaining to an aggregated feature impact of 27.0%, while all negative emotions <italic>(anger, fear, disappointment, sadness, nervousness, disapproval, annoyance, embarrassment, confusion, disgust, grief, and remorse)</italic> were significantly associated with higher symptom severity with almost twice the aggregated impact of negative emotions (51.8%), confirming the hypothesis. The remaining emotions were not significantly associated with symptom severity.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Symptom severity prediction: emotions, relative SHAP value, and correlation with SHAP value.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" rowspan="2" align="center">Emotion</th>
<th valign="top" colspan="2" align="center">Symptom Severity</th>
</tr>
<tr>
<th valign="top" align="center">Relative SHAP value</th>
<th valign="top" align="center">Correlation with SHAP value (95%-CI)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">approval</td>
<td valign="top" align="center">9.16%</td>
<td valign="top" align="center">-.63 (-.69, -.55)</td>
</tr>
<tr>
<td valign="top" align="left">anger</td>
<td valign="top" align="center">8.67%</td>
<td valign="top" align="center">.86 (.81,.91)</td>
</tr>
<tr>
<td valign="top" align="left">fear</td>
<td valign="top" align="center">7.77%</td>
<td valign="top" align="center">.88 (.84,.92)</td>
</tr>
<tr>
<td valign="top" align="left">disappointment</td>
<td valign="top" align="center">6.42%</td>
<td valign="top" align="center">.79 (.73,.84)</td>
</tr>
<tr>
<td valign="top" align="left">desire</td>
<td valign="top" align="center">6.32%</td>
<td valign="top" align="center">.90 (.85,.95)</td>
</tr>
<tr>
<td valign="top" align="left">sadness</td>
<td valign="top" align="center">6.24%</td>
<td valign="top" align="center">.83 (.78,.88)</td>
</tr>
<tr>
<td valign="top" align="left">admiration</td>
<td valign="top" align="center">5.96%</td>
<td valign="top" align="center">-.71 (-.79, -.64)</td>
</tr>
<tr>
<td valign="top" align="left">nervousness</td>
<td valign="top" align="center">4.72%</td>
<td valign="top" align="center">.79 (.72,.85)</td>
</tr>
<tr>
<td valign="top" align="left">disapproval</td>
<td valign="top" align="center">3.76%</td>
<td valign="top" align="center">.82 (.78,.86)</td>
</tr>
<tr>
<td valign="top" align="left">neutral</td>
<td valign="top" align="center">3.46%</td>
<td valign="top" align="center">-.01 (-.38,.37)</td>
</tr>
<tr>
<td valign="top" align="left">annoyance</td>
<td valign="top" align="center">3.38%</td>
<td valign="top" align="center">.89 (.84,.93)</td>
</tr>
<tr>
<td valign="top" align="left">optimism</td>
<td valign="top" align="center">3.29%</td>
<td valign="top" align="center">-.78 (-.83, -.73)</td>
</tr>
<tr>
<td valign="top" align="left">realization</td>
<td valign="top" align="center">3.18%</td>
<td valign="top" align="center">-.89 (-.91, -.86)</td>
</tr>
<tr>
<td valign="top" align="left">embarrassment</td>
<td valign="top" align="center">2.54%</td>
<td valign="top" align="center">.75 (.67,.83)</td>
</tr>
<tr>
<td valign="top" align="left">confusion</td>
<td valign="top" align="center">2.43%</td>
<td valign="top" align="center">.81 (.73,.87)</td>
</tr>
<tr>
<td valign="top" align="left">excitement</td>
<td valign="top" align="center">2.42%</td>
<td valign="top" align="center">-.56 (-.65, -.47)</td>
</tr>
<tr>
<td valign="top" align="left">disgust</td>
<td valign="top" align="center">2.12%</td>
<td valign="top" align="center">.80 (.75,.85)</td>
</tr>
<tr>
<td valign="top" align="left">pride</td>
<td valign="top" align="center">2.08%</td>
<td valign="top" align="center">.73 (.65,.81)</td>
</tr>
<tr>
<td valign="top" align="left">grief</td>
<td valign="top" align="center">1.98%</td>
<td valign="top" align="center">.55 (.44,.67)</td>
</tr>
<tr>
<td valign="top" align="left">caring</td>
<td valign="top" align="center">1.92%</td>
<td valign="top" align="center">.29 (.04,.51)</td>
</tr>
<tr>
<td valign="top" align="left">surprise</td>
<td valign="top" align="center">1.90%</td>
<td valign="top" align="center">-.60 (-.79, -.37)</td>
</tr>
<tr>
<td valign="top" align="left">remorse</td>
<td valign="top" align="center">1.78%</td>
<td valign="top" align="center">.33 (.04,.57)</td>
</tr>
<tr>
<td valign="top" align="left">joy</td>
<td valign="top" align="center">1.62%</td>
<td valign="top" align="center">-.18 (-.40,.02)</td>
</tr>
<tr>
<td valign="top" align="left">gratitude</td>
<td valign="top" align="center">1.60%</td>
<td valign="top" align="center">-.47 (-.70, -.22)</td>
</tr>
<tr>
<td valign="top" align="left">amusement</td>
<td valign="top" align="center">1.40%</td>
<td valign="top" align="center">.33 (.12,.53)</td>
</tr>
<tr>
<td valign="top" align="left">relief</td>
<td valign="top" align="center">1.38%</td>
<td valign="top" align="center">-.51 (-.65, -.37)</td>
</tr>
<tr>
<td valign="top" align="left">curiosity</td>
<td valign="top" align="center">1.34%</td>
<td valign="top" align="center">.14 (-.08,.35)</td>
</tr>
<tr>
<td valign="top" align="left">love</td>
<td valign="top" align="center">1.14%</td>
<td valign="top" align="center">.39 (.20,.55)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_3">
<title>Sensitivity analyses for the prediction of the anxiety and the depression subscale</title>
<p>Regarding the prediction of the anxiety (<italic>r</italic> = .47, 95%-CI: .40, .55) and depression (.53, 95%-CI: .47, .59) subscales, good metrics were achieved. A list of all associated emotions and their relative impact can be obtained from <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Tables 1, 2</bold>
</xref>. For the anxiety subscale, the emotions with the highest positive impact were <italic>fear</italic> (17.3%), <italic>sadness</italic> (8.6%), and <italic>nervousness</italic> (7.3%), while <italic>approval</italic> (10.4%) and <italic>admiration</italic> (6.1%) had the highest negative impact. Regarding depression, <italic>sadness</italic> (18.6%), <italic>grief</italic> (8.0%) and <italic>disappointment</italic> (7.2%) had the highest positive and <italic>approval</italic> (17.7%) and <italic>realization</italic> (4.2%) the highest negative impact.</p>
</sec>
<sec id="s3_4">
<title>Prediction of alliance</title>
<p>For the alliance prediction, the model performance was low to moderate with (<italic>r</italic> = .20 (95%-CI:&#xb4;.06,.32), NRMSE = 0.98 (95%-CI:.95, 1.01) and MAE = 8.76 (95%-CI: 8.34, 9.22). Regarding the external test set learners, Elastic Net (4x), as well as Lasso (3x) and RF (3x) were selected. The emotions with the highest impact (see <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>) were <italic>curiosity</italic> (24.9%), <italic>confusion</italic> (16.4%), and <italic>surprise</italic> (5.4%). We expected positive emotions to predict higher alliance and negative emotions to predict lower alliance. For negative emotions, this was not the case in general, since <italic>annoyance, remorse, disgust, nervousness, sadness</italic>, and <italic>embarrassment</italic> were not associated with lower alliance. Though, <italic>confusion</italic> as a marker of a withdrawal rupture and <italic>anger</italic> and <italic>disapproval</italic> as markers of confrontation ruptures predicted lower alliance. Positive emotions were mostly associated with higher alliance with the notable exception of <italic>curiosity</italic> and <italic>approval</italic>. Some emotions (e.g., <italic>optimism, nervousness</italic>) were not significantly associated with alliance. We expected negative emotions (<italic>confusion, anger, disapproval, fear, disappointment, grief;</italic> 27.5%) to have a greater negative impact on alliance than the positive impact of positive emotions (<italic>desire, joy, admiration, excitement, realization, amusement, relief, love, caring;</italic> 28.95%), which was not the case.</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>Alliance prediction: emotions, relative SHAP value, and correlation with SHAP value.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" rowspan="2" align="center">Emotion</th>
<th valign="top" colspan="2" align="center">Alliance</th>
</tr>
<tr>
<th valign="top" align="center">Relative SHAP value</th>
<th valign="top" align="center">Correlation with SHAP value (95%-CI)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">curiosity</td>
<td valign="top" align="center">24.94%</td>
<td valign="top" align="center">-.96 (-1.00, -.92)</td>
</tr>
<tr>
<td valign="top" align="left">confusion</td>
<td valign="top" align="center">16.41%</td>
<td valign="top" align="center">-.93 (-1.00, -.85)</td>
</tr>
<tr>
<td valign="top" align="left">surprise</td>
<td valign="top" align="center">5.42%</td>
<td valign="top" align="center">.77 (.55,.95)</td>
</tr>
<tr>
<td valign="top" align="left">desire</td>
<td valign="top" align="center">4.72%</td>
<td valign="top" align="center">.84 (.65,.98)</td>
</tr>
<tr>
<td valign="top" align="left">joy</td>
<td valign="top" align="center">4.69%</td>
<td valign="top" align="center">.61 (.35,.85)</td>
</tr>
<tr>
<td valign="top" align="left">admiration</td>
<td valign="top" align="center">4.61%</td>
<td valign="top" align="center">.56 (.30,.81)</td>
</tr>
<tr>
<td valign="top" align="left">excitement</td>
<td valign="top" align="center">4.35%</td>
<td valign="top" align="center">.77 (.49,.98)</td>
</tr>
<tr>
<td valign="top" align="left">realization</td>
<td valign="top" align="center">4.02%</td>
<td valign="top" align="center">.65 (.36,.90)</td>
</tr>
<tr>
<td valign="top" align="left">anger</td>
<td valign="top" align="center">3.85%</td>
<td valign="top" align="center">-.37 (-.69, -.04)</td>
</tr>
<tr>
<td valign="top" align="left">disapproval</td>
<td valign="top" align="center">3.36%</td>
<td valign="top" align="center">-.35 (-.65, -.05)</td>
</tr>
<tr>
<td valign="top" align="left">amusement</td>
<td valign="top" align="center">3.02%</td>
<td valign="top" align="center">.62 (.35,.86)</td>
</tr>
<tr>
<td valign="top" align="left">annoyance</td>
<td valign="top" align="center">2.08%</td>
<td valign="top" align="center">.49 (.22,.78)</td>
</tr>
<tr>
<td valign="top" align="left">remorse</td>
<td valign="top" align="center">1.94%</td>
<td valign="top" align="center">.50 (.15,.80)</td>
</tr>
<tr>
<td valign="top" align="left">approval</td>
<td valign="top" align="center">1.62%</td>
<td valign="top" align="center">-.23 (-.46, -.05)</td>
</tr>
<tr>
<td valign="top" align="left">relief</td>
<td valign="top" align="center">1.57%</td>
<td valign="top" align="center">.48 (.20,.77)</td>
</tr>
<tr>
<td valign="top" align="left">optimism</td>
<td valign="top" align="center">1.43%</td>
<td valign="top" align="center">.05 (-.11,.28)</td>
</tr>
<tr>
<td valign="top" align="left">fear</td>
<td valign="top" align="center">1.40%</td>
<td valign="top" align="center">-.31 (-.55, -.08)</td>
</tr>
<tr>
<td valign="top" align="left">disappointment</td>
<td valign="top" align="center">1.34%</td>
<td valign="top" align="center">-.53 (-.77, -.25)</td>
</tr>
<tr>
<td valign="top" align="left">grief</td>
<td valign="top" align="center">1.08%</td>
<td valign="top" align="center">-.06 (-.31,.25)</td>
</tr>
<tr>
<td valign="top" align="left">neutral</td>
<td valign="top" align="center">1.08%</td>
<td valign="top" align="center">.16 (.01,.37)</td>
</tr>
<tr>
<td valign="top" align="left">love</td>
<td valign="top" align="center">1.07%</td>
<td valign="top" align="center">.44 (.15,.73)</td>
</tr>
<tr>
<td valign="top" align="left">disgust</td>
<td valign="top" align="center">1.06%</td>
<td valign="top" align="center">.40 (.15,.66)</td>
</tr>
<tr>
<td valign="top" align="left">nervousness</td>
<td valign="top" align="center">1.02%</td>
<td valign="top" align="center">.01 (-.21,.25)</td>
</tr>
<tr>
<td valign="top" align="left">caring</td>
<td valign="top" align="center">0.91%</td>
<td valign="top" align="center">.53 (.26,.80)</td>
</tr>
<tr>
<td valign="top" align="left">gratitude</td>
<td valign="top" align="center">0.88%</td>
<td valign="top" align="center">.06 (-.13,.30)</td>
</tr>
<tr>
<td valign="top" align="left">sadness</td>
<td valign="top" align="center">0.88%</td>
<td valign="top" align="center">.31 (.07,.61)</td>
</tr>
<tr>
<td valign="top" align="left">pride</td>
<td valign="top" align="center">0.82%</td>
<td valign="top" align="center">.07 (-.13,.31)</td>
</tr>
<tr>
<td valign="top" align="left">embarrassment</td>
<td valign="top" align="center">0.42%</td>
<td valign="top" align="center">.12 (-.03,.33)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>Our study served three purposes: First, we fine-tuned an LLM for the classification of 28 emotions in German. Second, we employed this model on a dataset of 553 psychotherapy transcripts to predict symptom severity and alliance. Third, we assessed the most important emotions for the predictions of symptom severity and alliance. Our results indicate a modest classification performance for our fine-tuned model with <italic>F1<sub>macro</sub>
</italic> = .45, which is almost identical to the original performance in English (<italic>F1<sub>macro</sub>
</italic> = .46), indicating no overall accuracy loss due to the translation. Looking at individual emotions, classification accuracy varied slightly, but was mostly similar between German and English (the largest decrease in <italic>F1<sub>macro</sub>
</italic> was .11). The Kappa value of .42 demonstrated moderate agreement, which is not surprising because of the inherent limitation of identifying emotions only via the transcript modality while ignoring other modalities such as voice intonation (audio; e.g., <xref ref-type="bibr" rid="B92">92</xref>) or facial expression (video; e.g., <xref ref-type="bibr" rid="B93">93</xref>). Therefore, the modest performance likely did result from the low inter-rater-reliability in the <italic>GoEmotions</italic> dataset (Cohen&#x2019;s Kappa ranging from .33 to .47). However, there was considerable variation regarding the model&#x2019;s Kappa values, ranging between .15 and .88. This seems logical since some emotions may be more clearly expressed via language content (e.g., <italic>admiration, amusement, fear</italic>) than others (e.g., <italic>disappointment, annoyance</italic>), which might be better captured via voice features or mimic.</p>
<p>Employing the fine-tuned model, we successfully predicted symptom severity (<italic>r</italic> = .50) and alliance (<italic>r</italic> = .20) from the transcripts. The accuracy was comparable to a different approach based on session content as operationalized by topic modeling of 250 topics (<xref ref-type="bibr" rid="B55">55</xref>). Emotions showed higher associations with symptom severity than a model based on 14 cognitive distortions (<italic>r</italic> = .33) or negative sentiment only <italic>r</italic> = .08, <xref ref-type="bibr" rid="B94">94</xref>). In contrast, Eberhardt et&#xa0;al. (<xref ref-type="bibr" rid="B60">60</xref>) found both within-person correlations for positive sentiment (<italic>r</italic> = &#x2212;.29) and large between-person correlations for negative sentiment (<italic>r</italic> = .66). However, these correlations must be interpreted with caution as they come from a small dataset (<italic>N</italic> = 79) and may not be stable (<xref ref-type="bibr" rid="B95">95</xref>).</p>
<p>Regarding symptom severity, negative emotions mainly predicted higher and positive emotions lower symptom severity, as expected. For negative emotions, the best predictors were <italic>anger</italic> and <italic>fear</italic>, which both come with high arousal. <italic>Anger</italic> may be associated with the HSCL-11 items agitation, low mood and feeling worthless (as it often was self-directed) while <italic>fear</italic> may be associated with various items of the HSCL-11, such as fearfulness, anxiousness, agitation, panic, and sleep problems. Surprisingly, the positive emotion a<italic>pproval</italic> had the highest effect, probably because it was simultaneously the most often detected emotion (13.0%). Though content-wise <italic>approval</italic> was a fuzzy concept with low reliability (<italic>Kappa</italic> = .29), it tended to be associated with statements of agreement, feasibility, and acceptance, which can be protective factors (<xref ref-type="bibr" rid="B14">14</xref>, <xref ref-type="bibr" rid="B96">96</xref>). <italic>Desire</italic> was associated with higher symptom severity, likely because it contained statements that indicated a present frustration or lack of something (e.g., desiring more sleep, a more accepting partner, or happiness). Regarding the sensitivity analysis for anxiety, we found the highest impact of the negative emotions <italic>fear, sadness</italic>, and <italic>nervousness</italic>, while <italic>approval</italic> was the positive emotion with the highest impact. For depression, <italic>approval</italic> also was the most important positive emotion, while <italic>sadness, grief</italic> and <italic>disappointment</italic> were the most important negative emotions.</p>
<p>For alliance, contrary to our expectations, only few negative emotions predicted lower alliance, while most positive emotions predicted higher alliance. However, as expected, the negative emotions with significant associations might have served as withdrawal (<italic>confusion</italic>) or confrontation markers (<italic>anger, disapproval</italic>). The negative association with <italic>curiosity</italic> was surprising, especially since it explained about a quarter of the model impact. Looking at the sentences that were classified as <italic>curiosity</italic>, it seemed as if they sometimes indicated a misunderstanding (e.g., &#x201c;<italic>So this is from my diagnosis</italic>?&#x201d;), frustration (&#x201c;<italic>And you&#x2019;re a psychologist, or what?&#x201d;</italic>), or confusion (&#x201c;<italic>What will happen to me then</italic>?&#x201d;). The positive impact of positive emotions was highlighted by the associations with <italic>desire, joy, admiration</italic>, and <italic>excitement</italic> in line with the literature (<xref ref-type="bibr" rid="B35">35</xref>).</p>
</sec>
<sec id="s5">
<title>Limitations and future directions</title>
<p>This analysis comes with several limitations. Regarding our transcript-based approach, the training data is not optimal, as it is based on a social media dataset containing comments with a length of only 3 to 30 words. As can be seen from <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>, the social media comments tended to be more informal and contained some slang. Also, the comments seemed more expressive and more intense, which could cause problems with the emotion detection. It would therefore be desirable to train models on labeled data from the relevant domain (i.e., therapy transcripts), incorporating longer and more complex statements, because domain specificity can improve model accuracy (<xref ref-type="bibr" rid="B56">56</xref>, <xref ref-type="bibr" rid="B97">97</xref>). Also, it would be desirable to have training set, which is better balanced across emotions, because some emotions (e.g., <italic>grief, pride, relief, nervousness, embarrassment</italic>; see <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>) hardly occur in the training data. This could lead the model to be biased against these emotions so that they may not be detected. In general, emotion detection could be improved by including other modalities, such as voice (<xref ref-type="bibr" rid="B92">92</xref>) or mimic via video (<xref ref-type="bibr" rid="B93">93</xref>) due to the superiority of a multimodal approach (<xref ref-type="bibr" rid="B98">98</xref>). Altogether, these approaches would likely improve the classification accuracy substantially.</p>
<p>Since some of the emotions (e.g., <italic>realization, approval</italic>) were only loosely connected to the psychological concept of emotions (<xref ref-type="bibr" rid="B2">2</xref>), future analyses could benefit from a clearer and more distinct definition of the included emotions. Further, clearly, the relationship between patient emotions and alliance is more complex than assumed in our hypotheses. On the one hand, it has been suggested that the effects of emotional arousal on outcome can be moderated by the alliance so that high arousal can be productive as long as there is a sufficiently strong alliance (<xref ref-type="bibr" rid="B8">8</xref>). On the other hand, the therapist may actively manage the alliance so that it may be soothing in the context of high arousal and activating and challenging in the context of (too) little arousal (<xref ref-type="bibr" rid="B8">8</xref>). Therefore, NLP could be incorporated to model the alliance over the course of a session to assess the dynamic interplay between emotions and alliance. This could be employed to give feedback to therapists after a session, highlighting moments where they could modulate the interaction to increase or decrease arousal. Another approach would be the integration of therapist emotions and therapist empathy into our model to assess which therapist emotions may be detrimental to the alliance.</p>
</sec>
<sec id="s6" sec-type="conclusions">
<title>Conclusion</title>
<p>In summary, our transcript-based model could classify 28 emotions with reasonable model-rater-agreement (<italic>F1</italic> = .45, <italic>Kappa</italic> = .42). Classification tended to be more reliable for positive emotions. The average detection probability ranged between 13% (<italic>approval</italic>) and 0.1% (<italic>grief</italic>). Substantial associations with symptom severity (<italic>r</italic> = .50) were found in the expected directions (i.e., positive emotions were associated with lower symptom severity and negative emotions with higher symptom severity) by selecting SVR and RF learners. Associations with alliance (<italic>r</italic> = .20) were lower and the selected learners were Lasso, Elastic Net, and RF. While many positive emotions predicted higher alliance, the results for negative emotions were mixed. Notably, negative emotions that could serve as withdrawal (<italic>confusion;</italic> 16% impact) or confrontation ruptures (<italic>anger, disapproval;</italic> together 7% impact) predicted lower alliance. In the future, this model opens a wide array of possibilities regarding process-outcome associations with emotional processes, such as analyzing the emotion dynamic over the course of a session or comparing patient with therapist emotions.</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are publicly available. Our fine-tuned LLM "German-Emotions", including some example code, is available via huggingface (<ext-link ext-link-type="uri" xlink:href="https://huggingface.co/ChrisLalk/German-Emotions">https://huggingface.co/ChrisLalk/German-Emotions</ext-link>). Complete code for model training and model inference is available via OSF (<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.17605/osf.io/AKF3H">https://doi.org/10.17605/osf.io/AKF3H</ext-link>). Our prediction model XRAI can be accessed via GitHub (<ext-link ext-link-type="uri" xlink:href="https://github.com/PsyRes-Osnabrueck-University/xrai">https://github.com/PsyRes-Osnabrueck-University/xrai</ext-link>). Our translated dataset can be accessed via OSF, including some labeled example statements (<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.17605/osf.io/AKF3H">https://doi.org/10.17605/osf.io/AKF3H</ext-link>). The original dataset can be accessed via <ext-link ext-link-type="uri" xlink:href="https://paperswithcode.com/dataset/goemotions">https://paperswithcode.com/dataset/goemotions</ext-link>.</p>
</sec>
<sec id="s8" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Ethics Committee of the University Trier. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s9" sec-type="author-contributions">
<title>Author contributions</title>
<p>CL: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Project administration, Writing - original draft, Writing - review &amp; editing. KT: Formal analysis, Methodology, Writing - review &amp; editing. TS: Formal analysis, Investigation, Writing - review &amp; editing. JS: Data curation, Resources, Writing - review &amp; editing. SE: Resources, Writing - review &amp; editing. BS: Writing - review &amp; editing. AV: Resources, Writing - review &amp; editing. WL: Data curation, Funding acquisition, Supervision, Writing - review &amp; editing. JR: Conceptualization, Methodology, Supervision, Writing - original draft, Writing - review &amp; editing.</p>
</sec>
<sec id="s10" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This study was supported by the German Research Foundation (DFG) under grant numbers LU 660/10-1, LU 660/16-1 and LU 660/20-1.</p>
</sec>
<sec id="s11" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be constructed as a potential conflict of interest.</p>
</sec>
<sec id="s12" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec id="s13" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s14" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpsyt.2025.1504306/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpsyt.2025.1504306/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="Table2.docx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
</sec>
<fn-group>
<fn id="fn1">
<label>1</label>
<p>N-grams refer to sets of <italic>n</italic> consecutive words in a corpus.</p>
</fn>
<fn id="fn2">
<label>2</label>
<p>One-Hot encoding is the transformation of categorial data into binary vectors for each category. Contrary to dummy encoding, there is no reference category.</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gross</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Mu&#xf1;oz</surname> <given-names>RF</given-names>
</name>
</person-group>. <article-title>Emotion regulation and mental health</article-title>. <source>Clin psychol: Sci Pract</source>. (<year>1995</year>) <volume>2</volume>:<fpage>151</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1468-2850.1995.tb00036.x</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ekman</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>An argument for basic emotions</article-title>. <source>Cogn Emotion</source>. (<year>1992</year>) <volume>6</volume>:<fpage>169</fpage>&#x2013;<lpage>200</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/02699939208411068</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gilbert</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>An evolutionary approach to emotion in mental health with a focus on affiliative emotions</article-title>. <source>Emotion Rev</source>. (<year>2015</year>) <volume>7</volume>:<page-range>230&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/1754073915576552</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Sell</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>The Evolutionary Psychology of Anger</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Kappelhoff</surname> <given-names>H</given-names>
</name>
<name>
<surname>Bakels</surname> <given-names>J-H</given-names>
</name>
<name>
<surname>Lehmann</surname> <given-names>H</given-names>
</name>
<name>
<surname>Schmitt</surname> <given-names>C</given-names>
</name>
</person-group>, editors. <source>Emotionen</source> (<year>2019</year>) <publisher-loc>Germany</publisher-loc>: <publisher-name>J.B. Metzler, Stuttgart</publisher-name>. p. <page-range>174&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-3-476-05353-4_25</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ekman</surname> <given-names>P</given-names>
</name>
<name>
<surname>Friesen</surname> <given-names>WV</given-names>
</name>
</person-group>. <source>Facial Action Coding System</source>. (<year>2019</year>) <publisher-loc>Palo Alto (Calif.)</publisher-loc>: <publisher-name>Consulting Psychologists Press</publisher-name>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/t27734-000</pub-id>.</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname> <given-names>T</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>D</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Mistry</surname> <given-names>R</given-names>
</name>
<name>
<surname>Ran</surname> <given-names>G</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
</person-group>. <article-title>Relation between emotion regulation and mental health: A meta-analysis review</article-title>. <source>psychol Rep</source>. (<year>2014</year>) <volume>114</volume>:<page-range>341&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2466/03.20.PR0.114k22w4</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Berking</surname> <given-names>M</given-names>
</name>
<name>
<surname>Wupperman</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Emotion regulation and mental health: Recent findings, current challenges, and future directions</article-title>. <source>Curr Opin Psychiatry</source>. (<year>2012</year>) <volume>25</volume>:<page-range>128&#x2013;34</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/YCO.0b013e3283503669</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Greenberg</surname> <given-names>LS</given-names>
</name>
<name>
<surname>Pascual-Leone</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Emotion in psychotherapy: A practice-friendly research review</article-title>. <source>J Clin Psychol</source>. (<year>2006</year>) <volume>62</volume>:<page-range>611&#x2013;30</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/jclp.20252</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beedie</surname> <given-names>C</given-names>
</name>
<name>
<surname>Terry</surname> <given-names>P</given-names>
</name>
<name>
<surname>Lane</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Distinctions between emotion and mood</article-title>. <source>Cogn Emotion</source>. (<year>2005</year>) <volume>19</volume>:<page-range>847&#x2013;78</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/02699930541000057</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beedie</surname> <given-names>CJ</given-names>
</name>
<name>
<surname>Terry</surname> <given-names>PC</given-names>
</name>
<name>
<surname>Lane</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Devonport</surname> <given-names>TJ</given-names>
</name>
</person-group>. <article-title>Differential assessment of emotions and moods: Development and validation of the Emotion and Mood Components of Anxiety Questionnaire</article-title>. <source>Pers Individ Dif</source>. (<year>2011</year>) <volume>50</volume>:<page-range>228&#x2013;33</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.paid.2010.09.034</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hofmann</surname> <given-names>SG</given-names>
</name>
<name>
<surname>Sawyer</surname> <given-names>AT</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>A</given-names>
</name>
<name>
<surname>Asnaani</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Emotion dysregulation model of mood and anxiety disorders</article-title>. <source>Depression Anxiety</source>. (<year>2012</year>) <volume>29</volume>:<page-range>409&#x2013;16</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/da.21888</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boumparis</surname> <given-names>N</given-names>
</name>
<name>
<surname>Karyotaki</surname> <given-names>E</given-names>
</name>
<name>
<surname>Kleiboer</surname> <given-names>A</given-names>
</name>
<name>
<surname>Hofmann</surname> <given-names>SG</given-names>
</name>
<name>
<surname>Cuijpers</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>The effect of psychotherapeutic interventions on positive and negative affect in depression: A systematic review and meta-analysis</article-title>. <source>J Affect Disord</source>. (<year>2016</year>) <volume>202</volume>:<page-range>153&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jad.2016.05.019</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fredrickson</surname> <given-names>BL</given-names>
</name>
</person-group>. <article-title>The broaden&#x2013;and&#x2013;build theory of positive emotions</article-title>. <source>Philos Trans R Soc London Ser B: Biol Sci</source>. (<year>2004</year>) <volume>359</volume>:<page-range>1367&#x2013;77</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1098/rstb.2004.1512</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lindahl</surname> <given-names>M</given-names>
</name>
<name>
<surname>Archer</surname> <given-names>T</given-names>
</name>
</person-group>. <article-title>Depressive expression and anti-depressive protection in adolescence: stress, positive affect, motivation and self-efficacy</article-title>. <source>Psychology</source>. (<year>2013</year>) <volume>04</volume>:<fpage>495</fpage>&#x2013;<lpage>505</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4236/psych.2013.46070</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hart</surname> <given-names>SL</given-names>
</name>
<name>
<surname>Vella</surname> <given-names>L</given-names>
</name>
<name>
<surname>Mohr</surname> <given-names>DC</given-names>
</name>
</person-group>. <article-title>Relationships among depressive symptoms, benefit-finding, optimism, and positive affect in multiple sclerosis patients after psychotherapy for depression</article-title>. <source>Health Psychol</source>. (<year>2008</year>) <volume>27</volume>:<page-range>230&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/0278-6133.27.2.230</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Clark</surname> <given-names>LA</given-names>
</name>
<name>
<surname>Watson</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>Tripartite model of anxiety and depression: Psychometric evidence and taxonomic implications</article-title>. <source>J Abnormal Psychol</source>. (<year>1991</year>) <volume>100</volume>:<fpage>316</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/0021-843X.100.3.316</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Watson</surname> <given-names>D</given-names>
</name>
<name>
<surname>Clark</surname> <given-names>LA</given-names>
</name>
<name>
<surname>Tellegen</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Development and validation of brief measures of positive and negative affect: The PANAS scales</article-title>. <source>J Pers Soc Psychol</source>. (<year>1988</year>) <volume>54</volume>:<page-range>1063&#x2013;70</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/0022-3514.54.6.1063</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dua</surname> <given-names>JK</given-names>
</name>
</person-group>. <article-title>The role of negative affect and positive affect in stress, depression, self-esteem, assertiveness, Type A behaviors, psychological health, and physical health</article-title>. <source>Genetic social Gen Psychol Monogr</source>. (<year>1993</year>) <volume>119</volume>:<page-range>515&#x2013;52</page-range>.</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kirkegaard Thomsen</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>The association between rumination and negative affect: A review</article-title>. <source>Cogn Emotion</source>. (<year>2006</year>) <volume>20</volume>:<page-range>1216&#x2013;35</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/02699930500473533</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Panaite</surname> <given-names>V</given-names>
</name>
<name>
<surname>Rottenberg</surname> <given-names>J</given-names>
</name>
<name>
<surname>Bylsma</surname> <given-names>LM</given-names>
</name>
</person-group>. <article-title>Daily affective dynamics predict depression symptom trajectories among adults with major and minor depression</article-title>. <source>Affect Sci</source>. (<year>2020</year>) <volume>1</volume>:<page-range>186&#x2013;98</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s42761-020-00014-w</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname> <given-names>JR</given-names>
</name>
<name>
<surname>Thakur</surname> <given-names>H</given-names>
</name>
<name>
<surname>Young</surname> <given-names>JF</given-names>
</name>
<name>
<surname>Hankin</surname> <given-names>BL</given-names>
</name>
</person-group>. <article-title>The development and validation of an algorithm to predict future depression onset in unselected youth</article-title>. <source>psychol Med</source>. (<year>2020</year>) <volume>50</volume>:<page-range>2548&#x2013;56</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1017/S0033291719002691</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fl&#xfc;ckiger</surname> <given-names>C</given-names>
</name>
<name>
<surname>Del Re</surname> <given-names>AC</given-names>
</name>
<name>
<surname>Wampold</surname> <given-names>BE</given-names>
</name>
<name>
<surname>Horvath</surname> <given-names>AO</given-names>
</name>
</person-group>. <article-title>The alliance in adult psychotherapy: A meta-analytic synthesis</article-title>. <source>Psychotherapy</source>. (<year>2018</year>) <volume>55</volume>:<page-range>316&#x2013;40</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/pst0000172</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Fitness</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Emotions in relationships</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Mikulincer</surname> <given-names>M</given-names>
</name>
<name>
<surname>Shaver</surname> <given-names>PR</given-names>
</name>
<name>
<surname>Simpson</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Dovidio</surname> <given-names>JF</given-names>
</name>
</person-group>, editors. <source>APA handbook of personality and social psychology, Volume 3: Interpersonal relations</source>. <publisher-name>American Psychological Association</publisher-name> (<year>2015</year>). p. <fpage>297</fpage>&#x2013;<lpage>318</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/14344-011</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Clark</surname> <given-names>MS</given-names>
</name>
<name>
<surname>Fitness</surname> <given-names>J</given-names>
</name>
<name>
<surname>Brissette</surname> <given-names>I</given-names>
</name>
</person-group>. <article-title>Understanding people&#x2019;s perceptions of relationships is crucial to understanding their emotional lives</article-title>. <source>Blackwell Handb Soc psychol: Interpersonal processes</source>. (<year>2001</year>) <volume>2</volume>:<page-range>253&#x2013;78</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/9780470998557.ch10</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Beach</surname> <given-names>SRH</given-names>
</name>
<name>
<surname>Fincham</surname> <given-names>FD</given-names>
</name>
</person-group>. <article-title>Toward an Integrated Model of Negative Affectivity in Marriage</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Johnson</surname> <given-names>SM</given-names>
</name>
<name>
<surname>Greenberg</surname> <given-names>LS</given-names>
</name>
</person-group>, editors. <source>The Heart of the Matter: Perspectives on Emotion in Marital Therapy</source>. <publisher-loc>New York, New York</publisher-loc>: <publisher-name>Brunner/Mazel</publisher-name> (<year>1994</year>). p. <page-range>227&#x2013;55</page-range>.</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Gottman</surname> <given-names>JM</given-names>
</name>
</person-group>. <source>What Predicts Divorce? The Relationship Between Marital Processes and Marital Outcomes</source>. <publisher-loc>Mahwah, New Jersey</publisher-loc>: <publisher-name>Lawrence Erlbaum Associates, Inc</publisher-name> (<year>1994</year>).</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iwakabe</surname> <given-names>S</given-names>
</name>
<name>
<surname>Rogan</surname> <given-names>K</given-names>
</name>
<name>
<surname>Stalikas</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>The relationship between client emotional expressions, therapist interventions, and the working alliance: an exploration of eight emotional expression events</article-title>. <source>J Psychother Integration</source>. (<year>2000</year>) <volume>10</volume>:<fpage>375</fpage>&#x2013;<lpage>401</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1009479100305</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Safran</surname> <given-names>JD</given-names>
</name>
</person-group>. <article-title>Towards a refinement of cognitive therapy in light of interpersonal theory: I. Theory</article-title>. <source>Clin Psychol Rev</source>. (<year>1990</year>) <volume>10</volume>:<fpage>87</fpage>&#x2013;<lpage>105</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0272-7358(90)90108-M</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kupferberg</surname> <given-names>A</given-names>
</name>
<name>
<surname>Hasler</surname> <given-names>G</given-names>
</name>
</person-group>. <article-title>The social cost of depression: Investigating the impact of impaired social emotion regulation, social cognition, and interpersonal behavior on social functioning</article-title>. <source>J Affect Disord Rep</source>. (<year>2023</year>) <volume>14</volume>:<elocation-id>100631</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jadr.2023.100631</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eubanks</surname> <given-names>CF</given-names>
</name>
<name>
<surname>Lubitz</surname> <given-names>J</given-names>
</name>
<name>
<surname>Muran</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Safran</surname> <given-names>JD</given-names>
</name>
</person-group>. <article-title>Rupture resolution rating system (3RS): development and validation</article-title>. <source>Psychother Res</source>. (<year>2019</year>) <volume>29</volume>:<page-range>306&#x2013;19</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10503307.2018.1552034</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Black</surname> <given-names>RSA</given-names>
</name>
<name>
<surname>Curran</surname> <given-names>D</given-names>
</name>
<name>
<surname>Dyer</surname> <given-names>KFW</given-names>
</name>
</person-group>. <article-title>The impact of shame on the therapeutic alliance and intimate relationships: shame, therapeutic alliance, and intimate relationships</article-title>. <source>J Clin Psychol</source>. (<year>2013</year>) <volume>69</volume>:<page-range>646&#x2013;54</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/jclp.21959</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bartholomew</surname> <given-names>TT</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>E</given-names>
</name>
<name>
<surname>Joy</surname> <given-names>EE</given-names>
</name>
<name>
<surname>Robbins</surname> <given-names>KA</given-names>
</name>
<name>
<surname>Maldonado-Agui&#xf1;iga</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Clients&#x2019; perceptions of the working alliance as a predictor of increases in positive affect</article-title>. <source>J Psychother Integration</source>. (<year>2022</year>) <volume>32</volume>:<page-range>310&#x2013;25</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/int0000265</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fitzpatrick</surname> <given-names>MR</given-names>
</name>
<name>
<surname>Janzen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Chamodraka</surname> <given-names>M</given-names>
</name>
<name>
<surname>Park</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Client critical incidents in the process of early alliance development: A positive emotion&#x2013;exploration spiral</article-title>. <source>Psychother Res</source>. (<year>2006</year>) <volume>16</volume>:<page-range>486&#x2013;98</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10503300500485391</pub-id>
</citation>
</ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Notsu</surname> <given-names>H</given-names>
</name>
<name>
<surname>Iwakabe</surname> <given-names>S</given-names>
</name>
<name>
<surname>Thoma</surname> <given-names>NC</given-names>
</name>
</person-group>. <article-title>Enhancing working alliance through positive emotional experience: A cross-lag analysis</article-title>. <source>Psychother Res</source>. (<year>2023</year>) <volume>33</volume>:<page-range>328&#x2013;41</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10503307.2022.2124893</pub-id>
</citation>
</ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sels</surname> <given-names>L</given-names>
</name>
<name>
<surname>Tran</surname> <given-names>A</given-names>
</name>
<name>
<surname>Greenaway</surname> <given-names>KH</given-names>
</name>
<name>
<surname>Verhofstadt</surname> <given-names>L</given-names>
</name>
<name>
<surname>Kalokerinos</surname> <given-names>EK</given-names>
</name>
</person-group>. <article-title>The social functions of positive emotions</article-title>. <source>Curr Opin Behav Sci</source>. (<year>2021</year>) <volume>39</volume>:<page-range>41&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cobeha.2020.12.009</pub-id>
</citation>
</ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bordin</surname> <given-names>ES</given-names>
</name>
</person-group>. <article-title>The generalizability of the psychoanalytic concept of the working alliance</article-title>. <source>Psychother: Theory Res Pract</source>. (<year>1979</year>) <volume>16</volume>:<page-range>252&#x2013;60</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/h0085885</pub-id>
</citation>
</ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baumeister</surname> <given-names>RF</given-names>
</name>
<name>
<surname>Bratslavsky</surname> <given-names>E</given-names>
</name>
<name>
<surname>Finkenauer</surname> <given-names>C</given-names>
</name>
<name>
<surname>Vohs</surname> <given-names>KD</given-names>
</name>
</person-group>. <article-title>Bad is stronger than good</article-title>. <source>Rev Gen Psychol</source>. (<year>2001</year>) <volume>5</volume>:<page-range>323&#x2013;70</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/1089-2680.5.4.323</pub-id>
</citation>
</ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>H</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Kong</surname> <given-names>X</given-names>
</name>
</person-group>. <article-title>Review on emotion recognition based on electroencephalography</article-title>. <source>Front Comput Neurosci</source>. (<year>2021</year>) <volume>15</volume>:<elocation-id>758212</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fncom.2021.758212</pub-id>
</citation>
</ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Egger</surname> <given-names>M</given-names>
</name>
<name>
<surname>Ley</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hanke</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Emotion recognition from physiological signal analysis: A review</article-title>. <source>Electronic Notes Theor Comput Sci</source>. (<year>2019</year>) <volume>343</volume>:<fpage>35</fpage>&#x2013;<lpage>55</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.entcs.2019.04.009</pub-id>
</citation>
</ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pepa</surname> <given-names>L</given-names>
</name>
<name>
<surname>Spalazzi</surname> <given-names>L</given-names>
</name>
<name>
<surname>Capecci</surname> <given-names>M</given-names>
</name>
<name>
<surname>Ceravolo</surname> <given-names>MG</given-names>
</name>
</person-group>. <article-title>Automatic emotion recognition in clinical scenario: A systematic review of methods</article-title>. <source>IEEE Trans Affect Computing</source>. (<year>2023</year>) <volume>14</volume>:<page-range>1675&#x2013;95</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TAFFC.2021.3128787</pub-id>
</citation>
</ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saxena</surname> <given-names>A</given-names>
</name>
<name>
<surname>Khanna</surname> <given-names>A</given-names>
</name>
<name>
<surname>Gupta</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>Emotion recognition and detection methods: A comprehensive survey</article-title>. <source>J Artif Intell Syst</source>. (<year>2020</year>) <volume>2</volume>:<fpage>53</fpage>&#x2013;<lpage>79</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.33969/AIS.2020.21005</pub-id>
</citation>
</ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahmed</surname> <given-names>Md.ZI</given-names>
</name>
<name>
<surname>Sinha</surname> <given-names>N</given-names>
</name>
<name>
<surname>Ghaderpour</surname> <given-names>E</given-names>
</name>
<name>
<surname>Phadikar</surname> <given-names>S</given-names>
</name>
<name>
<surname>Ghosh</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>A novel baseline removal paradigm for subject-independent features in emotion classification using EEG</article-title>. <source>Bioengineering</source>. (<year>2023</year>) <volume>10</volume>:<elocation-id>54</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/bioengineering10010054</pub-id>
</citation>
</ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ryumina</surname> <given-names>E</given-names>
</name>
<name>
<surname>Dresvyanskiy</surname> <given-names>D</given-names>
</name>
<name>
<surname>Karpov</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>In search of a robust facial expressions recognition model: A large-scale visual cross-corpus study</article-title>. <source>Neurocomputing</source>. (<year>2022</year>) <volume>514</volume>:<page-range>435&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.neucom.2022.10.013</pub-id>
</citation>
</ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baevski</surname> <given-names>A</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>H</given-names>
</name>
<name>
<surname>Mohamed</surname> <given-names>A</given-names>
</name>
<name>
<surname>Auli</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>
<italic>wav2vec 2.0: A framework for self-supervised learning of speech representations</italic> (arXiv:2006.11477)</article-title>. <source>arXiv</source>. (<year>2020</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arXiv.2006.11477</pub-id>
</citation>
</ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nasersharif</surname> <given-names>B</given-names>
</name>
<name>
<surname>Namvarpour</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Exploring the potential of Wav2vec 2.0 for speech emotion recognition using classifier combination and attention-based feature fusion</article-title>. <source>J Supercomputing</source>. (<year>2024</year>) <volume>80</volume>:<page-range>23667&#x2013;88</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11227-024-06158-x</pub-id>
</citation>
</ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rozado</surname> <given-names>D</given-names>
</name>
<name>
<surname>Hughes</surname> <given-names>R</given-names>
</name>
<name>
<surname>Halberstadt</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Longitudinal analysis of sentiment and emotion in news media headlines using automated labelling with Transformer language models</article-title>. <source>PloS One</source>. (<year>2022</year>) <volume>17</volume>:<elocation-id>e0276367</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0276367</pub-id>
</citation>
</ref>
<ref id="B47">
<label>47</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Caschera</surname> <given-names>MC</given-names>
</name>
<name>
<surname>Grifoni</surname> <given-names>P</given-names>
</name>
<name>
<surname>Ferri</surname> <given-names>F</given-names>
</name>
</person-group>. <article-title>Emotion classification from speech and text in videos using a multimodal approach</article-title>. <source>Multimodal Technol Interaction</source>. (<year>2022</year>) <volume>6</volume>:<fpage>Article 4</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/mti6040028</pub-id>
</citation>
</ref>
<ref id="B48">
<label>48</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sloan</surname> <given-names>DM</given-names>
</name>
<name>
<surname>Kring</surname> <given-names>AM</given-names>
</name>
</person-group>. <article-title>Measuring changes in emotion during psychotherapy: Conceptual and methodological issues</article-title>. <source>Clin Psychol: Sci Pract</source>. (<year>2007</year>) <volume>14</volume>:<page-range>307&#x2013;22</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1468-2850.2007.00092.x</pub-id>
</citation>
</ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Greenberg</surname> <given-names>LS</given-names>
</name>
<name>
<surname>Auszra</surname> <given-names>L</given-names>
</name>
<name>
<surname>Herrmann</surname> <given-names>IR</given-names>
</name>
</person-group>. <article-title>The relationship among emotional productivity, emotional arousal and outcome in experiential therapy of depression</article-title>. <source>Psychother Res</source>. (<year>2007</year>) <volume>17</volume>:<page-range>482&#x2013;93</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10503300600977800</pub-id>
</citation>
</ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>MaChado</surname> <given-names>PPP</given-names>
</name>
<name>
<surname>Beutler</surname> <given-names>LE</given-names>
</name>
<name>
<surname>Greenberg</surname> <given-names>LS</given-names>
</name>
</person-group>. <article-title>Emotion recognition in psychotherapy: Impact of therapist level of experience and emotional awareness</article-title>. <source>J Clin Psychol</source>. (<year>1999</year>) <volume>55</volume>:<fpage>39</fpage>&#x2013;<lpage>57</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/(SICI)1097-4679(199901)55:1&lt;39::AID-JCLP4&gt;3.0.CO;2-V</pub-id>
</citation>
</ref>
<ref id="B51">
<label>51</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Chowdhary</surname> <given-names>KR</given-names>
</name>
</person-group>. <article-title>Natural Language Processing</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Chowdhary</surname> <given-names>KR</given-names>
</name>
</person-group>, editor. <source>Fundamentals of Artificial Intelligence</source>. <publisher-name>Springer</publisher-name>, <publisher-loc>India</publisher-loc> (<year>2020</year>). p. <page-range>603&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-81-322-3972-7_19</pub-id>
</citation>
</ref>
<ref id="B52">
<label>52</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiao</surname> <given-names>B</given-names>
</name>
<name>
<surname>Imel</surname> <given-names>ZE</given-names>
</name>
<name>
<surname>Georgiou</surname> <given-names>PG</given-names>
</name>
<name>
<surname>Atkins</surname> <given-names>DC</given-names>
</name>
<name>
<surname>Narayanan</surname> <given-names>SS</given-names>
</name>
</person-group>. <article-title>&#x201c; Rate my therapist&#x201d;: Automated detection of empathy in drug and alcohol counseling via speech and language processing</article-title>. <source>PloS One</source>. (<year>2015</year>) <volume>10</volume>:<elocation-id>e0143055</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0143055</pub-id>
</citation>
</ref>
<ref id="B53">
<label>53</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Imel</surname> <given-names>ZE</given-names>
</name>
<name>
<surname>Pace</surname> <given-names>BT</given-names>
</name>
<name>
<surname>Soma</surname> <given-names>CS</given-names>
</name>
<name>
<surname>Tanana</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hirsch</surname> <given-names>T</given-names>
</name>
<name>
<surname>Gibson</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Design feasibility of an automated, machine-learning based feedback system for motivational interviewing</article-title>. <source>Psychotherapy</source>. (<year>2019</year>) <volume>56</volume>:<page-range>318&#x2013;28</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/pst0000221</pub-id>
</citation>
</ref>
<ref id="B54">
<label>54</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Atzil-Slonim</surname> <given-names>D</given-names>
</name>
<name>
<surname>Juravski</surname> <given-names>D</given-names>
</name>
<name>
<surname>Bar-Kalifa</surname> <given-names>E</given-names>
</name>
<name>
<surname>Gilboa-Schechtman</surname> <given-names>E</given-names>
</name>
<name>
<surname>Tuval-Mashiach</surname> <given-names>R</given-names>
</name>
<name>
<surname>Shapira</surname> <given-names>N</given-names>
</name>
<etal/>
</person-group>. <article-title>Using topic models to identify clients&#x2019; functioning levels and alliance ruptures in psychotherapy</article-title>. <source>Psychotherapy</source>. (<year>2021</year>) <volume>58</volume>(<issue>2</issue>):<page-range>324&#x2013;339</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/pst0000362</pub-id>
</citation>
</ref>
<ref id="B55">
<label>55</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lalk</surname> <given-names>C</given-names>
</name>
<name>
<surname>Steinbrenner</surname> <given-names>T</given-names>
</name>
<name>
<surname>Kania</surname> <given-names>W</given-names>
</name>
<name>
<surname>Popko</surname> <given-names>A</given-names>
</name>
<name>
<surname>Wester</surname> <given-names>R</given-names>
</name>
<name>
<surname>Schaffrath</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Measuring alliance and symptom severity in psychotherapy transcripts using bert topic modeling</article-title>. <source>Administration Policy Ment Health Ment Health Serv Res</source>. (<year>2024</year>) <volume>51</volume>:<page-range>509&#x2013;24</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10488-024-01356-4</pub-id>
</citation>
</ref>
<ref id="B56">
<label>56</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Tanana</surname> <given-names>M</given-names>
</name>
<name>
<surname>Dembe</surname> <given-names>A</given-names>
</name>
<name>
<surname>Soma</surname> <given-names>CS</given-names>
</name>
<name>
<surname>Imel</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Atkins</surname> <given-names>D</given-names>
</name>
<name>
<surname>Srikumar</surname> <given-names>V</given-names>
</name>
</person-group>. (<year>2016</year>). <article-title>Is sentiment in movies the same as sentiment in psychotherapy? Comparisons using a new psychotherapy sentiment database</article-title>, in: <conf-name>Proceedings of the Third Workshop on Computational Lingusitics and Clinical Psychology</conf-name>, <publisher-loc>San Diego, CA, USA</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name>. pp. <fpage>33</fpage>&#x2013;<lpage>41</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.18653/v1/W16-0304</pub-id>
</citation>
</ref>
<ref id="B57">
<label>57</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Devlin</surname> <given-names>J</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>M-W</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>K</given-names>
</name>
<name>
<surname>Toutanova</surname> <given-names>K</given-names>
</name>
</person-group>. <article-title>
<italic>BERT: pre-training of deep bidirectional transformers for language understanding</italic> (arXiv:1810.04805)</article-title>. <source>arXiv</source>. (<year>2019</year>)</citation>
</ref>
<ref id="B58">
<label>58</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tausczik</surname> <given-names>YR</given-names>
</name>
<name>
<surname>Pennebaker</surname> <given-names>JW</given-names>
</name>
</person-group>. <article-title>The psychological meaning of words: LIWC and computerized text analysis methods</article-title>. <source>J Lang Soc Psychol</source>. (<year>2010</year>) <volume>29</volume>:<fpage>24</fpage>&#x2013;<lpage>54</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/0261927X09351676</pub-id>
</citation>
</ref>
<ref id="B59">
<label>59</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tanana</surname> <given-names>MJ</given-names>
</name>
<name>
<surname>Soma</surname> <given-names>CS</given-names>
</name>
<name>
<surname>Kuo</surname> <given-names>PB</given-names>
</name>
<etal/>
</person-group>. <article-title>How do you feel? Using natural language processing to automatically rate emotion in psychotherapy</article-title>. <source>Behav Res</source>. (<year>2017</year>) <volume>53</volume>:<page-range>2069&#x2013;82</page-range>. doi:<pub-id pub-id-type="doi">10.3758/s13428-020-01531-z</pub-id>
</citation>
</ref>
<ref id="B60">
<label>60</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eberhardt</surname> <given-names>ST</given-names>
</name>
<name>
<surname>Schaffrath</surname> <given-names>J</given-names>
</name>
<name>
<surname>Moggia</surname> <given-names>D</given-names>
</name>
<name>
<surname>Schwartz</surname> <given-names>B</given-names>
</name>
<name>
<surname>Jaehde</surname> <given-names>M</given-names>
</name>
<name>
<surname>Rubel</surname> <given-names>JA</given-names>
</name>
<etal/>
</person-group>. <article-title>Decoding emotions: Exploring the validity of sentiment analysis in psychotherapy</article-title>. <source>Psychother Res</source>. (<year>2024</year>) <volume>35</volume>(<issue>2</issue>):<fpage>174</fpage>&#x2013;<lpage>89</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10503307.2024.2322522</pub-id>
</citation>
</ref>
<ref id="B61">
<label>61</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>First</surname> <given-names>MB</given-names>
</name>
<name>
<surname>Gibbon</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>The Structured Clinical Interview for DSM-IV Axis I Disorders (SCID-I) and the Structured Clinical Interview for DSM-IV Axis II Disorders (SCID-II)</article-title>. In: <source>Comprehensive handbook of psychological assessment, Vol. 2: Personality assessment</source>. <publisher-loc>Hoboken, New Jersey</publisher-loc>: <publisher-name>John Wiley &amp; Sons, Inc</publisher-name> (<year>2004</year>). p. <page-range>134&#x2013;43</page-range>.</citation>
</ref>
<ref id="B62">
<label>62</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lutz</surname> <given-names>W</given-names>
</name>
<name>
<surname>Tholen</surname> <given-names>S</given-names>
</name>
<name>
<surname>Sch&#xfc;rch</surname> <given-names>E</given-names>
</name>
<name>
<surname>Berking</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Reliabilit&#xe4;t von Kurzformen g&#xe4;ngiger psychometrischer Instrumente zur Evaluation des therapeutischen Fortschritts in Psychotherapie und Psychiatrie</article-title>. <source>Diagnostica</source>. (<year>2006</year>) <volume>52</volume>:<fpage>11</fpage>&#x2013;<lpage>25</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1026/0012-1924.52.1.11</pub-id>
</citation>
</ref>
<ref id="B63">
<label>63</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lutz</surname> <given-names>W</given-names>
</name>
<name>
<surname>de Jong</surname> <given-names>K</given-names>
</name>
<name>
<surname>Rubel</surname> <given-names>R</given-names>
</name>
<name>
<surname>Delgadillo</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Measuring, predicting and tracking change in psychotherapy</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Barkham</surname> <given-names>M</given-names>
</name>
<name>
<surname>Lutz</surname> <given-names>W</given-names>
</name>
<name>
<surname>Castonguay</surname> <given-names>LG</given-names>
</name>
</person-group>, editors. <source>Bergin &amp; Garfield&#x2019;s handbook of psychotherapy and behavior change (7. Aufl.)</source>. <publisher-loc>Hoboken, New Jersey</publisher-loc>: <publisher-name>Wiley</publisher-name> (<year>2021</year>).</citation>
</ref>
<ref id="B64">
<label>64</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Derogatis</surname> <given-names>LR</given-names>
</name>
<name>
<surname>Melisaratos</surname> <given-names>N</given-names>
</name>
</person-group>. <article-title>The Brief Symptom Inventory: An introductory report</article-title>. <source>psychol Med</source>. (<year>1983</year>) <volume>13</volume>:<fpage>595</fpage>&#x2013;<lpage>605</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1017/S0033291700048017</pub-id>
</citation>
</ref>
<ref id="B65">
<label>65</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kroenke</surname> <given-names>K</given-names>
</name>
<name>
<surname>Spitzer</surname> <given-names>RL</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>JB</given-names>
</name>
</person-group>. <article-title>The PHQ-9: Validity of a brief depression severity measure</article-title>. <source>J Gen Internal Med</source>. (<year>2001</year>) <volume>16</volume>:<page-range>606&#x2013;13</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1046/j.1525-1497.2001.016009606.x</pub-id>
</citation>
</ref>
<ref id="B66">
<label>66</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Spitzer</surname> <given-names>RL</given-names>
</name>
<name>
<surname>Kroenke</surname> <given-names>K</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>JBW</given-names>
</name>
<name>
<surname>L&#xf6;we</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>A brief measure for assessing generalized anxiety disorder: the GAD-7</article-title>. <source>Arch Internal Med</source>. (<year>2006</year>) <volume>166</volume>:<elocation-id>1092</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/archinte.166.10.1092</pub-id>
</citation>
</ref>
<ref id="B67">
<label>67</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rubel</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Rosenbaum</surname> <given-names>D</given-names>
</name>
<name>
<surname>Lutz</surname> <given-names>W</given-names>
</name>
</person-group>. <article-title>Patients&#x2019; in-session experiences and symptom change: Session-to-session effects on a within- and between-patient level</article-title>. <source>Behav Res Ther</source>. (<year>2017</year>) <volume>90</volume>:<fpage>58</fpage>&#x2013;<lpage>66</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.brat.2016.12.007</pub-id>
</citation>
</ref>
<ref id="B68">
<label>68</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hayes</surname> <given-names>AF</given-names>
</name>
<name>
<surname>Coutts</surname> <given-names>JJ</given-names>
</name>
</person-group>. <article-title>Use omega rather than cronbach&#x2019;s alpha for estimating reliability. But&#x2026;</article-title>. <source>Communication Methods Measures</source>. (<year>2020</year>) <volume>14</volume>:<fpage>1</fpage>&#x2013;<lpage>24</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/19312458.2020.1718629</pub-id>
</citation>
</ref>
<ref id="B69">
<label>69</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Duncan</surname> <given-names>BL</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>SD</given-names>
</name>
<name>
<surname>Sparks</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Claud</surname> <given-names>DA</given-names>
</name>
<name>
<surname>Reynolds</surname> <given-names>LR</given-names>
</name>
<name>
<surname>Brown</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>The Session Rating Scale: Preliminary psychometric properties of a &#x201c;working&#x201d; alliance measure</article-title>. <source>J Brief Ther</source>. (<year>2003</year>) <volume>3</volume>:<fpage>3</fpage>&#x2013;<lpage>12</lpage>.</citation>
</ref>
<ref id="B70">
<label>70</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Murphy</surname> <given-names>MG</given-names>
</name>
<name>
<surname>Rakes</surname> <given-names>S</given-names>
</name>
<name>
<surname>Harris</surname> <given-names>RM</given-names>
</name>
</person-group>. <article-title>The psychometric properties of the session rating scale: A narrative review</article-title>. <source>J Evidence-Based Soc Work</source>. (<year>2020</year>) <volume>17</volume>:<page-range>279&#x2013;99</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/26408066.2020.1729281</pub-id>
</citation>
</ref>
<ref id="B71">
<label>71</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reese</surname> <given-names>RJ</given-names>
</name>
<name>
<surname>Slone</surname> <given-names>NC</given-names>
</name>
<name>
<surname>Miserocchi</surname> <given-names>KM</given-names>
</name>
</person-group>. <article-title>Using client feedback in psychotherapy from an interpersonal process perspective</article-title>. <source>Psychotherapy</source>. (<year>2013</year>) <volume>50</volume>:<page-range>288&#x2013;91</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/a0032522</pub-id>
</citation>
</ref>
<ref id="B72">
<label>72</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Demszky</surname> <given-names>D</given-names>
</name>
<name>
<surname>Movshovitz-Attias</surname> <given-names>D</given-names>
</name>
<name>
<surname>Ko</surname> <given-names>J</given-names>
</name>
<name>
<surname>Cowen</surname> <given-names>A</given-names>
</name>
<name>
<surname>Nemade</surname> <given-names>G</given-names>
</name>
<name>
<surname>Ravi</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>
<italic>GoEmotions: A dataset of fine-grained emotions</italic> (Version 2)</article-title>. <source>arXiv</source>. (<year>2020</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.48550/ARXIV.2005.00547</pub-id>
</citation>
</ref>
<ref id="B73">
<label>73</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Conneau</surname> <given-names>A</given-names>
</name>
<name>
<surname>Khandelwal</surname> <given-names>K</given-names>
</name>
<name>
<surname>Goyal</surname> <given-names>N</given-names>
</name>
<name>
<surname>Chaudhary</surname> <given-names>V</given-names>
</name>
<name>
<surname>Wenzek</surname> <given-names>G</given-names>
</name>
<name>
<surname>Guzm&#xe1;n</surname> <given-names>F</given-names>
</name>
<etal/>
</person-group>. <article-title>
<italic>Unsupervised cross-lingual representation learning at scale</italic> (Version 2)</article-title>. <source>arXiv</source>. (<year>2019</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.48550/ARXIV.1911.02116</pub-id>
</citation>
</ref>
<ref id="B74">
<label>74</label>
<citation citation-type="web">
<person-group person-group-type="author">
<collab>DeepL</collab>
</person-group>. <article-title>DeepL</article-title> (<year>2024</year>). Available online at: <uri xlink:href="https://www.deepl.com/de/translator">https://www.deepl.com/de/translator</uri> (Accessed August 1, 2024).</citation>
</ref>
<ref id="B75">
<label>75</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lalk</surname> <given-names>C</given-names>
</name>
<name>
<surname>Targan</surname> <given-names>K</given-names>
</name>
<name>
<surname>Steinbrenner</surname> <given-names>T</given-names>
</name>
<name>
<surname>Schaffrath</surname> <given-names>J</given-names>
</name>
<name>
<surname>Eberhardt</surname> <given-names>ST</given-names>
</name>
<name>
<surname>Schwartz</surname> <given-names>B</given-names>
</name>
<etal/>
</person-group>. <source>Employing Large Language Models for Emotion Detection in Psychotherapy Transcripts: Supplementary Data</source>. (<year>2025</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.17605/OSF.IO/AKF3H</pub-id>.</citation>
</ref>
<ref id="B76">
<label>76</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lhoest</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Moral</surname> <given-names>AV</given-names>
</name>
<name>
<surname>von</surname> <given-names>P</given-names>
</name>
<name>
<surname>Wolf</surname> <given-names>T</given-names>
</name>
<name>
<surname>&#x160;a&#x161;ko</surname> <given-names>M</given-names>
</name>
<name>
<surname>Jernite</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <source>
<italic>huggingface/datasets: 2.8.0</italic> (Version 2.8.0) [Software]</source>. <publisher-name>Zenodo</publisher-name> (<year>2022</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.5281/zenodo.7457269</pub-id>
</citation>
</ref>
<ref id="B77">
<label>77</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Landis</surname> <given-names>JR</given-names>
</name>
<name>
<surname>Koch</surname> <given-names>GG</given-names>
</name>
</person-group>. <article-title>The measurement of observer agreement for categorical data</article-title>. <source>Biometrics</source>. (<year>1977</year>) <volume>33</volume>:<page-range>159&#x2013;74</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2307/2529310</pub-id>
</citation>
</ref>
<ref id="B78">
<label>78</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lalk</surname> <given-names>C</given-names>
</name>
<name>
<surname>Mathew</surname> <given-names>R</given-names>
</name>
</person-group>. <source>
<italic>XRAI - eXplanable Regression-based Artificial Intelligence</italic> (Version 0.1.1) [Software]</source>. (<year>2024</year>).</citation>
</ref>
<ref id="B79">
<label>79</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Cohen</surname> <given-names>P</given-names>
</name>
<name>
<surname>West</surname> <given-names>SG</given-names>
</name>
<name>
<surname>Aiken</surname> <given-names>LS</given-names>
</name>
</person-group>. <source>Applied multiple regression correlation analysis for the behavioral sciences</source>. <edition>3rd ed.</edition> <publisher-loc>New York, New York</publisher-loc>: <publisher-name>Routledge Taylor &amp; Francis Group</publisher-name> (<year>2015</year>).</citation>
</ref>
<ref id="B80">
<label>80</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chai</surname> <given-names>T</given-names>
</name>
<name>
<surname>Draxler</surname> <given-names>RR</given-names>
</name>
</person-group>. <article-title>Root mean square error (RMSE) or mean absolute error (MAE)? &#x2013; Arguments against avoiding RMSE in the literature</article-title>. <source>Geoscientific Model Dev</source>. (<year>2014</year>) <volume>7</volume>:<page-range>1247&#x2013;50</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/gmd-7-1247-2014</pub-id>
</citation>
</ref>
<ref id="B81">
<label>81</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Willmott</surname> <given-names>CJ</given-names>
</name>
<name>
<surname>Matsuura</surname> <given-names>K</given-names>
</name>
</person-group>. <article-title>Advantages of the mean absolute error (MAE) over the root mean square error (RMSE) in assessing average model performance</article-title>. <source>Climate Res</source>. (<year>2005</year>) <volume>30</volume>:<fpage>79</fpage>&#x2013;<lpage>82</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3354/cr030079</pub-id>
</citation>
</ref>
<ref id="B82">
<label>82</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tibshirani</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>Regression shrinkage and selection via the lasso</article-title>. <source>J R Stat Society Ser B (Methodological)</source>. (<year>1996</year>) <volume>58</volume>:<page-range>267&#x2013;88</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.2517-6161.1996.tb02080.x</pub-id>
</citation>
</ref>
<ref id="B83">
<label>83</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zou</surname> <given-names>H</given-names>
</name>
<name>
<surname>Hastie</surname> <given-names>T</given-names>
</name>
</person-group>. <article-title>Regularization and variable selection via the elastic net</article-title>. <source>J R Stat Society Ser B (Statistical Methodology)</source>. (<year>2005</year>) <volume>67</volume>:<page-range>301&#x2013;20</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1467-9868.2005.00503.x</pub-id>
</citation>
</ref>
<ref id="B84">
<label>84</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>T</given-names>
</name>
<name>
<surname>Guestrin</surname> <given-names>C</given-names>
</name>
</person-group>. (<year>2016</year>). <article-title>XGBoost: A scalable tree boosting system</article-title>, in: <conf-name>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>, <publisher-loc>San Francisco, California</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>. pp. <page-range>785&#x2013;94</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
</citation>
</ref>
<ref id="B85">
<label>85</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Random forests</article-title>. <source>Mach Learn</source>. (<year>2001</year>) <volume>45</volume>:<fpage>5</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
</citation>
</ref>
<ref id="B86">
<label>86</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cortes</surname> <given-names>C</given-names>
</name>
<name>
<surname>Vapnik</surname> <given-names>V</given-names>
</name>
</person-group>. <article-title>Support-vector networks</article-title>. <source>Mach Learn</source>. (<year>1995</year>) <volume>20</volume>:<page-range>273&#x2013;97</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF00994018</pub-id>
</citation>
</ref>
<ref id="B87">
<label>87</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>van der Laan</surname> <given-names>MJ</given-names>
</name>
<name>
<surname>Polley</surname> <given-names>EC</given-names>
</name>
<name>
<surname>Hubbard</surname> <given-names>AE</given-names>
</name>
</person-group>. <article-title>Super learner</article-title>. <source>Stat Appl Genet Mol Biol</source>. (<year>2007</year>) <volume>6</volume>:<fpage>Article25</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2202/1544-6115.1309</pub-id>
</citation>
</ref>
<ref id="B88">
<label>88</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Holzinger</surname> <given-names>A</given-names>
</name>
<name>
<surname>Saranti</surname> <given-names>A</given-names>
</name>
<name>
<surname>Molnar</surname> <given-names>C</given-names>
</name>
<name>
<surname>Biecek</surname> <given-names>P</given-names>
</name>
<name>
<surname>Samek</surname> <given-names>W</given-names>
</name>
</person-group>. <article-title>Explainable AI Methods&#x2014;A Brief Overview</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Holzinger</surname> <given-names>A</given-names>
</name>
<name>
<surname>Goebel</surname> <given-names>R</given-names>
</name>
<name>
<surname>Fong</surname> <given-names>R</given-names>
</name>
<name>
<surname>Moon</surname> <given-names>T</given-names>
</name>
<name>
<surname>M&#xfc;ller</surname> <given-names>K-R</given-names>
</name>
<name>
<surname>Samek</surname> <given-names>W</given-names>
</name>
</person-group>, editors. <source>xxAI - Beyond Explainable AI: International Workshop, Held in Conjunction with ICML 2020, July 18, 2020, Vienna, AUSTRIA, Revised and Extended Papers</source>. <publisher-loc>Berlin, Germany</publisher-loc>: <publisher-name>Springer International Publishing</publisher-name> (<year>2022</year>). p. <fpage>13</fpage>&#x2013;<lpage>38</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-3-031-04083-2_2</pub-id>
</citation>
</ref>
<ref id="B89">
<label>89</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Shapley</surname> <given-names>LS</given-names>
</name>
</person-group>. <article-title>17. A Value for n-Person Games</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Kuhn</surname> <given-names>HW</given-names>
</name>
<name>
<surname>Tucker</surname> <given-names>AW</given-names>
</name>
</person-group>, editors. <source>Contributions to the Theory of Games (AM-28)</source>, vol. <volume>II</volume>. <publisher-loc>Princeton, New Jersey</publisher-loc>: <publisher-name>Princeton University Press</publisher-name> (<year>1953</year>). p. <page-range>307&#x2013;18</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1515/9781400881970-018</pub-id>
</citation>
</ref>
<ref id="B90">
<label>90</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lundberg</surname> <given-names>S</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>S-I</given-names>
</name>
</person-group>. <article-title>A unified approach to interpreting model predictions</article-title>. <source>arXiv:1705.07874 [cs stat]</source>. (<year>2017</year>). <uri xlink:href="http://arxiv.org/abs/1705.07874">http://arxiv.org/abs/1705.07874</uri> (Accessed July 5, 2024).</citation>
</ref>
<ref id="B91">
<label>91</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lundberg</surname> <given-names>SM</given-names>
</name>
<name>
<surname>Erion</surname> <given-names>G</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>H</given-names>
</name>
<name>
<surname>DeGrave</surname> <given-names>A</given-names>
</name>
<name>
<surname>Prutkin</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Nair</surname> <given-names>B</given-names>
</name>
<etal/>
</person-group>. <article-title>Explainable AI for trees: from local explanations to global understanding</article-title>. <source>arXiv:1905.04610 [cs stat]</source>. (<year>2019</year>). <uri xlink:href="http://arxiv.org/abs/1905.04610">http://arxiv.org/abs/1905.04610</uri> (Accessed July 5, 2024).</citation>
</ref>
<ref id="B92">
<label>92</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nof</surname> <given-names>A</given-names>
</name>
<name>
<surname>Amir</surname> <given-names>O</given-names>
</name>
<name>
<surname>Goldstein</surname> <given-names>P</given-names>
</name>
<name>
<surname>Zilcha-Mano</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>What do these sounds tell us about the therapeutic alliance: Acoustic markers as predictors of alliance</article-title>. <source>Clin Psychol Psychother</source>. (<year>2021</year>) <volume>28</volume>:<page-range>807&#x2013;17</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cpp.v28.4</pub-id>
</citation>
</ref>
<ref id="B93">
<label>93</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Slonim</surname> <given-names>DA</given-names>
</name>
<name>
<surname>Yehezkel</surname> <given-names>I</given-names>
</name>
<name>
<surname>Paz</surname> <given-names>A</given-names>
</name>
<name>
<surname>Bar-Kalifa</surname> <given-names>E</given-names>
</name>
<name>
<surname>Wolff</surname> <given-names>M</given-names>
</name>
<name>
<surname>Dar</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Facing change: using automated facial expression analysis to examine emotional flexibility in the treatment of depression</article-title>. <source>Administration Policy Ment Health Ment Health Serv Res</source>. (<year>2024</year>) <volume>51</volume>:<page-range>501&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10488-023-01310-w</pub-id>
</citation>
</ref>
<ref id="B94">
<label>94</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lalk</surname> <given-names>C</given-names>
</name>
<name>
<surname>Steinbrenner</surname> <given-names>T</given-names>
</name>
<name>
<surname>Pena</surname> <given-names>JS</given-names>
</name>
<name>
<surname>Kania</surname> <given-names>W</given-names>
</name>
<name>
<surname>Schaffrath</surname> <given-names>J</given-names>
</name>
<name>
<surname>Eberhardt</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Depression symptoms are associated with frequency of cognitive distortions in psychotherapy transcripts</article-title>. <source>Cogn Ther Res</source>. (<year>2024</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10608-024-10542-5</pub-id>
</citation>
</ref>
<ref id="B95">
<label>95</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sch&#xf6;nbrodt</surname> <given-names>FD</given-names>
</name>
<name>
<surname>Perugini</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>At what sample size do correlations stabilize</article-title>? <source>J Res Pers</source>. (<year>2013</year>) <volume>47</volume>:<page-range>609&#x2013;12</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jrp.2013.05.009</pub-id>
</citation>
</ref>
<ref id="B96">
<label>96</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoyer</surname> <given-names>J</given-names>
</name>
<name>
<surname>Gloster</surname> <given-names>AT</given-names>
</name>
</person-group>. <article-title>Psychologische Flexibilit&#xe4;t messen= Measuring psychological flexibility: Der Fragebogen zu Akzeptanz und Handeln&#x2013;II (FAH-II): The Acceptance and Action Questionnaire&#x2013;II (AAQ-II)</article-title>. <source>Verhaltenstherapie</source>. (<year>2013</year>) <volume>23</volume>:<page-range>42&#x2013;4</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1159/000347040</pub-id>
</citation>
</ref>
<ref id="B97">
<label>97</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pang</surname> <given-names>B</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Opinion mining and sentiment analysis</article-title>. <source>Foundations Trends&#xae; Inf Retrieval</source>. (<year>2008</year>) <volume>2</volume>:<fpage>1</fpage>&#x2013;<lpage>135</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1561/1500000011</pub-id>
</citation>
</ref>
<ref id="B98">
<label>98</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>D-H</given-names>
</name>
<name>
<surname>Son</surname> <given-names>W-H</given-names>
</name>
<name>
<surname>Kwak</surname> <given-names>S-S</given-names>
</name>
<name>
<surname>Yun</surname> <given-names>T-H</given-names>
</name>
<name>
<surname>Park</surname> <given-names>J-H</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>J-D</given-names>
</name>
</person-group>. <article-title>A hybrid deep learning emotion classification system using multimodal data</article-title>. <source>Sensors</source>. (<year>2023</year>) <volume>23</volume>:<fpage>Article 23</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/s23239333</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>