<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychiatry</journal-id>
<journal-title>Frontiers in Psychiatry</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychiatry</abbrev-journal-title>
<issn pub-type="epub">1664-0640</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyt.2025.1596269</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Psychiatry</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Relationship between personality and sleep: a dual validation study combining empirical and big data-driven approaches</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Cao</surname>
<given-names>Lei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2671249/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wu</surname>
<given-names>Jiake</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3042388/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Mengyao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhao</surname>
<given-names>Liang</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3087713/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Xin</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yao</surname>
<given-names>Bowen</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Qi</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3008068/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Beijing Key Laboratory of Applied Experimental Psychology, National Demonstration Center for Experimental Psychology Education (Beijing Normal University), Faculty of Psychology, Beijing Normal University</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>School of Information Management, Key Laboratory of Semantic, Publishing and Knowledge Service of the National Press and Publication Administration, Wuhan University</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>The Institute of Biomedical Engineering, University of Oxford</institution>, <addr-line>Oxford</addr-line>, <country>United Kingdom</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>School of Economics and Management, Beijing Jiaotong University</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Long Lu, Wuhan University, China</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Mariusz Stanis&#x142;aw Wiglusz, Medical University of Gdansk, Poland</p>
<p>Saeid Komasi, Mind GPS Institute, Iran</p>
<p>Ali Zakiei, Substance Abuse Prevention Research Center and Sleep Disorders Research Center and Kermanshah University of Medical Sciences, Iran</p>
<p>Sali Rahadi Asih, University of Indonesia, Indonesia</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Qi Li, <email xlink:href="mailto:liqi2018@bnu.edu.cn">liqi2018@bnu.edu.cn</email>
</p>
</fn>
<fn fn-type="other" id="fn003">
<p>&#x2020;These authors share first authorship</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>17</day>
<month>07</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1596269</elocation-id>
<history>
<date date-type="received">
<day>19</day>
<month>03</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>17</day>
<month>06</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Cao, Wu, Wang, Zhao, Wang, Yao and Li</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Cao, Wu, Wang, Zhao, Wang, Yao and Li</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Objective</title>
<p>Sleep is a vital component of individual health, and personality traits are key factors influencing it. This study aims to investigate the relationship between personality traits and both model-assessed sleep problems and self-reported sleep quality.</p>
</sec>
<sec>
<title>Methods</title>
<p>Using deep semantic understanding technology, we developed three deep learning models based on microblogs. Model 1 and Model 2 identified whether a post indicated a sleep problem, while Model 3 assessed the user&#x2019;s personality traits based on the Five-Factor Model (FFM). We surveyed a dataset comprising 336 active users and then applied the models to a large-scale microblog dataset containing 4,860,000 posts from 15,251 users.</p>
</sec>
<sec>
<title>Results</title>
<p>Our experimental results revealed that: (1) conscientiousness, agreeableness, and extraversion are associated with better sleep quality, while neuroticism is linked to poorer sleep quality; (2) the relationships between sleep problems and personality traits remained consistent when the model, trained on a small survey dataset with expert annotations, was applied to the large-scale dataset.</p>
</sec>
<sec>
<title>Conclusions</title>
<p>These findings highlight the potential of using deep learning models to analyze the complex relationship between personality traits and sleep, offering valuable insights for future research and interventions.</p>
</sec>
</abstract>
<kwd-group>
<kwd>personality</kwd>
<kwd>sleep</kwd>
<kwd>semantic understanding</kwd>
<kwd>neural network</kwd>
<kwd>microblog</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="5"/>
<equation-count count="0"/>
<ref-count count="66"/>
<page-count count="15"/>
<word-count count="8670"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Digital Mental Health</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<sec id="s1_1">
<label>1.1</label>
<title>Background</title>
<p>Numerous studies have demonstrated that sleep plays a crucial role in physical recovery, memory consolidation, and emotional regulation (<xref ref-type="bibr" rid="B1">1</xref>). Scholars consider sleep to be a multifaceted phenomenon, proposing various sleep-related characteristics such as sleep quality (<xref ref-type="bibr" rid="B2">2</xref>), sleep duration (<xref ref-type="bibr" rid="B2">2</xref>), sleep problems (<xref ref-type="bibr" rid="B3">3</xref>) and sleep disorders (e.g., insomnia) (<xref ref-type="bibr" rid="B4">4</xref>). When these sleep issues arise, they are associated with an increased risk of developing various physical health conditions, including diabetes (<xref ref-type="bibr" rid="B5">5</xref>), obesity (<xref ref-type="bibr" rid="B6">6</xref>), cardiovascular diseases (<xref ref-type="bibr" rid="B7">7</xref>), and Alzheimer&#x2019;s disease (<xref ref-type="bibr" rid="B8">8</xref>), as well as a heightened risk of mortality (<xref ref-type="bibr" rid="B9">9</xref>). In addition, sleep disorders are strongly linked to mental health problems, such as the experience of excessive negative emotions and insufficient positive emotions (<xref ref-type="bibr" rid="B10">10</xref>). To better understand sleep, researchers have developed various tools to assess different aspects of sleep, which can generally be categorized into objective and subjective measures. Objective sleep characteristics are typically measured using laboratory equipment or specialized wearable devices, to record multiple physiological signals during sleep (e.g., electroencephalography and eye movements). These measures are considered the standard clinical procedure for diagnosing sleep-related disorders. Subjective sleep characteristics are commonly assessed through self-reported questionnaires [e.g., the Pittsburgh Sleep Quality Index (PSQI) (<xref ref-type="bibr" rid="B11">11</xref>)] and sleep diaries.</p>
<p>Personality is considered one of the key factors related to sleep (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B12">12</xref>). According to Akram et&#xa0;al. (<xref ref-type="bibr" rid="B4">4</xref>), the inherent nature of personality serves as both a predisposing and a potential maintaining factor for insomnia. A closer examination of personality&#x2019;s susceptibility and its long-term effects can provide a better understanding of the etiology of insomnia (<xref ref-type="bibr" rid="B12">12</xref>). For example, Grandner (<xref ref-type="bibr" rid="B13">13</xref>) noted that elevated arousal levels may explain the connection between neuroticism and sleep quality, as neuroticism is associated with stronger physiological responses to stress, which can delay an individual&#x2019;s return to a calm state after experiencing acute stress. To better understand personality, scholars have proposed various models from different perspectives. These include Cloninger&#x2019;s psychobiological model (<xref ref-type="bibr" rid="B14">14</xref>), Cattell&#x2019;s 16-Factor Personality model (16 PF) (<xref ref-type="bibr" rid="B15">15</xref>), Eysenck&#x2019;s personality model (<xref ref-type="bibr" rid="B16">16</xref>), the Alternative Model of Personality Disorders (AMPD) (<xref ref-type="bibr" rid="B17">17</xref>), and the Five-Factor Model (FFM) (<xref ref-type="bibr" rid="B18">18</xref>). Among the commonly used models, Cloninger&#x2019;s psychobiological model emphasizes the integration of genetic and developmental factors and is widely applied in mental disorder research (<xref ref-type="bibr" rid="B14">14</xref>); the DSM-5&#x2019;s Alternative Model of Personality Disorders (AMPD) focuses on traits such as negative affectivity, detachment, antagonism, disinhibition, and psychoticism, which are typically used to assess maladaptive personality traits and disorders (<xref ref-type="bibr" rid="B17">17</xref>). 
While all these models provide comprehensive analyses of personality, the FFM, also known as the Big-5 (<xref ref-type="bibr" rid="B19">19</xref>), stands out due to its demonstrated moderate-to-high longitudinal stability, reliability, and cross-cultural applicability (<xref ref-type="bibr" rid="B2">2</xref>). The FFM includes five broad traits: extraversion, agreeableness, conscientiousness, neuroticism, and openness to new experiences (<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B20">20</xref>).</p>
<p>Previous studies have shown that personality traits negatively affect various sleep characteristics, particularly sleep quality and chronotype (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B3">3</xref>). In research based on the Five-Factor Model (FFM), neuroticism has consistently been identified as a stable negative predictor of sleep quality (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B21">21</xref>&#x2013;<xref ref-type="bibr" rid="B25">25</xref>). Individuals with high neuroticism are more likely to hold metacognitive beliefs about sleep difficulties (<xref ref-type="bibr" rid="B24">24</xref>), experience more negative and fewer positive emotions (<xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B26">26</xref>), and tend to be more hyperaroused, all of which adversely affect sleep quality (<xref ref-type="bibr" rid="B10">10</xref>). Beyond FFM-based research, the Cloninger model also shows a correlation between traits like harm avoidance and sleep disorders such as insomnia (<xref ref-type="bibr" rid="B27">27</xref>). Zakiei et&#xa0;al. (<xref ref-type="bibr" rid="B28">28</xref>) emphasized that not only traditional personality traits but also pathological traits (e.g., psychoticism and negative affectivity) are stable predictors of various sleep problems. Akram et&#xa0;al. (<xref ref-type="bibr" rid="B4">4</xref>) also found that insomnia is linked to negative or maladaptive personality traits, including neuroticism, perfectionism, worry, social inhibition, and avoidance. Hisler et&#xa0;al. (<xref ref-type="bibr" rid="B29">29</xref>) suggested that trait stress, rather than neuroticism, modulates the relationship between sleep and self-control. 
However, several recent studies have reported findings that challenge these widely accepted relationships, particularly the link between neuroticism and sleep quality (<xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B30">30</xref>). Saksvik-Lehouillier et&#xa0;al. (<xref ref-type="bibr" rid="B25">25</xref>) found that individuals with high neuroticism experience fewer negative emotions under partial sleep deprivation than during normal sleep, whereas those with medium and low levels of neuroticism reported the opposite pattern. A further study of college students using Actigraph to objectively measure sleep found no relationship between neuroticism and sleep quality (<xref ref-type="bibr" rid="B30">30</xref>).</p>
<p>Several studies suggest that conscientiousness and extraversion are positively correlated with sleep quality (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B23">23</xref>), as individuals higher in these traits tend to be both psychologically and physiologically healthier and experience fewer negative emotions in stressful situations (<xref ref-type="bibr" rid="B26">26</xref>). However, some studies have contradicted these findings, suggesting that the relationship between personality traits and sleep quality may not be consistent across different contexts (<xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B30">30</xref>). For example, Kri&#x17e;an and Hisler (<xref ref-type="bibr" rid="B22">22</xref>) found no significant relationship between extraversion and objectively measured sleep quality, and Mead et&#xa0;al. (<xref ref-type="bibr" rid="B30">30</xref>) reported that extraversion may even negatively impact sleep quality.</p>
<p>Although research generally shows that agreeableness and openness are unrelated to sleep quality (<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B30">30</xref>), Cellini et&#xa0;al. (<xref ref-type="bibr" rid="B10">10</xref>) found that when cognitive reappraisal, inhibition, emotions, and hyperarousal were included in the regression model, agreeableness was the only personality trait that predicted sleep quality. Spears et&#xa0;al. (<xref ref-type="bibr" rid="B9">9</xref>) also suggested that agreeableness may indirectly predict mortality risk by affecting daytime impairments and sleep. Furthermore, Leger et&#xa0;al. (<xref ref-type="bibr" rid="B26">26</xref>) found evidence suggesting that openness might be associated with better sleep quality, as individuals with high openness tend to experience fewer negative emotions and may, therefore, have better sleep quality.</p>
</sec>
<sec id="s1_2">
<label>1.2</label>
<title>Measuring personality and sleep from social media</title>
<p>Due to the limitations of traditional methods in large-scale data collection, real-time analysis, and cost efficiency, researchers have increasingly turned to social media in recent years to assess mental health indicators, leveraging its natural user expressions and traceable characteristics as complementary tools (<xref ref-type="bibr" rid="B31">31</xref>&#x2013;<xref ref-type="bibr" rid="B35">35</xref>). These studies focused on three characteristics: behavioral features [e.g., number of posts, timing of posts, frequency of likes (<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B36">36</xref>), and comments on other posts (<xref ref-type="bibr" rid="B37">37</xref>)]; multimedia features [e.g., videos (<xref ref-type="bibr" rid="B38">38</xref>) and images (<xref ref-type="bibr" rid="B39">39</xref>)]; and text features. For text features, three semantic representation methods were mainly used to understand the content: discrete representations [e.g., term frequency-inverse document frequency (<xref ref-type="bibr" rid="B40">40</xref>)], closed vocabulary methods [e.g., Linguistic Inquiry and Word Count (<xref ref-type="bibr" rid="B41">41</xref>) and self-defined dictionaries (<xref ref-type="bibr" rid="B42">42</xref>)], and open vocabulary methods [e.g., Word2Vec (<xref ref-type="bibr" rid="B43">43</xref>) and BERT (<xref ref-type="bibr" rid="B44">44</xref>)]. Among these, open vocabulary methods using deep learning-based word embeddings provide the most effective representation of social media text (<xref ref-type="bibr" rid="B45">45</xref>).</p>
<p>Regarding personality, most research on personality assessment has focused on English text (<xref ref-type="bibr" rid="B46">46</xref>), with few studies examining the Chinese context using distributed representation methods for data training models. For example, Mahajan et&#xa0;al. (<xref ref-type="bibr" rid="B47">47</xref>) found that online-revealed personalities align with users&#x2019; true personalities. Cutler and Condon (<xref ref-type="bibr" rid="B48">48</xref>) conducted factor analysis on word embeddings of English text using BERT and compared the results with earlier lexical studies. They found that agreeableness, extraversion, and conscientiousness traits were well-replicated, but neuroticism and openness were not. Considerable research attention has focused on examining the relationship between sleep characteristics and their associated variables on social media platforms such as Twitter, Weibo, and Reddit (<xref ref-type="bibr" rid="B49">49</xref>). For example, Liu et&#xa0;al. (<xref ref-type="bibr" rid="B50">50</xref>) examined sleep-related user attributes like region and education levels, and Yao et&#xa0;al. (<xref ref-type="bibr" rid="B51">51</xref>) investigated how sleep quality as a symptom accompanies other mental health issues within a depression community, identifying co-occurrences with fear, negative expectations, and suicidal intentions. Relatively few studies have evaluated sleep problems using natural language processing techniques. For instance, Tian et&#xa0;al. (<xref ref-type="bibr" rid="B52">52</xref>) employed a support vector machine algorithm to detect sleep-related complaints in social media posts and identify key topics associated with insomnia.</p>
</sec>
<sec id="s1_3">
<label>1.3</label>
<title>Research objectives</title>
<p>Previous studies have established connections between personality traits and sleep characteristics, but inconsistent methodologies have produced mixed results (<xref ref-type="bibr" rid="B4">4</xref>). Two persistent issues complicate research in this area. First, data availability remains limited. Most existing datasets that include both sleep and personality measures are small and not publicly accessible, which restricts the generalizability of findings. Second, research approaches are often disconnected. Although social media platforms offer rich natural language data, most studies focus exclusively on either personality assessment or insomnia detection, with little attention to the interaction between the two (<xref ref-type="bibr" rid="B53">53</xref>).</p>
<p>This study aims to investigate the relationship between personality traits and both model-assessed sleep problems and self-reported sleep quality. Specifically, we focus on four main objectives:</p>
<list list-type="order">
<list-item>
<p>Develop and validate deep learning models for assessing sleep problems.</p>
</list-item>
<list-item>
<p>Develop and validate deep learning models for personality assessments.</p>
</list-item>
<list-item>
<p>Examine how personality traits correlate with self-reported sleep quality in survey responses.</p>
</list-item>
<list-item>
<p>Examine the link between personality traits and model-assessed sleep problems in the large dataset.</p>
</list-item>
</list>
</sec>
</sec>
<sec id="s2">
<label>2</label>
<title>Methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Overview of the methodological process</title>
<p>As shown in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>, we followed a systematic process for project design, data collection, and implementation. (1) First, we collected microblogs from Sina Weibo, China&#x2019;s largest social media platform, and constructed two datasets. The first dataset was a large-scale collection, consisting of 4,860,000 posts from 15,251 users. The second dataset combined microblogs with survey responses from 923 Sina Weibo users (336 active users). For data collection and management, we used PyCharm 2021.3.1 (Community Edition, JetBrains) to process the microblog text. (2) We then built two sleep assessment models: Model 1 was designed to determine whether a post was sleep-related, and Model 2 assessed whether a post indicated a sleep problem. For personality assessment, we applied BERT-based word embeddings in combination with long short-term memory (LSTM) (<xref ref-type="bibr" rid="B55">55</xref>) regression models incorporating an attention mechanism (Model 3). (3) To analyze the relationship between personality traits (FFM) and sleep characteristics, we used both self-reported data and model-generated assessments. As part of an exploratory analysis, we applied the three semantic models, which independently assess personality traits and sleep problems, to the large-scale microblog dataset to further investigate their relationship in this context.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>The framework of the study. CBF-PI, Chinese simplified big five personality inventory (<xref ref-type="bibr" rid="B54">54</xref>); PSQI, Pittsburgh sleep quality index (<xref ref-type="bibr" rid="B11">11</xref>).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1596269-g001.tif">
<alt-text content-type="machine-generated">Flowchart showing three sections: Sleep Assessment Models, Personality Assessment Models, and Relationship Analysis between Personality and Sleep. The first section details steps for processing posts on sleep, using BERT models to classify sleep-related and sleep-problem posts. The second section outlines survey data collection and cleaning, producing personality scores using BERT, Attention, and LSTM. The final section combines data sets for analyzing the relationship between personality and sleep, with models assessing sleep states and personality. Arrows indicate data flow and model outcomes.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Data collection</title>
<sec id="s2_2_1">
<label>2.2.1</label>
<title>Microblog dataset</title>
<p>The construction of the microblog dataset followed four steps: collection, cleaning, encoding, and enhancement. We collected microblogs from March 2021 to July 2021 using a set of sleep-related keywords describing sleep-related issues (e.g., &#x201c;insomnia&#x201d;, &#x201c;stay up&#x201d;, &#x201c;extensive dream&#x201d;, &#x201c;nightmare&#x201d;, &#x201c;startle awake&#x201d;, &#x201c;early morning&#x201d;, &#x201c;unable to sleep&#x201d; and &#x201c;sleepy&#x201d;). Thus, we obtained a large microblog dataset (N = 7,588,597) potentially reflecting sleep problems. From this dataset, we randomly selected a smaller subset for human labeling. The dataset had an average of 219.46 posts per user.</p>
<sec id="s2_2_1_1">
<label>2.2.1.1</label>
<title>Text cleaning and encoding</title>
<p>We counted the frequency of stop words (e.g., advertisement and marketing account) and filtered noisy posts via manual screening. This resulted in 3,449,456 posts for subsequent analysis. We randomly selected 1,600 posts, and each post was labeled in two steps by two undergraduate psychology students. For the label of &#x201c;whether the post is related to sleep&#x201d;, a total of 1,497 posts were consistently labeled (r = 0.84, <italic>p &lt;</italic>.001), of which 1,042 posts were sleep-related. For the label of &#x201c;whether the post reflects a sleep problem&#x201d;, a total of 774 posts were labeled consistently (r = 0.41, <italic>p &lt;</italic>.001), of which 606 posts were related to a &#x201c;sleep problem&#x201d;. In the subsequent model building, we only used consistently labeled data.</p>
</sec>
<sec id="s2_2_1_2">
<label>2.2.1.2</label>
<title>Data enhancement</title>
<p>To balance the sample size for the training set, we applied different strategies to the training set of Model 1 (&#x201c;whether the post is related to sleep&#x201d;) and Model 2 (&#x201c;whether the post reflects a sleep problem&#x201d;). For Model 1, we added 957 posts that did not include sleep-related keywords and were not related to sleep. For Model 2, we used the back-translation method (using the googletrans library in Python): the original post was translated into English, then translated into Spanish, and finally translated back into Chinese. We obtained 517 posts that did not express sleep problems, and 1,123 posts were selected for training Model 2.</p>
</sec>
</sec>
<sec id="s2_2_2">
<label>2.2.2</label>
<title>User survey</title>
<sec id="s2_2_2_1">
<label>2.2.2.1</label>
<title>Participants</title>
<p>The surveys were created using Qualtrics and distributed in two ways: 1) alongside the &#x201c;# Questionnaire Mutual Filling&#x201d; super topics on Sina Weibo, and 2) via the PsyExperimentor participant recruitment platform <xref ref-type="fn" rid="fn1">
<sup>1</sup>
</xref>. A total of 923 questionnaires were collected, of which 336 were valid and from active users. The average age of participants was 23.66 years (standard deviation (<italic>SD</italic>) = 4.60), and 257 were women. Participants were excluded if they failed the lie detection questions, were inactive microblog users (i.e., had fewer than five original posts), or had nonexistent or marketing-focused user identifications (ID). Through the user IDs, we crawled the original posts of all participants from January 2020 to January 2023 (N = 73,735). On average, each participant made 219.45 original posts. The highest and lowest number of posts by a participant was 3,945 and 5, respectively.</p>
</sec>
<sec id="s2_2_2_2">
<label>2.2.2.2</label>
<title>Questionnaires</title>
<p>The questionnaire comprised two parts: (1) a basic information questionnaire, which included age, gender, household registration, occupation, frequency of usage, nickname, and user ID; and (2) the Chinese Simplified Big Five Personality Inventory (CBF-PI) (<xref ref-type="bibr" rid="B54">54</xref>). The CBF-PI comprises a total of 15 items, with three items for each of the five personality traits. Responses are made on a six-point scale, with responses ranging from 1 (completely disagree) to 6 (completely agree). Two items are scored in reverse. Cronbach&#x2019;s alpha coefficients for openness, conscientiousness, extraversion, agreeableness, and neuroticism were 0.82, 0.72, 0.82, 0.83, and 0.77, respectively. The descriptive statistics of the valid users (N = 336) for each dimension of the FFM are presented in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>. The scores for each dimension were normally distributed. The PSQI (<xref ref-type="bibr" rid="B11">11</xref>) comprises 19 items across seven dimensions, and each item is scored on a four-point scale. The total score represents sleep quality, with higher scores indicating poorer sleep quality. Excluding five fill-in-the-blank questions, Cronbach&#x2019;s alpha coefficient for the PSQI was 0.84.</p>
</sec>
</sec>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Sleep assessment models</title>
<p>We developed two sleep assessment models. The first model assessed each post on &#x201c;whether it is related to sleep&#x201d; (Model 1). For posts that are assessed as being &#x201c;related to sleep&#x201d;, the second model evaluated &#x201c;whether there are sleep problems&#x201d; (Model 2). Models 1 and 2 shared a similar structure, and both utilized a BERT fine-tuning approach with a downstream fully connected neural network to build a classifier. To ensure computational efficiency, the text was first segmented into sentences. Due to BERT&#x2019;s input limitation of 512 tokens, sentences exceeding this length were truncated. After segmentation, each sentence was first passed through a pre-trained BERT Chinese model to convert each word into word embeddings, which were subsequently input into a Transformer Encoder (<italic>Trm</italic>). The <italic>Trm</italic> established semantic relationships between words according to the context. The output from the <italic>Trm</italic> was then fed into four types of classification models: a linear fully connected layer (BERT + Linear), a convolutional neural network (BERT + CNN), a recurrent neural network (BERT + LSTM), and a recurrent neural network with an attention mechanism (BERT + LSTM + Attention). These models were chosen to assess different types of contextual and sequential relationships within the text, allowing us to test various architectures for better performance.</p>
<p>To further evaluate the performance and robustness of our models, we also converted each sentence into word embeddings using a pre-trained ERNIE model [Enhanced Representation through Knowledge Integration; (<xref ref-type="bibr" rid="B56">56</xref>)], which was then input into a linear classifier (ERNIE + Linear). This additional model served as a comparative baseline, allowing us to assess the impact of using a different pre-trained language model for the task. The results from these models were compared to determine the most effective architecture for assessing sleep-related content and sleep problems in microblog posts, providing insights into which approach best captured the nuances of sleep-related language.</p>
<p>We split the labeled dataset for Model 1 (N = 2,454) and the labeled dataset for Model 2 (N = 1,123) into training, validation, and testing sets using a ratio of 8:1:1. Specifically, 80% of the data was used for training the model, 10% for model validation, and the remaining 10% for testing. This approach ensured that the models were trained on a sufficient amount of data while retaining a separate dataset for testing performance and tuning. To evaluate the performance of the models, we used Precision (P), Recall (R), and F1 score as key metrics. These metrics were chosen because they offer a balanced view of model performance. In our evaluation, the F1 score was prioritized because it combines both Precision and Recall into a single metric, offering a more comprehensive understanding of the model&#x2019;s performance.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Personality assessment models</title>
<p>The personality assessment model based on microblog text comprised five components: the BERT embedding layer, sentence fusion layer, LSTM layer, attention layer, and regression layer (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). This model evaluated personality as a trait variable, assuming it remains stable over time. Therefore, we aggregated multiple posts from each user to form a sequence of text data, which was crucial for capturing the consistency of the user&#x2019;s personality expression over time. Initially, word embeddings for each post were generated using the Chinese BERT pre-trained model. Since BERT had an input limitation of 512 tokens, posts longer than this threshold were truncated, and a &#x201c;split then merge&#x201d; approach was applied to ensure that the word embeddings accurately represented longer posts. In the sentence fusion layer, the word embeddings from the most recent 100 posts were selected for subsequent training. For users with fewer than 100 posts, zero vectors were used for padding. This resulted in each user&#x2019;s word embeddings being represented as a 100 &#xd7; 768 matrix. The sequence of word embedding matrices for each user was then input into the LSTM layer. LSTM, a specialized type of recurrent neural network, was particularly suited for handling sequence data. Here, each user&#x2019;s posts were treated as a sequence, allowing the LSTM to capture the temporal dynamics and semantic relationships across the multiple posts of each user. By processing these sequences, the model could learn how a user&#x2019;s personality traits were reflected and expressed over time in the context of their social media posts.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Structure of the personality assessment models (Model 3). Each model contains five layers: bidirectional encoder representations from transformers (BERT) word-embedding layer, sentence fusion layer, LSTM layer, attention layer, and regression layer. We trained five separate regression models for the Big Five personality traits. We used users&#x2019; self-reported scores as labeled inputs for training.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1596269-g002.tif">
<alt-text content-type="machine-generated">Diagram of a neural network architecture involving BERT word embeddings processed through a sentence-pool module, followed by a Long Short-Term Memory (LSTM) network. Attention mechanisms compute vectors \(a_1\) to \(a_N\), which are integrated to form a vector \(v\). This vector is passed through a linear layer leading to a regression score. The process is sequentially labeled: 1) BERT word embedding, 2) Sentence-Pool, 3) LSTM, 4) Attention, and 5) Regression.</alt-text>
</graphic>
</fig>
<p>To enhance the model&#x2019;s focus on relevant personality-related features, we incorporated an attention mechanism. This mechanism allocated attention to different parts of the sentence vectors, enabling the model to better capture key personality-related content from each post, thereby improving prediction accuracy. Finally, a linear regression model was applied to the output of the attention layer to generate the personality scores.</p>
<p>We trained five separate regression models for the Big Five personality traits, using normalized self-reported CBF-PI scores as labeled inputs. Normalizing personality scores improved training efficiency, reduced the impact of data sparsity and outliers, and led to a more stable model. In addition to the primary model, we compared the BERT-based model&#x2019;s performance with simpler models such as a linear fully connected layer (BERT + Linear) and a recurrent neural network (BERT + LSTM). The effectiveness of these models was evaluated by comparing the predicted personality scores with the labeled values using Pearson&#x2019;s correlation coefficient and RMSE. This comparison allowed us to assess the relative performance of different models in capturing personality traits from user-generated microblog content.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Development and validation of deep learning models for sleep problem assessment</title>
<p>The results of the sleep assessment models (i.e., Models 1 and 2) and comparisons with alternate models are shown in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. When determining whether a post is related to sleep (Model 1), the best performance was achieved when using only the BERT fine-tuning approach (precision = 95.09%, recall = 97.27%, F1 score = 0.95). When determining whether a sleep-related post indicated a sleep problem (Model 2), the best performance was achieved when using only the BERT fine-tuning approach, which had a precision of 91.30%, a recall of 91.65%, and an F1 score of 0.91.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Results of sleep assessment models: Model 1 assessed whether a post is related to sleep, and Model 2 evaluated whether there is a sleep problem in the post.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" align="center">Model</th>
<th valign="top" colspan="3" align="center">Model 1</th>
<th valign="top" colspan="3" align="center">Model 2</th>
</tr>
<tr>
<th valign="top" align="center">Precision</th>
<th valign="top" align="center">Recall</th>
<th valign="top" align="center">F1</th>
<th valign="top" align="center">Precision</th>
<th valign="top" align="center">Recall</th>
<th valign="top" align="center">F1</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">BERT + Linear</td>
<td valign="top" align="center">95.09%</td>
<td valign="top" align="center">
<bold>97.27%</bold>
</td>
<td valign="top" align="center">
<bold>0.95</bold>
</td>
<td valign="top" align="center">
<bold>91.30%</bold>
</td>
<td valign="top" align="center">
<bold>91.65%</bold>
</td>
<td valign="top" align="center">
<bold>0.91</bold>
</td>
</tr>
<tr>
<td valign="top" align="center">ERNIE + Linear</td>
<td valign="top" align="center">
<bold>97.25%</bold>
</td>
<td valign="top" align="center">92.17%</td>
<td valign="top" align="center">0.95</td>
<td valign="top" align="center">90.20%</td>
<td valign="top" align="center">88.46%</td>
<td valign="top" align="center">0.89</td>
</tr>
<tr>
<td valign="top" align="center">BERT + CNN</td>
<td valign="top" align="center">88.60%</td>
<td valign="top" align="center">87.83%</td>
<td valign="top" align="center">0.88</td>
<td valign="top" align="center">86.27%</td>
<td valign="top" align="center">84.62%</td>
<td valign="top" align="center">0.85</td>
</tr>
<tr>
<td valign="top" align="center">BERT + LSTM</td>
<td valign="top" align="center">92.52%</td>
<td valign="top" align="center">90.00%</td>
<td valign="top" align="center">0.91</td>
<td valign="top" align="center">89.36%</td>
<td valign="top" align="center">80.77%</td>
<td valign="top" align="center">0.85</td>
</tr>
<tr>
<td valign="top" align="center">BERT + LSTM + Attention</td>
<td valign="top" align="center">89.74%</td>
<td valign="top" align="center">91.30%</td>
<td valign="top" align="center">0.91</td>
<td valign="top" align="center">62.67%</td>
<td valign="top" align="center">90.38%</td>
<td valign="top" align="center">0.74</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Bold values indicate the best model performance.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>It is noteworthy that the assessment models for sleep-related and sleep problem posts, which used only BERT or ERNIE fine-tuning followed by a fully connected neural network output, performed better than those that incorporated additional deep learning algorithms. This indicates that, for our tasks, fine-tuning pre-trained models is sufficient to achieve good classification results. In fact, the addition of more complex models tended to degrade performance. This aligns with the findings of Mohammadi and Chapon (<xref ref-type="bibr" rid="B57">57</xref>), who demonstrated that when fine-tuning BERT pre-trained models, fully connected neural networks perform better than more complex classifiers for text classification tasks. Simpler classifiers can maximize the use of BERT&#x2019;s text representation capabilities, resulting in better performance, whereas complex classifiers are more prone to issues like overfitting, which can degrade performance.</p>
<p>We applied the sleep assessment models (Model 1 and Model 2) to a total of 73,735 posts from 336 valid participants. Among these, 2,709 posts were identified as related to sleep, and 1,578 of them were further identified as expressing sleep problems. For each participant, we calculated: (1) the total number of posts (TN, i.e., posting frequency); (2) the number of sleep-related posts (NSR); (3) the number of posts indicating sleep problems (NSP); (4) the proportion of sleep-related posts (PSR); and (5) the proportion of posts with sleep problems (PSP). Among the 336 users, 192 posted sleep-related content (with a maximum of 168 such posts and a highest proportion of 53.30%), and 172 users posted content expressing sleep problems (with a maximum of 81 such posts and a highest proportion of 53.33%).</p>
<p>We initially used self-reported sleep quality (i.e., PSQI scores) to evaluate the validity of sleep characteristics assessed by Model 1 and Model 2. However, PSQI scores were not significantly correlated with any of the four model-assessed sleep characteristics. To further explore potential influencing factors, we examined the correlation between the number of posts indicating sleep problems (NSP) and the total number of posts (TN). A strong positive correlation was observed (Pearson&#x2019;s r = 0.64, <italic>p &lt;</italic>.001), indicating possible collinearity. To address this, we conducted a moderation analysis with PSQI score as the independent variable, the number of posts indicating sleep problems (NSP) as the dependent variable, and the total number of posts (TN) as a moderating variable. Age and gender were included as covariates. The results showed that poorer self-reported sleep quality (i.e., higher PSQI scores) significantly predicted a greater number of sleep problem posts (NSP) (<italic>&#x3b2;</italic> = 0.68, <italic>p</italic> = .015). In addition, the interaction between sleep quality and the total number of posts (TN) was significant (<italic>&#x3b2;</italic> = 0.12, <italic>p</italic> = .006), suggesting a moderating effect of user activity. Simple slope analysis (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>) indicated that when the posting frequency was low, the PSQI score did not significantly predict the number of sleep problem posts (NSP) (<italic>&#x3b2;</italic> = 0.06, <italic>p</italic> = .817). However, at a high level of posting frequency, a higher PSQI score significantly predicted more posts expressing sleep problems (<italic>&#x3b2;</italic> = 1.49, <italic>p &lt;</italic>.001). A similar pattern was observed for the number of sleep-related posts (NSR). From these findings, we conclude that:</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>The moderating effect of the total number of posts (TN) on self-reported sleep quality (SQ, assessed using the Pittsburgh Sleep Quality Index (PSQI)) and the number of posts indicating a sleep problem (NSP, assessed using Model 2).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1596269-g003.tif">
<alt-text content-type="machine-generated">Line chart showing the relationship between self-reported sleep quality (low to high) and the number of posts indicating a sleep problem. The orange line shows a high number of posts, increasing from 9 to 13 as sleep quality rises. The blue line shows a low number of posts, remaining constant near zero.</alt-text>
</graphic>
</fig>
<p>Conclusion 1: Self-reported sleep quality significantly predicts model-assessed sleep problems, and this relationship is moderated by users&#x2019; total posting frequency.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Development and validation of deep learning models for personality assessments</title>
<p>The predictive performance of the personality (Big Five) models (Model 3) is shown in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>. When the input consisted of sentence vectors extracted using BERT features, the LSTM regression model based on the attention mechanism performed the best (average RMSE = 0.186), with predicted values for the test set significantly positively correlated with the questionnaire scores. Using the linear regression model or the LSTM model separately resulted in poor performance, with low, non-significant correlation coefficients between the predicted and questionnaire scores and higher RMSE. It is noteworthy that the performance of the personality assessment model (Model 3) varied across the five traits. Openness (<italic>r</italic> = 0.50, <italic>p</italic> = .003) and conscientiousness (<italic>r</italic> = 0.51, <italic>p</italic> = .003) performed well, with correlations around 0.5, whereas extraversion (<italic>r</italic> = 0.27, <italic>p</italic> = .021), agreeableness (<italic>r</italic> = 0.33, <italic>p</italic> = .013), and neuroticism (<italic>r</italic> = 0.24, <italic>p</italic> = .047) showed poorer performance. The self-reported questionnaires indicated generally high scores, with uneven training data for agreeableness. Results for agreeableness and extraversion may also have been affected by social desirability factors, such as acceptance, pro-social behavior, and sociability (<xref ref-type="bibr" rid="B58">58</xref>). Furthermore, agreeableness, which is a highly evaluative trait, may lead to inaccuracies in self-assessment and, in turn, inconsistent results (<xref ref-type="bibr" rid="B59">59</xref>).</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Results of personality assessment models: the Chinese Simplified Big Five Personality Inventory (CBF-PI) as a measure of FFM.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Method</th>
<th valign="top" align="center">Result</th>
<th valign="top" align="center">O</th>
<th valign="top" align="center">C</th>
<th valign="top" align="center">E</th>
<th valign="top" align="center">A</th>
<th valign="top" align="center">N</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="2" align="center">CBF-PI Score</td>
<td valign="top" align="center">
<italic>M</italic>
</td>
<td valign="top" align="center">10.82</td>
<td valign="top" align="center">13.34</td>
<td valign="top" align="center">10.12</td>
<td valign="top" align="center">13.80</td>
<td valign="top" align="center">10.34</td>
</tr>
<tr>
<td valign="top" align="center">
<italic>SD</italic>
</td>
<td valign="top" align="center">3.23</td>
<td valign="top" align="center">2.54</td>
<td valign="top" align="center">3.40</td>
<td valign="top" align="center">2.64</td>
<td valign="top" align="center">3.28</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">BERT + Linear</td>
<td valign="top" align="center">
<italic>r</italic>
</td>
<td valign="top" align="center">-0.04</td>
<td valign="top" align="center">0.09</td>
<td valign="top" align="center">0.04</td>
<td valign="top" align="center">0.04</td>
<td valign="top" align="center">-0.30</td>
</tr>
<tr>
<td valign="top" align="center">RMSE</td>
<td valign="top" align="center">0.34</td>
<td valign="top" align="center">0.28</td>
<td valign="top" align="center">0.38</td>
<td valign="top" align="center">0.25</td>
<td valign="top" align="center">0.42</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">BERT + LSTM</td>
<td valign="top" align="center">
<italic>r</italic>
</td>
<td valign="top" align="center">0.14</td>
<td valign="top" align="center">0.09</td>
<td valign="top" align="center">0.10</td>
<td valign="top" align="center">0.20</td>
<td valign="top" align="center">0.14</td>
</tr>
<tr>
<td valign="top" align="center">RMSE</td>
<td valign="top" align="center">0.21</td>
<td valign="top" align="center">0.19</td>
<td valign="top" align="center">0.22</td>
<td valign="top" align="center">0.19</td>
<td valign="top" align="center">0.24</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">BERT + LSTM + Attention</td>
<td valign="top" align="center">
<italic>r</italic>
</td>
<td valign="top" align="center">0.50**</td>
<td valign="top" align="center">0.51**</td>
<td valign="top" align="center">0.28**</td>
<td valign="top" align="center">0.33*</td>
<td valign="top" align="center">0.24*</td>
</tr>
<tr>
<td valign="top" align="center">RMSE</td>
<td valign="top" align="center">
<bold>0.17</bold>
</td>
<td valign="top" align="center">
<bold>0.16</bold>
</td>
<td valign="top" align="center">
<bold>0.21</bold>
</td>
<td valign="top" align="center">
<bold>0.17</bold>
</td>
<td valign="top" align="center">
<bold>0.22</bold>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>O, Openness; C, Conscientiousness; E, Extraversion; A, Agreeableness; N, Neuroticism; M, Mean; SD, Standard Deviation; <italic>r</italic>, Pearson&#x2019;s correlation coefficient; RMSE, Root Mean Squared Error. *<italic>p &lt;.</italic>05, **<italic>p &lt;.</italic>01.</p>
</fn>
<fn>
<p>Bold values indicate the best model performance.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Relationship between personality traits and self-reported sleep quality</title>
<p>We examined the correlations between self-reported sleep quality (i.e., PSQI score), the number of sleep-related posts (NSR), the number of posts indicating a sleep problem (NSP), and the proportion of posts with sleep problems (PSP) and personality traits (measured by CBF-PI scores) (<xref ref-type="supplementary-material" rid="SF1">
<bold>Supplementary Table S1</bold>
</xref> in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplemental Materials</bold>
</xref>). The results showed significant associations between all five personality traits (openness, conscientiousness, extraversion, agreeableness, and neuroticism) and PSQI scores. Then we used these four model-assessed sleep characteristics as dependent variables and other variables (i.e., personality traits, gender and age) that showed significant correlations with these characteristics as independent variables in the regression model. Results in <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref> show that agreeableness significantly predicted better self-reported sleep quality (<italic>&#x3b2;</italic> = &#x2212;0.14, <italic>p &lt;</italic>.01), while neuroticism significantly predicted poorer self-reported sleep quality (<italic>&#x3b2;</italic> = 0.40, <italic>p &lt;</italic>.001). Therefore, we concluded that:</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Regression analysis of personality traits (CBF-PI scores) with PSQI and model-assessed sleep characteristics in 336 users.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" colspan="2" align="center">Regression models</th>
<th valign="top" colspan="6" align="center">Model fit</th>
</tr>
<tr>
<th valign="top" align="center">Dependent</th>
<th valign="top" align="center">Independent</th>
<th valign="top" align="center">
<italic>R</italic>
</th>
<th valign="top" align="center">
<italic>R</italic>
<sup>2</sup>
</th>
<th valign="top" align="center">
<italic>F</italic>
</th>
<th valign="top" align="center">
<italic>B</italic> (95% CI)</th>
<th valign="top" align="center">
<italic>&#x3b2;</italic>
</th>
<th valign="top" align="center">
<italic>t</italic>
</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="5" align="center">PSQI</td>
<td valign="top" align="center">O</td>
<td valign="top" rowspan="5" align="center">0.53</td>
<td valign="top" rowspan="5" align="center">0.27</td>
<td valign="top" rowspan="5" align="center">26.35**</td>
<td valign="top" align="center">0.03 [&#x2013;0.06,0.13]</td>
<td valign="top" align="center">0.04</td>
<td valign="top" align="center">0.49</td>
</tr>
<tr>
<td valign="top" align="center">C</td>
<td valign="top" align="center">&#x2013;0.11 [&#x2013;0.24,0.01]</td>
<td valign="top" align="center">&#x2013;0.10</td>
<td valign="top" align="center">&#x2013;1.85</td>
</tr>
<tr>
<td valign="top" align="center">E</td>
<td valign="top" align="center">&#x2013;0.07 [&#x2013;0.17,0.02]</td>
<td valign="top" align="center">&#x2013;0.08</td>
<td valign="top" align="center">&#x2013;1.50</td>
</tr>
<tr>
<td valign="top" align="center">A</td>
<td valign="top" align="center">&#x2013;0.15 [&#x2013;0.27,0.46]</td>
<td valign="top" align="center">&#x2013;0.14</td>
<td valign="top" align="center">
<bold>&#x2013;2.70*</bold>
</td>
</tr>
<tr>
<td valign="top" align="center">N</td>
<td valign="top" align="center">0.36 [0.27,0.46]</td>
<td valign="top" align="center">0.40</td>
<td valign="top" align="center">
<bold>7.61***</bold>
</td>
</tr>
<tr>
<td valign="middle" rowspan="4" align="center">NSR</td>
<td valign="top" align="center">Age</td>
<td valign="top" rowspan="4" align="center">0.20</td>
<td valign="top" rowspan="4" align="center">0.03</td>
<td valign="top" rowspan="4" align="center">3.50*</td>
<td valign="top" align="center">0.37 [&#x2013;0.04,0.78]</td>
<td valign="top" align="center">0.10</td>
<td valign="top" align="center">1.76</td>
</tr>
<tr>
<td valign="top" align="center">O</td>
<td valign="top" align="center">&#x2013;0.33 [&#x2013;1.72,&#x2013;0.08]</td>
<td valign="top" align="center">&#x2013;0.06</td>
<td valign="top" align="center">&#x2013;0.96</td>
</tr>
<tr>
<td valign="top" align="center">C</td>
<td valign="top" align="center">&#x2013;0.90 [&#x2013;1.72,&#x2013;0.08]</td>
<td valign="top" align="center">&#x2013;0.13</td>
<td valign="top" align="center">
<bold>&#x2013;2.15*</bold>
</td>
</tr>
<tr>
<td valign="top" align="center">E</td>
<td valign="top" align="center">&#x2013;0.24 [&#x2013;0.87,0.39]</td>
<td valign="top" align="center">&#x2013;0.05</td>
<td valign="top" align="center">&#x2013;0.74</td>
</tr>
<tr>
<td valign="middle" rowspan="4" align="center">PSR</td>
<td valign="top" align="center">Gender</td>
<td valign="top" rowspan="4" align="center">0.26</td>
<td valign="top" rowspan="4" align="center">0.05</td>
<td valign="top" rowspan="4" align="center">5.75**</td>
<td valign="top" align="center">3.14 [0.53,5.74]</td>
<td valign="top" align="center">0.13</td>
<td valign="top" align="center">
<bold>2.37*</bold>
</td>
</tr>
<tr>
<td valign="top" align="center">Age</td>
<td valign="top" align="center">0.26 [0.02,0.49]</td>
<td valign="top" align="center">0.12</td>
<td valign="top" align="center">
<bold>2.16*</bold>
</td>
</tr>
<tr>
<td valign="top" align="center">O</td>
<td valign="top" align="center">&#x2013;0.28 [&#x2013;0.64,0.07]</td>
<td valign="top" align="center">&#x2013;0.09</td>
<td valign="top" align="center">&#x2013;1.57</td>
</tr>
<tr>
<td valign="top" align="center">C</td>
<td valign="top" align="center">&#x2013;0.40 [&#x2013;0.82,0.06]</td>
<td valign="top" align="center">&#x2013;0.10</td>
<td valign="top" align="center">&#x2013;1.71</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>O, Openness; C, Conscientiousness; E, Extraversion; A, Agreeableness; N, Neuroticism; PSQI, Pittsburgh Sleep Quality Index; NSR, Number of Sleep-Related Posts; PSR, Proportion of Sleep-Related Posts; PSP, Proportion of Posts with Sleep Problems; R, Pearson&#x2019;s correlation coefficient; R&#xb2;, Coefficient of Determination; F, F-statistic (used to assess model fit); 95% CI, 95% Confidence Interval; B, Unstandardized regression coefficient; <italic>&#x3b2;</italic>, Standardized regression coefficient; t, t-statistic (used for hypothesis testing). *<italic>p</italic>&lt;.05, **<italic>p</italic>&lt;.01, ***<italic>p</italic>&lt;.001.</p>
</fn>
<fn>
<p>Bold values indicate statistically significant results.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Conclusion 2: Openness, conscientiousness, extraversion, and agreeableness were significantly associated with better self-reported sleep quality, while neuroticism was linked to poorer self-reported sleep quality in the correlation analysis. Agreeableness and neuroticism remained significant predictors in the multivariate regression.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Relationship between personality traits and model-assessed sleep problems</title>
<p>We applied the sleep assessment models (i.e., Models 1 and 2) to the dataset comprising 73,735 posts from 336 surveyed users. We then explored the relationships between sleep characteristics and personality traits at both the post and user levels to provide a comprehensive view.</p>
<p>At the post level, &#x201c;whether a post is related to sleep (SR)&#x201d; and &#x201c;whether a post indicates a sleep problem (SP)&#x201d; were used as independent variables, and self-reported personality traits (CBF-PI scores) were used as dependent variables in independent samples t-tests. Due to the small proportion of sleep-related posts for all personality traits except agreeableness, we applied corrections for unequal variances using IBM SPSS Statistics for Mac (Version 26.0.0.2). The results are shown in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>. We found two key results: (1) Posts related to sleep (SR) had significantly lower scores in openness (<italic>t</italic> = 20.88, <italic>p &lt;</italic>.001), conscientiousness (<italic>t</italic> = 19.23, <italic>p &lt;</italic>.001), extraversion (<italic>t</italic> = 17.16, <italic>p &lt;</italic>.001), and agreeableness (<italic>t</italic> = 11.67, <italic>p &lt;</italic>.001), and had significantly higher scores in neuroticism (<italic>t</italic> = &#x2212;17.07, <italic>p &lt;</italic>.001); (2) Compared to posts without sleep problems, posts expressing sleep problems (SP) had significantly lower scores in openness (<italic>t</italic> = 17.52, <italic>p &lt;</italic>.001), conscientiousness (<italic>t</italic> = 13.99, <italic>p &lt;</italic>.001), extraversion (<italic>t</italic> = 12.47, <italic>p &lt;</italic>.001), and agreeableness (<italic>t</italic> = 7.70, <italic>p &lt;</italic>.001), and significantly higher scores in neuroticism (<italic>t</italic> = &#x2212;12.93, <italic>p &lt;</italic>.001). Therefore, we drew the following conclusion:</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Relationship between sleep and the big five personality traits (openness, conscientiousness, extraversion, agreeableness, and neuroticism) at the post level (tested on the user survey dataset). &#x201c;SR&#x201d; is an abbreviation for &#x201c;Sleep-Related&#x201d;, indicating whether the post is related to sleep; &#x201c;SP&#x201d; is an abbreviation for &#x201c;Sleep Problems&#x201d;, indicating whether the post explicitly expresses sleep problems. The green bars represent posts classified as &#x201c;Related to sleep&#x201d; or &#x201c;Expressed sleep problems&#x201d;, and the blue bars represent posts classified as &#x201c;Not related to sleep&#x201d; or &#x201c;Did not express sleep problems&#x201d;.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1596269-g004.tif">
<alt-text content-type="machine-generated">Bar chart showing personality scores for five traits: Openness (O), Conscientiousness (C), Extraversion (E), Agreeableness (A), and Neuroticism (N). Each trait has two bars: green for those related to sleep problems and blue for those not related. Scores range from eight to fourteen, with notable higher scores in conscientiousness and agreeableness for both groups.</alt-text>
</graphic>
</fig>
<p>Conclusion 3: Openness, conscientiousness, extraversion and agreeableness measured by CBF-PI scores are significantly associated with fewer model-assessed sleep problems, whereas neuroticism is significantly associated with more model-assessed sleep problems at the post level.</p>
<p>At the user level, we first examined the correlations between personality traits (measured by CBF-PI scores) and the four model-assessed sleep characteristics (the number of sleep-related posts (NSR), the proportion of sleep-related posts (PSR), the number of posts indicating a sleep problem (NSP) and the proportion of posts with sleep problems (PSP)) (<xref ref-type="supplementary-material" rid="SF1">
<bold>Supplementary Table S1</bold>
</xref> in Supplemental Materials). The number of sleep-related posts (NSR) was significantly negatively correlated with openness (<italic>r</italic> = &#x2212;0.12, <italic>p</italic> = .031), conscientiousness (<italic>r</italic> = &#x2212;0.16, <italic>p</italic> = .006), and extraversion (<italic>r</italic> = &#x2212;0.11, <italic>p</italic> = .046). The number of posts indicating a sleep problem (NSP) was significantly negatively correlated with openness (<italic>r</italic> = &#x2212;0.14, <italic>p</italic> = .013) and conscientiousness (<italic>r</italic> = &#x2212;0.16, <italic>p</italic> = .003). The proportion of posts with sleep problems (PSP) was significantly negatively correlated with openness (<italic>r</italic> = &#x2212;0.14, <italic>p</italic> = .013; <xref ref-type="supplementary-material" rid="SF1">
<bold>Supplementary Table S1</bold>
</xref>). Further regression analysis revealed that conscientiousness was a significant negative predictor of the number of sleep-related posts (NSR) (<italic>&#x3b2;</italic> = &#x2212;0.13, <italic>p</italic> = .032).</p>
<p>Further, we explored the relationship between model-assessed sleep characteristics and model-assessed personality traits from a big data-driven perspective. We randomly selected 15,251 users who had posted sleep-related content and crawled all of their original posts (N = 4,864,600) made between January 2020 and January 2023 using the user IDs. We then selected users who had posted more than five original posts (N = 13,753; 11,035 women, 2,627 men, and 91 with undisclosed gender), resulting in a total of 3,960,000 posts. We applied the sleep assessment models (i.e., Models 1 and 2) and the personality assessment model (Model 3). Results showed that 12,623 users had written sleep-related posts, which totaled 447,600 posts (11.3% of all posts), and 12,274 users had written about sleep problems, which totaled 332,600 posts (8.4% of all posts). Based on the analysis results from the surveyed dataset, we used two model-assessed sleep characteristics: the number of sleep-related posts (NSR) and the number of posts indicating a sleep problem (NSP), and conducted a correlation analysis between these sleep characteristics and personality traits. As shown in <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>, the number of sleep-related posts (NSR) was significantly correlated with lower scores in conscientiousness (<italic>r</italic> = &#x2212;0.07, <italic>p</italic> &lt; .001), extraversion (<italic>r</italic> = &#x2212;0.16, <italic>p</italic> &lt; .001), and agreeableness (<italic>r</italic> = &#x2212;0.14, <italic>p</italic> &lt; .001), and significantly correlated with higher scores in neuroticism (<italic>r</italic> = 0.23, <italic>p</italic> &lt; .001). For the number of posts indicating a sleep problem (NSP), the results were similar to those for the number of sleep-related posts (NSR), with the addition of a significant positive correlation with openness (<italic>r</italic> = 0.02, <italic>p</italic> = .027).</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>Correlations between model-assessed sleep characteristics and personality traits.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" rowspan="2" align="left">Sleep Characteristics</th>
<th valign="top" colspan="5" align="center">Model-assessed personality traits</th>
</tr>
<tr>
<th valign="top" align="center">O (95% CI)</th>
<th valign="top" align="center">C (95% CI)</th>
<th valign="top" align="center">E (95% CI)</th>
<th valign="top" align="center">A (95% CI)</th>
<th valign="top" align="center">N (95% CI)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">NSR</td>
<td valign="top" align="center">0.01 [&#x2212;0.01,0.02]</td>
<td valign="top" align="center">&#x2212;0.07<sup>&#x2217;&#x2217;&#x2217;</sup> [&#x2212;0.09,&#x2212;.05]</td>
<td valign="top" align="center">&#x2212;0.16<sup>&#x2217;&#x2217;&#x2217;</sup> [&#x2212;0.18,&#x2212;0.14]</td>
<td valign="top" align="center">&#x2212;0.14<sup>&#x2217;&#x2217;&#x2217;</sup> [&#x2212;0.15,&#x2212;0.12]</td>
<td valign="top" align="center">0.23<sup>&#x2217;&#x2217;&#x2217;</sup> [0.21,0.24]</td>
</tr>
<tr>
<td valign="top" align="left">NSP</td>
<td valign="top" align="center">0.02<sup>&#x2217;</sup> [0.01,0.04]</td>
<td valign="top" align="center">&#x2212;0.06<sup>&#x2217;&#x2217;&#x2217;</sup> [&#x2212;0.07,&#x2212;0.04]</td>
<td valign="top" align="center">&#x2212;0.16<sup>&#x2217;&#x2217;&#x2217;</sup> [&#x2212;0.18,&#x2212;0.15]</td>
<td valign="top" align="center">&#x2212;0.15<sup>&#x2217;&#x2217;&#x2217;</sup> [&#x2212;0.17,&#x2212;0.14]</td>
<td valign="top" align="center">&#x2212;0.20<sup>&#x2217;&#x2217;&#x2217;</sup> [&#x2212;0.18,&#x2212;0.22]</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Users = 13,753.</p>
</fn>
<fn>
<p>O, Openness; C, Conscientiousness; E, Extraversion; A, Agreeableness; N, Neuroticism; NSR, The number of sleep-related posts; NSP, The number of posts indicating a sleep problem; 95% CI, 95% Confidence Interval; *<italic>p &lt;.</italic>05, ***<italic>p &lt;.</italic>001.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>We analyzed the model-assessed personality scores in the large dataset and found two key issues: (1) The standard deviation (SD) of model-assessed personality trait scores was lower than that of self-reported scores in the surveyed dataset (N = 336; <xref ref-type="supplementary-material" rid="SF2">
<bold>Supplementary Tables S2</bold>
</xref>, <xref ref-type="supplementary-material" rid="SF3">
<bold>S3</bold>
</xref>). Since the model&#x2019;s training goal was to minimize the loss function, predictions tended to cluster around the mean value. (2) There was collinearity among the model-assessed personality traits, likely due to the use of the same dataset for training the models of the five dimensions. Despite these issues, the model-assessed personality traits were significantly correlated with the self-reported personality traits (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>), indicating that the relative magnitude of each user&#x2019;s personality scores reflected their position within the entire group.</p>
<p>To address these two issues, we ranked and grouped the model-assessed personality traits (N = 13,753) and selected the top and bottom 27% of the data to form high-score and low-score groups, respectively, for each dimension. The 27% selection was chosen to ensure a clear distinction between the low-score and high-score groups, capturing significant extremes while minimizing overlap and potential collinearity from the central range. <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref> shows that: (1) users in the high-score group for conscientiousness (<italic>t</italic> = 14.96, <italic>p</italic> &lt; .001), extraversion (<italic>t</italic> = 23.36, <italic>p</italic> &lt; .001), and agreeableness (<italic>t</italic> = 19.65, <italic>p</italic> &lt; .001) had significantly fewer sleep-related posts than those in the low-score group for these traits, while users in the high neuroticism group had significantly more sleep-related posts than those in the low neuroticism group (<italic>t</italic> = &#x2212;21.02, <italic>p</italic> &lt; .001); (2) users in the high-score group for openness (<italic>t</italic> = &#x2212;2.18, <italic>p</italic> = .029) and neuroticism (<italic>t</italic> = &#x2212;17.54, <italic>p</italic> &lt; .001) had significantly more posts indicating a sleep problem than those in the low-score group for these traits, while users in the high-score group for conscientiousness (<italic>t</italic> = 11.42, <italic>p</italic> &lt; .001), extraversion (<italic>t</italic> = 22.68, <italic>p</italic> &lt; .001), and agreeableness (<italic>t</italic> = 21.58, <italic>p</italic> &lt; .001) had significantly fewer posts indicating a sleep problem than those in the low-score group for these traits. Thus, we concluded that:</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Differences in the number of posts [the number of sleep-related posts (NSR) and the number of posts indicating a sleep problem (NSP)] between users with high and low scores for the various personality traits (N = 13,753). O, Openness; C, Conscientiousness; E, Extraversion; A, Agreeableness; N, Neuroticism.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpsyt-16-1596269-g005.tif">
<alt-text content-type="machine-generated">Bar chart comparing the number of sleep-related and sleep problem posts for low and high personality score groups across traits: openness (O), conscientiousness (C), extraversion (E), agreeableness (A), and neuroticism (N). Dark blue represents low scores, and light blue represents high scores.</alt-text>
</graphic>
</fig>
<p>Conclusion 4: From a big data-driven perspective, higher model-assessed sleep characteristics were significantly associated with lower scores in model-assessed conscientiousness, extraversion, and agreeableness, and with higher scores in neuroticism. These findings largely align with the results from self-reported data.</p>
</sec>
</sec>
<sec id="s4">
<label>4</label>
<title>General discussion</title>
<p>In this paper, we present a novel framework that integrates user surveys and big data-driven computational methods to assess sleep characteristics and personality traits from microblogs. Specifically, we constructed two classifiers based on BERT word embeddings to capture the deep semantic content of microblogs, enabling us to determine whether posts were related to sleep and whether they expressed sleep problems (Models 1 and 2, respectively). For the more complex task of personality assessment, we built a semantic feature space by fine-tuning BERT word embeddings and introduced an LSTM neural network with an attention mechanism to predict scores for the five personality traits manifested in the microblogs (Model 3). We collected an empirical dataset based on user surveys (total users = 923, active users = 336) and applied expert cross-annotation and self-reported questionnaires as the gold standard for training the three models. Our approach achieved high performance in assessing sleep characteristics and personality traits in both the training and testing datasets. We then applied these models to a separate large-scale microblog dataset (13,753 users and 4,864,600 posts).</p>
<p>Notably, our approach also scrutinized the reliability of big data methods in assessing psychological variables and their interrelationships. We analyzed these relationships from both survey-based and big data-driven perspectives and identified the commonalities with, and differences between, the findings of previous research across the five personality dimensions (<xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref>). Previous research has consistently found a negative impact of neuroticism and a positive impact of conscientiousness on sleep quality (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B24">24</xref>). Furthermore, extraversion is also often associated with better sleep quality (<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B23">23</xref>). In the surveyed dataset, we found that:</p>
<list list-type="order">
<list-item>
<p>Self-reported sleep quality significantly predicts model-assessed sleep problems, and this relationship is moderated by users&#x2019; total posting frequency.</p>
</list-item>
<list-item>
<p>Openness, conscientiousness, extraversion, and agreeableness measured by CBF-PI scores are significantly associated with better self-reported sleep quality, whereas neuroticism significantly predicts poorer self-reported sleep quality.</p>
</list-item>
<list-item>
<p>Openness, conscientiousness, extraversion and agreeableness measured by CBF-PI scores are significantly associated with fewer model-assessed sleep problems, whereas neuroticism is significantly associated with more model-assessed sleep problems at the post level.</p>
</list-item>
<list-item>
<p>Self-reported sleep quality (as measured by the PSQI) predicted the number of sleep-related posts and the number of posts indicating a sleep problem, moderated by the total number of posts.</p>
<p>When the models were applied to the large-scale dataset, we found that:</p>
</list-item>
<list-item>
<p>Higher model-assessed sleep characteristics were significantly associated with lower scores in model-assessed conscientiousness, extraversion, and agreeableness, and with higher scores in neuroticism.</p>
</list-item>
</list>
<table-wrap id="T5" position="float">
<label>Table&#xa0;5</label>
<caption>
<p>Comparison of the personality&#x2013;sleep relationship between our study and previous studies.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Author</th>
<th valign="top" align="center">Method</th>
<th valign="top" align="center">Participants</th>
<th valign="top" align="center">N</th>
<th valign="top" align="center">E</th>
<th valign="top" align="center">C</th>
<th valign="top" align="center">O</th>
<th valign="top" align="center">A</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">This study</td>
<td valign="top" align="center">Model1,2 vs. CBF-PI<break/>Self-reported sleep vs. CBF-PI</td>
<td valign="top" align="center">Posts<break/>(N = 73,735) Users<break/>(N = 336)</td>
<td valign="top" align="center">Negative<break/>Negative<break/>(predicted)</td>
<td valign="top" align="center">Positive<break/>Positive</td>
<td valign="top" align="center">Positive<break/>Positive</td>
<td valign="top" align="center">Positive<break/>Positive</td>
<td valign="top" align="center">Positive<break/>Positive<break/>(predicted)</td>
</tr>
<tr>
<td valign="top" align="center"/>
<td valign="top" align="center">Model1,2 vs. CBF-PI</td>
<td valign="top" align="center">Users<break/>(N = 336)</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">Positive (predicted)</td>
<td valign="top" align="center">Positive (predicted)</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="center"/>
<td valign="top" align="center">Model1,2 vs. Model3</td>
<td valign="top" align="center">Users<break/>(N = 13,753)</td>
<td valign="top" align="center">Negative</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">Positive</td>
</tr>
<tr>
<td valign="top" align="center">Hintsanen et al. (<xref ref-type="bibr" rid="B60">60</xref>)</td>
<td valign="top" align="center">Survey</td>
<td valign="top" align="center">Cross-culture<break/>(N=2,727)</td>
<td valign="top" align="center">Negative</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">Positive</td>
</tr>
<tr>
<td valign="top" align="center">Cellini et al. (<xref ref-type="bibr" rid="B10">10</xref>)</td>
<td valign="top" align="center">Survey</td>
<td valign="top" align="center">Subjects<break/>(N = 498)</td>
<td valign="top" align="center">Negative</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">Positive</td>
</tr>
<tr>
<td valign="top" align="center">Stephan et al. (<xref ref-type="bibr" rid="B21">21</xref>)</td>
<td valign="top" align="center">Survey (Longitudinal)</td>
<td valign="top" align="center">Four groups<break/>(N &gt; 22,000)</td>
<td valign="top" align="center">Negative</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="center">Kri&#x17e;an and Hisler (<xref ref-type="bibr" rid="B22">22</xref>)</td>
<td valign="top" align="center">Survey + ActiGraph</td>
<td valign="top" align="center">Adults<break/>(N = 382)</td>
<td valign="top" align="center">Negative</td>
<td valign="top" align="center">x</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">x</td>
<td valign="top" align="center">x</td>
</tr>
<tr>
<td valign="top" align="center">Sutin et al. (<xref ref-type="bibr" rid="B23">23</xref>)</td>
<td valign="top" align="center">Diary + ActiGraph</td>
<td valign="top" align="center">Adults<break/>(N = 620)</td>
<td valign="top" align="center">Negative</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">x</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="center">Spears et al. (<xref ref-type="bibr" rid="B9">9</xref>)</td>
<td valign="top" align="center">Survey (Longitudinal)</td>
<td valign="top" align="center">Users (N=3,759)</td>
<td valign="top" align="center">Negative</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">Negative</td>
</tr>
<tr>
<td valign="top" align="center">Mead et al. (<xref ref-type="bibr" rid="B30">30</xref>)</td>
<td valign="top" align="center">ActiGraph</td>
<td valign="top" align="center">College subjects<break/>(N = 358)</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">Negative</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Model 1 assessed whether a post was related to sleep, and Model 2 assessed whether a post indicated a sleep problem. Model 3 assessed FFM personality traits. &#x201c;&#x2013;&#x201d; indicates &#x201c;not related&#x201d;, and &#x201c;x&#x201d; indicates &#x201c;inconsistent&#x201d;.</p>
</fn>
<fn>
<p>O, Openness; C, Conscientiousness; E, Extraversion; A, Agreeableness; N, Neuroticism; CBF-PI, The Chinese Simplified Big Five Personality Inventory as a measure of FFM; Self-reported sleep, PSQI score.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>In regard to the automated assessment of psychological indicators from large-scale semantics, two issues are worth discussing. The first issue is the difficulty of manual text annotation and its impact on model performance. In our study, annotations showed high consistency for labeling &#x201c;sleep-related&#x201d; posts but low consistency for labeling &#x201c;sleep problems&#x201d; due to the complexity of the task. Identifying sleep-related content is straightforward using keywords like &#x201c;sleep&#x201d; and &#x201c;stay up late&#x201d;, whereas assessing sleep problems requires consideration of context and emotions. We initially attempted to annotate the &#x201c;causes&#x201d; and &#x201c;manifestations&#x201d;. However, due to data sparsity (i.e., lack of explicit causes) and complexity (i.e., vague expressions or mixed causes), most annotators labeled the text as &#x201c;unable to determine&#x201d;, leading to a small and low-quality dataset. Consequently, these annotations were not used for further study. For complex psychological indicators, future work could improve training data accuracy and richness by increasing the amount of annotated data, standardizing the annotation process, and recruiting experienced annotators.</p>
<p>Second, controlling the quantity and quality of microblog content is crucial. For example, Tian et&#xa0;al. (<xref ref-type="bibr" rid="B52">52</xref>) found that only 0.37% of posts expressed sleep-related complaints due to the prevalence of advertisements and marketing accounts. Therefore, we carefully screened 923 participants and retained 336 users who had posted a sufficient number of original posts. This ensured a clean high-quality dataset for training the model. Of the 73,735 posts, 3.67% were sleep-related, and 2.15% indicated sleep problems. A unique benefit of our framework is that other researchers can apply our freely available fine-tuned models and datasets to any Chinese post data <xref ref-type="fn" rid="fn2">
<sup>2</sup>
</xref>. After applying the sleep assessment and personality assessment models to the large microblog dataset (users = 13,753), we found that 12,623 users had made 447,600 posts with sleep-related content (11.3% of all posts), and 12,274 users had made 332,600 posts about sleep problems (8.4% of all posts). These data constitute a rich, high-quality sleep-related microblog dataset.</p>
<p>Our approach is not without limitations. From the perspective of model limitations, the personality assessment models performed modestly for neuroticism and extraversion. One reason for this is that these traits may manifest ambiguously on Chinese social media. For instance, posts related to neuroticism often involve indirect expressions of distress (e.g., sarcasm) rather than explicit emotional disclosure, which aligns with findings by Yuan et&#xa0;al. (<xref ref-type="bibr" rid="B42">42</xref>) on cultural differences in personality expression. Extraversion, while theoretically associated with social engagement, could be conflated with performative behaviors online (e.g., frequent but superficial interactions), as noted by Liu and Zhu (<xref ref-type="bibr" rid="B46">46</xref>). Similarly, Cutler and Condon (<xref ref-type="bibr" rid="B48">48</xref>) reported instability in detecting neuroticism from text, attributing it to the trait&#x2019;s context-dependent expression. Another interesting, albeit disappointing, finding was that the relationship between openness and sleep quality was inconsistent across the different datasets. Unlike conscientiousness and extraversion, which are descriptive traits, openness is an evaluative trait, which is more susceptible to instability and, consequently, may yield inconsistent results (<xref ref-type="bibr" rid="B59">59</xref>). Addressing the stability of openness assessments in future studies could enhance our understanding of its relationship with sleep. Future work could integrate multimodal data (e.g., pictures, interaction patterns) to better capture contextual nuances and improve the stability of assessment (<xref ref-type="bibr" rid="B53">53</xref>). Additionally, as our models operate at the post level, the frequency of sleep-related symptoms (e.g., whether a post expresses sleep problems) was not directly incorporated into the deep learning models. Future work could integrate longitudinal data to better capture the frequency and chronicity of symptoms.</p>
<p>Another limitation is that we used a shortened version of the personality questionnaire (i.e., the CBF-PI) for the user survey. Although the CBF-PI has been validated in previous studies, the reduced number of items may have introduced bias in some of the dimensions. Future studies could use the full version and control for other variables that may affect the accuracy of personality assessments. Finally, to explore the relationship between sleep and personality, we used four indicators of sleep characteristics: the number of sleep-related posts, the proportion of sleep-related posts, the number of posts indicating a sleep problem, and the proportion of posts with sleep problems. We found that, without controlling for users&#x2019; overall posting activity, these indicators were not significantly correlated with sleep quality. Future research could explore how to assess sleep quality among inactive users (i.e., those who post rarely or not at all). While our models showed significant correlations with PSQI scores, we did not test their ability to directly predict PSQI scores. This limits conclusions about their potential as proxies for standardized sleep assessments. Further validation is needed to assess this predictive capacity in future work.</p>
<p>The study is based on passive data collection from the public social media platform (Sina Weibo), a topic widely discussed in terms of ethical considerations (<xref ref-type="bibr" rid="B61">61</xref>, <xref ref-type="bibr" rid="B62">62</xref>). For our study, we took the following ethical precautions. First, we submitted the research for approval from the ethics review board and received approval before proceeding. Second, no private messages were accessed during the research process, and all data (e.g., user IDs and post IDs) were anonymized after preprocessing. Third, the goal of this research is to explore patterns across large populations to derive theoretical insights, rather than applying them to psychological interventions at the individual level. Overall, this study adheres to ethical guidelines, including the APA Guidelines for Telepsychology (<xref ref-type="bibr" rid="B63">63</xref>) and the British Psychological Society&#x2019;s guidelines on internet-mediated research (<xref ref-type="bibr" rid="B64">64</xref>). We emphasize that transparent data use disclosures, enhanced data security, and rigorous ethical oversight should be core components of large-scale digital psychological research.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusions</title>
<p>Our findings demonstrate the reliability of big data-driven computational methods for evaluating sleep characteristics and personality traits. Specifically, we found that: (1) conscientiousness, agreeableness, and extraversion are associated with better sleep quality, while neuroticism is linked to poorer sleep quality. (2) When the model trained on a small survey dataset with expert annotations and questionnaires was applied to a large-scale microblog dataset, the sleep-personality relationships remained consistent across datasets. From a theoretical perspective, our work provides a multifaceted approach that integrates computational methods with psychological research, offering new insights into how big data can inform psychological theory. From the perspective of clinical implications, understanding the relationship between personality traits and sleep characteristics can guide personalized interventions. For example, individuals with high neuroticism may benefit from interventions focused on emotional regulation, such as CBT or mindfulness (<xref ref-type="bibr" rid="B65">65</xref>), while those with higher agreeableness, conscientiousness, and extraversion may improve sleep quality with structured routines and social support (<xref ref-type="bibr" rid="B66">66</xref>). Future work could explore the underlying causes of sleep problems expressed in microblogs by overcoming data sparsity through multiple data sources and multimodal data approaches. This would facilitate more comprehensive analysis and lead to more precise and effective sleep interventions tailored to individuals&#x2019; specific needs.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s7" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Faculty of Psychology, Beijing Normal University. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s8" sec-type="author-contributions">
<title>Author contributions</title>
<p>LC: Visualization, Software, Methodology, Conceptualization, Writing &#x2013; original draft. JW: Conceptualization, Data curation, Methodology, Writing &#x2013; original draft. MW: Writing &#x2013; review &amp; editing, Software, Conceptualization, Formal Analysis, Data curation. LZ: Conceptualization, Writing &#x2013; review &amp; editing, Visualization. XW: Writing &#x2013; review &amp; editing, Visualization, Data curation, Conceptualization. BY: Data curation, Writing &#x2013; review &amp; editing, Visualization. QL: Writing &#x2013; review &amp; editing, Project administration, Funding acquisition, Methodology, Conceptualization.</p>
</sec>
<sec id="s9" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This study was funded by the National Natural Science Foundation of China (grant No. 62006022, 62007027, 62306039) and Natural Science Foundation of Hubei Province (grant No. 2023AF8B15).</p>
</sec>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec id="s12" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s13" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpsyt.2025.1596269/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpsyt.2025.1596269/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table1.pdf" id="SF1" mimetype="application/pdf">
<label>Supplementary Table&#xa0;1</label>
<caption>
<p>Correlations between personality traits (CBF-PI scores), PSQI, and model-assessed sleep characteristics in 336 users. O, Openness; C, Conscientiousness; E, Extraversion; A, Agreeableness; N, Neuroticism; PSQI, Pittsburgh Sleep Quality Index; TN, Total Number of Posts; NSR, Number of Sleep-Related Posts; PSR, Proportion of Sleep-Related Posts; NSP, Number of Posts Indicating Sleep Problems; PSP, Proportion of Posts with Sleep Problems; <sup>*</sup>
<italic>p</italic> &lt;.05, <sup>**</sup>
<italic>p</italic> &lt;.01.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Table1.pdf" id="SF2" mimetype="application/pdf">
<label>Supplementary Table&#xa0;2</label>
<caption>
<p>Descriptive statistics of users in the large dataset (users = 13,753, posts = 4,864,600). O, Openness; C, Conscientiousness; E, Extraversion; A, Agreeableness; N, Neuroticism; PSQI, Pittsburgh Sleep Quality Index; M, Mean; SD, Standard Deviation; TN, Total Number of Posts; NSR, Number of Sleep-Related Posts; NSP, Number of Posts Indicating Sleep Problems.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Table1.pdf" id="SF3" mimetype="application/pdf">
<label>Supplementary Table&#xa0;3</label>
<caption>
<p>Descriptive statistics of valid surveyed users (users = 336, posts = 73,735). O, Openness; C, Conscientiousness; E, Extraversion; A, Agreeableness; N, Neuroticism; PSQI, Pittsburgh Sleep Quality Index; M, Mean; SD, Standard Deviation; TN, Total Number of Posts; NSR, Number of Sleep-Related Posts; PSR, Proportion of Sleep-Related Posts; NSP, Number of Posts Indicating Sleep Problems; PSP, Proportion of Posts with Sleep Problems.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="SupplementaryFile1.zip" id="SM1" mimetype="application/zip"/>
</sec>
<fn-group>
<fn id="fn1">
<label>1</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://aishiyan.bnu.edu.cn">https://aishiyan.bnu.edu.cn</ext-link>
</p>
</fn>
<fn id="fn2">
<label>2</label>
<p>
<ext-link ext-link-type="uri" xlink:href="https://pan.bnu.edu.cn/l/l1wLB0">https://pan.bnu.edu.cn/l/l1wLB0</ext-link>
</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Siegel</surname> <given-names>JM</given-names>
</name>
</person-group>. <article-title>Clues to the functions of mammalian sleep</article-title>. <source>Nature</source>. (<year>2005</year>) <volume>437</volume>:<page-range>1264&#x2013;71</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature04285</pub-id>, PMID: <pub-id pub-id-type="pmid">16251951</pub-id></citation></ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>R</given-names>
</name>
<name>
<surname>Mu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<name>
<surname>Cheung</surname> <given-names>FTW</given-names>
</name>
<name>
<surname>Chan</surname> <given-names>NY</given-names>
</name>
<name>
<surname>Chan</surname> <given-names>JWY</given-names>
</name>
<etal/>
</person-group>. <article-title>The relationship between neo-five personality traits and sleep-related characteristics: A systematic review and meta-analysis</article-title>. <source>Sleep Med Rev</source>. (<year>2025</year>) <volume>81</volume>:<fpage>102081</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.smrv.2025.102081</pub-id>, PMID: <pub-id pub-id-type="pmid">40158435</pub-id></citation></ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guerreiro</surname> <given-names>J</given-names>
</name>
<name>
<surname>Schulze</surname> <given-names>L</given-names>
</name>
<name>
<surname>Garcia i Tormo</surname> <given-names>A</given-names>
</name>
<name>
<surname>Henwood</surname> <given-names>AJ</given-names>
</name>
<name>
<surname>Schneider</surname> <given-names>L</given-names>
</name>
<name>
<surname>Krob</surname> <given-names>E</given-names>
</name>
<etal/>
</person-group>. <article-title>The relationship between big five personality traits and sleep patterns: A systematic review</article-title>. <source>Nat Sci Sleep</source>. (<year>2024</year>) <volume>16</volume>:<page-range>1327&#x2013;37</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2147/NSS.S467842</pub-id>, PMID: <pub-id pub-id-type="pmid">39247910</pub-id></citation></ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Akram</surname> <given-names>U</given-names>
</name>
<name>
<surname>Stevenson</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Gardani</surname> <given-names>M</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>S</given-names>
</name>
<name>
<surname>Johann</surname> <given-names>AF</given-names>
</name>
</person-group>. <article-title>Personality and insomnia: A systematic review and narrative synthesis</article-title>. <source>J Sleep Res</source>. (<year>2023</year>) <volume>32</volume>:<elocation-id>e14031</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/jsr.14031</pub-id>, PMID: <pub-id pub-id-type="pmid">37654128</pub-id></citation></ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cappuccio</surname> <given-names>FP</given-names>
</name>
<name>
<surname>D&#x2019;Elia</surname> <given-names>L</given-names>
</name>
<name>
<surname>Strazzullo</surname> <given-names>P</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>MA</given-names>
</name>
</person-group>. <article-title>Quantity and quality of sleep and incidence of type 2 diabetes: A systematic review and meta-analysis</article-title>. <source>Diabetes Care</source>. (<year>2010</year>) <volume>33</volume>:<page-range>414&#x2013;20</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2337/dc09-1124</pub-id>, PMID: <pub-id pub-id-type="pmid">19910503</pub-id></citation></ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gangwisch</surname> <given-names>JE</given-names>
</name>
<name>
<surname>Malaspina</surname> <given-names>D</given-names>
</name>
<name>
<surname>Boden-Albala</surname> <given-names>B</given-names>
</name>
<name>
<surname>Heymsfield</surname> <given-names>SB</given-names>
</name>
</person-group>. <article-title>Inadequate sleep as a risk factor for obesity: analyses of the nhanes i</article-title>. <source>Sleep</source>. (<year>2005</year>) <volume>28</volume>:<page-range>1289&#x2013;96</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/sleep/28.10.1289</pub-id>, PMID: <pub-id pub-id-type="pmid">16295214</pub-id></citation></ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoevenaar-Blom</surname> <given-names>MP</given-names>
</name>
<name>
<surname>Spijkerman</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Kromhout</surname> <given-names>D</given-names>
</name>
<name>
<surname>van den Berg</surname> <given-names>JF</given-names>
</name>
<name>
<surname>Verschuren</surname> <given-names>WMM</given-names>
</name>
</person-group>. <article-title>Sleep duration and sleep quality in relation to 12-year cardiovascular disease incidence: The morgen study</article-title>. <source>Sleep</source>. (<year>2011</year>) <volume>34</volume>:<page-range>1487&#x2013;92</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.5665/sleep.1382</pub-id>, PMID: <pub-id pub-id-type="pmid">22043119</pub-id></citation></ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bubu</surname> <given-names>OM</given-names>
</name>
<name>
<surname>Bakke</surname> <given-names>JR</given-names>
</name>
<name>
<surname>Hogan</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Umasabor-Bubu</surname> <given-names>O</given-names>
</name>
<name>
<surname>Mukhtar</surname> <given-names>FJ</given-names>
</name>
<name>
<surname>Ram</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Disturbed sleep is associated with changes in alzheimer&#x2019;s disease (ad) biomarkers predictive of persons that ultimately develop ad: Findings from subgroup meta-analysis on sleep and alzheimer&#x2019;s disease</article-title>. <source>Sleep</source>. (<year>2017</year>) <volume>40</volume>:<page-range>A430&#x2013;0</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/sleepj/zsx050.1152</pub-id>
</citation></ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Spears</surname> <given-names>SK</given-names>
</name>
<name>
<surname>Montgomery-Downs</surname> <given-names>HE</given-names>
</name>
<name>
<surname>Steinman</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Duggan</surname> <given-names>KA</given-names>
</name>
<name>
<surname>Turiano</surname> <given-names>NA</given-names>
</name>
</person-group>. <article-title>Sleep: A pathway linking personality to mortality risk</article-title>. <source>J Res Pers</source>. (<year>2019</year>) <volume>81</volume>:<fpage>11</fpage>&#x2013;<lpage>24</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jrp.2019.04.007</pub-id>, PMID: <pub-id pub-id-type="pmid">31341341</pub-id></citation></ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cellini</surname> <given-names>N</given-names>
</name>
<name>
<surname>Duggan</surname> <given-names>KA</given-names>
</name>
<name>
<surname>Sarlo</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Perceived sleep quality: The interplay of neuroticism, affect, and hyperarousal</article-title>. <source>Sleep Health</source>. (<year>2017</year>) <volume>3</volume>:<page-range>184&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.sleh.2017.03.001</pub-id>, PMID: <pub-id pub-id-type="pmid">28526256</pub-id></citation></ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buysse</surname> <given-names>DJ</given-names>
</name>
<name>
<surname>Reynolds</surname> <given-names>CF</given-names>
<suffix>III</suffix>
</name>
<name>
<surname>Monk</surname> <given-names>TH</given-names>
</name>
<name>
<surname>Berman</surname> <given-names>SR</given-names>
</name>
<name>
<surname>Kupfer</surname> <given-names>DJ</given-names>
</name>
</person-group>. <article-title>The pittsburgh sleep quality index: A new instrument for psychiatric practice and research</article-title>. <source>Psychiatry Res</source>. (<year>1989</year>) <volume>28</volume>:<fpage>193</fpage>&#x2013;<lpage>213</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0165-1781(89)90047-4</pub-id>, PMID: <pub-id pub-id-type="pmid">2748771</pub-id></citation></ref>
<ref id="B12">
<label>12</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Spielman</surname> <given-names>AJ</given-names>
</name>
<name>
<surname>Glovinsky</surname> <given-names>PB</given-names>
</name>
</person-group>. &#x201c;<article-title>Introduction: The varied nature of insomnia</article-title>&#x201d;. In: <person-group person-group-type="editor">
<name>
<surname>Hauri</surname> <given-names>PJ</given-names>
</name>
</person-group>, editors, <source>Case studies in insomnia</source> (Vol. <volume>1</volume>). <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>. (<year>1991</year>). pp. <page-range>1&#x2013;15</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-1-4757-9586-8_1</pub-id>
</citation></ref>
<ref id="B13">
<label>13</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Grandner</surname> <given-names>MA</given-names>
</name>
</person-group>. &#x201c;<article-title>Epidemiology of insufficient sleep and poor sleep quality</article-title>&#x201d;. In: <person-group person-group-type="editor">
<name>
<surname>Wright</surname> <given-names>KP</given-names>
</name>
<name>
<surname>Castriotta</surname> <given-names>RA</given-names>
</name>
</person-group>, editors, <source>Sleep Disorders Medicine</source>. <publisher-loc>San Diego, CA</publisher-loc>: <publisher-name>Elsevier</publisher-name>. (<year>2019</year>). p. <page-range>11&#x2013;20</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/B978-0-12-815373-4.00002-2</pub-id>
</citation></ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cloninger</surname> <given-names>CR</given-names>
</name>
<name>
<surname>Svrakic</surname> <given-names>DM</given-names>
</name>
<name>
<surname>Przybeck</surname> <given-names>TR</given-names>
</name>
</person-group>. <article-title>A psychobiological model of temperament and character</article-title>. <source>Arch Gen Psychiatry</source>. (<year>1993</year>) <volume>50</volume>:<page-range>975&#x2013;90</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/archpsyc.1993.01820240059008</pub-id>, PMID: <pub-id pub-id-type="pmid">8250684</pub-id></citation></ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cattell</surname> <given-names>RB</given-names>
</name>
</person-group>. <article-title>The description of personality: Basic traits resolved into clusters</article-title>. <source>J Abnormal Soc Psychol</source>. (<year>1949</year>) <volume>44</volume>:<page-range>417&#x2013;41</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/h0051956</pub-id>
</citation></ref>
<ref id="B16">
<label>16</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Eysenck</surname> <given-names>HJ</given-names>
</name>
<name>
<surname>Eysenck</surname> <given-names>SBG</given-names>
</name>
</person-group>. <source>Personality and individual differences: A natural science approach</source>. <publisher-loc>New York, NY</publisher-loc>:<publisher-name>Plenum Press</publisher-name> (<year>1985</year>).</citation></ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krueger</surname> <given-names>RF</given-names>
</name>
<name>
<surname>Derringer</surname> <given-names>J</given-names>
</name>
<name>
<surname>Markon</surname> <given-names>KE</given-names>
</name>
<name>
<surname>Watson</surname> <given-names>D</given-names>
</name>
<name>
<surname>Skodol</surname> <given-names>AE</given-names>
</name>
</person-group>. <article-title>Initial construction of a maladaptive personality trait model and inventory for dsm-5</article-title>. <source>Psychol Med</source>. (<year>2012</year>) <volume>42</volume>:<page-range>1879&#x2013;90</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1017/S0033291711002674</pub-id>, PMID: <pub-id pub-id-type="pmid">22153017</pub-id></citation></ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McCrae</surname> <given-names>RR</given-names>
</name>
<name>
<surname>Costa</surname> <given-names>PT</given-names>
</name>
</person-group>. <article-title>Updating norman&#x2019;s &#x201c;adequate taxonomy&#x201d;: Intelligence and personality dimensions in natural language and in questionnaires</article-title>. <source>J Pers Soc Psychol</source>. (<year>1985</year>) <volume>49</volume>:<page-range>710&#x2013;21</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/0022-3514.49.3.710</pub-id>, PMID: <pub-id pub-id-type="pmid">4045699</pub-id></citation></ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goldberg</surname> <given-names>LR</given-names>
</name>
</person-group>. <article-title>The structure of phenotypic personality traits</article-title>. <source>Am Psychol</source>. (<year>1993</year>) <volume>48</volume>:<fpage>26</fpage>&#x2013;<lpage>34</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/0003-066X.48.1.26</pub-id>
</citation></ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McCrae</surname> <given-names>RR</given-names>
</name>
<name>
<surname>John</surname> <given-names>OP</given-names>
</name>
</person-group>. <article-title>An introduction to the five-factor model and its applications</article-title>. <source>J Pers</source>. (<year>1992</year>) <volume>60</volume>:<fpage>175</fpage>&#x2013;<lpage>215</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1467-6494.1992.tb00970.x</pub-id>, PMID: <pub-id pub-id-type="pmid">1635039</pub-id></citation></ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stephan</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Sutin</surname> <given-names>AR</given-names>
</name>
<name>
<surname>Bayard</surname> <given-names>S</given-names>
</name>
<name>
<surname>Krizan</surname> <given-names>Z</given-names>
</name>
</person-group>. <article-title>Personality and sleep quality: Evidence from four prospective studies</article-title>. <source>Health Psychol</source>. (<year>2018</year>) <volume>37</volume>:<page-range>271&#x2013;81</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/hea0000577</pub-id>, PMID: <pub-id pub-id-type="pmid">29172602</pub-id></citation></ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kri&#x17e;an</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Hisler</surname> <given-names>G</given-names>
</name>
</person-group>. <article-title>Personality and sleep: Neuroticism and conscientiousness predict behaviourally recorded sleep years later</article-title>. <source>Eur J Pers</source>. (<year>2019</year>) <volume>33</volume>:<page-range>133&#x2013;53</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/per.2191</pub-id>
</citation></ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sutin</surname> <given-names>AR</given-names>
</name>
<name>
<surname>Gamaldo</surname> <given-names>AA</given-names>
</name>
<name>
<surname>Stephan</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Strickhouser</surname> <given-names>JE</given-names>
</name>
<name>
<surname>Terracciano</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Personality traits and the subjective and objective experience of sleep</article-title>. <source>Int J Behav Med</source>. (<year>2020</year>) <volume>27</volume>:<page-range>481&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12529-019-09828-w</pub-id>, PMID: <pub-id pub-id-type="pmid">31755033</pub-id></citation></ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sella</surname> <given-names>E</given-names>
</name>
<name>
<surname>Carbone</surname> <given-names>E</given-names>
</name>
<name>
<surname>Toffalini</surname> <given-names>E</given-names>
</name>
<name>
<surname>Borella</surname> <given-names>E</given-names>
</name>
</person-group>. <article-title>Personality traits and sleep quality: The role of sleep-related beliefs</article-title>. <source>Pers Individ Dif</source>. (<year>2020</year>) <volume>156</volume>:<elocation-id>109770</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.paid.2019.109770</pub-id>
</citation></ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saksvik-Lehouillier</surname> <given-names>I</given-names>
</name>
<name>
<surname>Langvik</surname> <given-names>E</given-names>
</name>
<name>
<surname>Saksvik</surname> <given-names>SB</given-names>
</name>
<name>
<surname>Kallestad</surname> <given-names>H</given-names>
</name>
<name>
<surname>Folles&#xf8;</surname> <given-names>HS</given-names>
</name>
<name>
<surname>Austad</surname> <given-names>SB</given-names>
</name>
<etal/>
</person-group>. <article-title>High neuroticism is associated with reduced negative affect following sleep deprivation</article-title>. <source>Pers Individ Dif</source>. (<year>2022</year>) <volume>185</volume>:<fpage>111291</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.paid.2021.111291</pub-id>
</citation></ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leger</surname> <given-names>KA</given-names>
</name>
<name>
<surname>Charles</surname> <given-names>ST</given-names>
</name>
<name>
<surname>Turiano</surname> <given-names>NA</given-names>
</name>
<name>
<surname>Almeida</surname> <given-names>DM</given-names>
</name>
</person-group>. <article-title>Personality and stressor-related affect</article-title>. <source>J Pers Soc Psychol</source>. (<year>2016</year>) <volume>111</volume>:<page-range>917&#x2013;28</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/pspp0000083</pub-id>, PMID: <pub-id pub-id-type="pmid">26796984</pub-id></citation></ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rezaei</surname> <given-names>F</given-names>
</name>
<name>
<surname>Hemmati</surname> <given-names>A</given-names>
</name>
<name>
<surname>Rahmani</surname> <given-names>K</given-names>
</name>
</person-group>. <article-title>Psychobiological personality traits related to sleep disorders and sexual dysfunction: A systematic review and meta-analysis</article-title>. <source>Turkish J Sleep Med</source>. (<year>2021</year>) <volume>8</volume>:<fpage>74</fpage>&#x2013;<lpage>89</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4274/jtsm.galenos.2021.04695</pub-id>
</citation></ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zakiei</surname> <given-names>A</given-names>
</name>
<name>
<surname>Khazaie</surname> <given-names>H</given-names>
</name>
<name>
<surname>Alimoradi</surname> <given-names>M</given-names>
</name>
<name>
<surname>El Rafihi-Ferreira</surname> <given-names>R</given-names>
</name>
<name>
<surname>Moradi</surname> <given-names>M-T</given-names>
</name>
<name>
<surname>Komasi</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Personality and sleep psychopathology: Associations between the dsm-5 maladaptive trait domains and multiple sleep problems in an adult population</article-title>. <source>Pers Ment Health</source>. (<year>2025</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.1002/pmh.70008</pub-id>, PMID: <pub-id pub-id-type="pmid">39905486</pub-id></citation></ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hisler</surname> <given-names>GC</given-names>
</name>
<name>
<surname>Krizan</surname> <given-names>Z</given-names>
</name>
<name>
<surname>DeHart</surname> <given-names>T</given-names>
</name>
</person-group>. <article-title>Does stress explain the effect of sleep on self-control difficulties? a month-long daily diary study</article-title>. <source>Pers Soc Psychol Bull</source>. (<year>2019</year>) <volume>45</volume>:<page-range>864&#x2013;77</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/0146167218798823</pub-id>, PMID: <pub-id pub-id-type="pmid">30319028</pub-id></citation></ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mead</surname> <given-names>MP</given-names>
</name>
<name>
<surname>Persich</surname> <given-names>MR</given-names>
</name>
<name>
<surname>Duggan</surname> <given-names>KA</given-names>
</name>
<name>
<surname>Veronda</surname> <given-names>A</given-names>
</name>
<name>
<surname>Irish</surname> <given-names>LA</given-names>
</name>
</person-group>. <article-title>Big 5 personality traits and intraindividual variability in sleep duration, continuity, and timing</article-title>. <source>Sleep Health</source>. (<year>2021</year>) <volume>7</volume>:<page-range>238&#x2013;45</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.sleh.2020.11.008</pub-id>, PMID: <pub-id pub-id-type="pmid">33436344</pub-id></citation></ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kosinski</surname> <given-names>M</given-names>
</name>
<name>
<surname>Matz</surname> <given-names>SC</given-names>
</name>
<name>
<surname>Gosling</surname> <given-names>SD</given-names>
</name>
<name>
<surname>Popov</surname> <given-names>V</given-names>
</name>
<name>
<surname>Stillwell</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>Facebook as a research tool for the social sciences: Opportunities, challenges, ethical considerations, and practical guidelines</article-title>. <source>Am Psychol</source>. (<year>2015</year>) <volume>70</volume>:<page-range>543&#x2013;56</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/a0039210</pub-id>, PMID: <pub-id pub-id-type="pmid">26348336</pub-id></citation></ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>L</given-names>
</name>
</person-group>. &#x201c;<article-title>Leverage social media for personalized stress detection</article-title>&#x201d;. In: <conf-name>Proceedings of the 28th ACM International Conference on Multimedia</conf-name>. <publisher-name>ACM</publisher-name>. (<year>2020</year>). pp. <page-range>2710&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1145/3394171.3413974</pub-id>
</citation></ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>L</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Li</surname> <given-names>N</given-names>
</name>
</person-group>. &#x201c;<article-title>A meta-learning based stress category detection framework on social media</article-title>&#x201d;. In: <conf-name>Proceedings of the ACM Web Conference 2022</conf-name>. <publisher-name>ACM</publisher-name>. (<year>2022</year>). pp. <page-range>2925&#x2013;35</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1145/3485447.3512015</pub-id>
</citation></ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zeng</surname> <given-names>K</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Li</surname> <given-names>N</given-names>
</name>
<etal/>
</person-group>. &#x201c;<article-title>Contrastive learning of stress-specific word embedding for social media based stress detection</article-title>&#x201d;. In: <conf-name>Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining</conf-name>. <publisher-name>ACM</publisher-name>. (<year>2023</year>). pp. <page-range>5137&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1145/3580305.3599384</pub-id>
</citation></ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zeng</surname> <given-names>K</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Q</given-names>
</name>
<etal/>
</person-group>. &#x201c;<article-title>MISE: Meta-knowledge inheritance for social media-based stressor estimation</article-title>&#x201d;. In: <conf-name>Proceedings of the ACM on Web Conference 2025</conf-name>. <publisher-name>ACM</publisher-name>. (<year>2025</year>). pp. <page-range>1866&#x2013;76</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1145/3589335.3645526</pub-id>
</citation></ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Youyou</surname> <given-names>W</given-names>
</name>
<name>
<surname>Kosinski</surname> <given-names>M</given-names>
</name>
<name>
<surname>Stillwell</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>Computer-based personality judgments are more accurate than those made by humans</article-title>. <source>Proc Natl Acad Sci United States America</source>. (<year>2015</year>) <volume>112</volume>:<page-range>1036&#x2013;40</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1418680112</pub-id>, PMID: <pub-id pub-id-type="pmid">25583507</pub-id></citation></ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>S</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>Predicting user personality with social interactions in weibo</article-title>. <source>Aslib J Inf Manage</source>. (<year>2021</year>) <volume>73</volume>:<page-range>839&#x2013;64</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1108/AJIM-02-2021-0048</pub-id>
</citation></ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Suman</surname> <given-names>C</given-names>
</name>
<name>
<surname>Saha</surname> <given-names>S</given-names>
</name>
<name>
<surname>Gupta</surname> <given-names>A</given-names>
</name>
<name>
<surname>Pandey</surname> <given-names>SK</given-names>
</name>
<name>
<surname>Bhattacharyya</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>A multi-modal personality prediction system</article-title>. <source>Knowledge-Based Syst</source>. (<year>2022</year>) <volume>236</volume>:<elocation-id>107715</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.knosys.2021.107715</pub-id>
</citation></ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khorrami</surname> <given-names>M</given-names>
</name>
<name>
<surname>Khorrami</surname> <given-names>M</given-names>
</name>
<name>
<surname>Farhangi</surname> <given-names>F</given-names>
</name>
</person-group>. <article-title>Evaluation of tree-based ensemble algorithms for predicting the big five personality traits based on social media photos: Evidence from an Iranian sample</article-title>. <source>Pers Individ Dif</source>. (<year>2022</year>) <volume>188</volume>:<elocation-id>111479</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.paid.2021.111479</pub-id>
</citation></ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Philip</surname> <given-names>J</given-names>
</name>
<name>
<surname>Shah</surname> <given-names>D</given-names>
</name>
<name>
<surname>Nayak</surname> <given-names>S</given-names>
</name>
<name>
<surname>Patel</surname> <given-names>S</given-names>
</name>
<name>
<surname>Devashrayee</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>Machine learning for personality analysis based on big five model</article-title>. <source>Adv Intelligent Syst Computing</source>. (<year>2019</year>) <volume>839</volume>:<page-range>345&#x2013;55</page-range>.</citation></ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pennebaker</surname> <given-names>JW</given-names>
</name>
<name>
<surname>Mayne</surname> <given-names>TJ</given-names>
</name>
<name>
<surname>Francis</surname> <given-names>ME</given-names>
</name>
</person-group>. <article-title>Linguistic predictors of adaptive bereavement</article-title>. <source>J Pers Soc Psychol</source>. (<year>1997</year>) <volume>72</volume>:<page-range>863&#x2013;71</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/0022-3514.72.4.863</pub-id>, PMID: <pub-id pub-id-type="pmid">9108699</pub-id></citation></ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yuan</surname> <given-names>C</given-names>
</name>
<name>
<surname>Hong</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Personality expression and recognition in Chinese language usage</article-title>. <source>User Modeling User-Adapted Interaction</source>. (<year>2021</year>) <volume>31</volume>:<page-range>121&#x2013;47</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11257-020-09276-2</pub-id>
</citation></ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mikolov</surname> <given-names>T</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>K</given-names>
</name>
<name>
<surname>Corrado</surname> <given-names>G</given-names>
</name>
<name>
<surname>Dean</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Efficient estimation of word representations in vector space</article-title>. <source>Comput Lang</source>. (<year>2013</year>) <volume>3</volume>.</citation></ref>
<ref id="B44">
<label>44</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Devlin</surname> <given-names>J</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>M-W</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>K</given-names>
</name>
<name>
<surname>Toutanova</surname> <given-names>K</given-names>
</name>
</person-group>. &#x201c;<article-title>BERT: Pre-training of deep bidirectional transformers for language understanding</article-title>&#x201d;. In: <conf-name>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</conf-name>, (Vol. <volume>1</volume>) <publisher-loc>Minneapolis, Minnesota</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name>. (<year>2019</year>). pp. <page-range>4171&#x2013;86</page-range>.</citation></ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bao</surname> <given-names>H</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>X</given-names>
</name>
<name>
<surname>Su</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>Psychological research based on word embedding techniques: Methods and applications</article-title>. <source>Adv Psychol Sci</source>. (<year>2023</year>) <volume>31</volume>:<fpage>887</fpage>&#x2013;<lpage>904</lpage>.</citation></ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>T</given-names>
</name>
</person-group>. <article-title>Deep learning for constructing microblog behavior representation to identify social media user&#x2019;s personality</article-title>. <source>PeerJ Comput Sci</source>. (<year>2016</year>) <volume>2</volume>:<fpage>e81</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.7717/peerj-cs.81</pub-id>
</citation></ref>
<ref id="B47">
<label>47</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mahajan</surname> <given-names>R</given-names>
</name>
<name>
<surname>Mahajan</surname> <given-names>R</given-names>
</name>
<name>
<surname>Sharma</surname> <given-names>E</given-names>
</name>
<name>
<surname>Mansotra</surname> <given-names>V</given-names>
</name>
</person-group>. <article-title>&#x201c;Are we tweeting our real selves?&#x201d; personality prediction of Indian Twitter users using deep learning ensemble model</article-title>. <source>Comput Hum Behav</source>. (<year>2022</year>) <volume>128</volume>:<fpage>107101</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.chb.2021.107101</pub-id>
</citation></ref>
<ref id="B48">
<label>48</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cutler</surname> <given-names>A</given-names>
</name>
<name>
<surname>Condon</surname> <given-names>DM</given-names>
</name>
</person-group>. <article-title>Deep lexical hypothesis: Identifying personality structure in natural language</article-title>. <source>J Pers Soc Psychol</source>. (<year>2023</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.31234/osf.io/gdm5v</pub-id>, PMID: <pub-id pub-id-type="pmid">36395036</pub-id></citation></ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dissing</surname> <given-names>AS</given-names>
</name>
<name>
<surname>Andersen</surname> <given-names>TO</given-names>
</name>
<name>
<surname>N&#xf8;rup</surname> <given-names>LN</given-names>
</name>
<name>
<surname>Clark</surname> <given-names>A</given-names>
</name>
<name>
<surname>Nejsum</surname> <given-names>M</given-names>
</name>
<name>
<surname>Rod</surname> <given-names>NH</given-names>
</name>
</person-group>. <article-title>Daytime and nighttime smartphone use: A study of associations between multidimensional smartphone behaviours and sleep among 24,856 Danish adults</article-title>. <source>J Sleep Res</source>. (<year>2021</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.1111/jsr.13356</pub-id>, PMID: <pub-id pub-id-type="pmid">33899250</pub-id></citation></ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>H</given-names>
</name>
<name>
<surname>Zhuang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>C</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Social media big data-based research on the influencing factors of insomnia and spatiotemporal evolution</article-title>. <source>IEEE Access</source>. (<year>2020</year>) <volume>8</volume>:<page-range>41516&#x2013;29</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/Access.6287639</pub-id>
</citation></ref>
<ref id="B51">
<label>51</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yao</surname> <given-names>X</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>G</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Extracting depressive symptoms and their associations from an online depression community</article-title>. <source>Comput Hum Behav</source>. (<year>2021</year>) <volume>120</volume>:<elocation-id>106734</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.chb.2021.106734</pub-id>
</citation></ref>
<ref id="B52">
<label>52</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tian</surname> <given-names>X</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>G</given-names>
</name>
<name>
<surname>He</surname> <given-names>F</given-names>
</name>
</person-group>. <article-title>An analysis of sleep complaints on Sina Weibo</article-title>. <source>Comput Hum Behav</source>. (<year>2016</year>) <volume>62</volume>:<page-range>230&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.chb.2016.04.014</pub-id>
</citation></ref>
<ref id="B53">
<label>53</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stachl</surname> <given-names>C</given-names>
</name>
<name>
<surname>Pargent</surname> <given-names>F</given-names>
</name>
<name>
<surname>Hilbert</surname> <given-names>S</given-names>
</name>
<name>
<surname>Harari</surname> <given-names>GM</given-names>
</name>
<name>
<surname>Schoedel</surname> <given-names>R</given-names>
</name>
<name>
<surname>Vaid</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Personality research and assessment in the era of machine learning</article-title>. <source>Eur J Pers</source>. (<year>2020</year>) <volume>34</volume>:<page-range>613&#x2013;31</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/per.2257</pub-id>
</citation></ref>
<ref id="B54">
<label>54</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>MC</given-names>
</name>
<name>
<surname>He</surname> <given-names>L</given-names>
</name>
<name>
<surname>Jie</surname> <given-names>L</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>The development and psychometric evaluation of the Chinese Big Five Personality Inventory-15</article-title>. <source>PloS One</source>. (<year>2019</year>) <volume>14</volume>(<issue>8</issue>):<elocation-id>e0221621</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0221621</pub-id>, PMID: <pub-id pub-id-type="pmid">31454383</pub-id></citation></ref>
<ref id="B55">
<label>55</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hochreiter</surname> <given-names>S</given-names>
</name>
<name>
<surname>Schmidhuber</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Long short-term memory</article-title>. <source>Neural Comput</source>. (<year>1997</year>) <volume>9</volume>:<page-range>1735&#x2013;80</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1162/neco.1997.9.8.1735</pub-id>, PMID: <pub-id pub-id-type="pmid">9377276</pub-id></citation></ref>
<ref id="B56">
<label>56</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y-K</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>S</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>ERNIE: Enhanced representation through knowledge integration</article-title>. (<year>2019</year>).</citation></ref>
<ref id="B57">
<label>57</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Mohammadi</surname> <given-names>S</given-names>
</name>
<name>
<surname>Chapon</surname> <given-names>M</given-names>
</name>
</person-group>. &#x201c;<article-title>Investigating the performance of fine-tuned text classification models based-on BERT</article-title>.&#x201d; In: <conf-name>Proceedings of the 2020 IEEE 22nd International Conference on High Performance Computing and Communications; IEEE 18th International Conference on Smart City; IEEE 6th International Conference on Data Science and Systems (HPCC/SmartCity/DSS)</conf-name>, (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>). (<year>2020</year>). pp. <page-range>1252&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/HPCC/SmartCity/DSS50907.2020.00170</pub-id>
</citation></ref>
<ref id="B58">
<label>58</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arab Mohebi Shahrabi</surname> <given-names>A</given-names>
</name>
<name>
<surname>Mortazavi Nasiri</surname> <given-names>F</given-names>
</name>
<name>
<surname>Pakdaman</surname> <given-names>S</given-names>
</name>
<name>
<surname>Sadatian</surname> <given-names>S</given-names>
</name>
<name>
<surname>Madani</surname> <given-names>F</given-names>
</name>
</person-group>. <article-title>A study on factor structure and validation of social reward questionnaire in Iranian youth</article-title>. <source>Int J Behav Sci</source>. (<year>2017</year>) <volume>11</volume>:<fpage>96</fpage>&#x2013;<lpage>100</lpage>.</citation></ref>
<ref id="B59">
<label>59</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vazire</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Who knows what about a person? The self&#x2013;other knowledge asymmetry (SOKA) model</article-title>. <source>J Pers Soc Psychol</source>. (<year>2010</year>) <volume>98</volume>:<fpage>281</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/a0017908</pub-id>, PMID: <pub-id pub-id-type="pmid">20085401</pub-id></citation></ref>
<ref id="B60">
<label>60</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hintsanen</surname> <given-names>M</given-names>
</name>
<name>
<surname>Puttonen</surname> <given-names>S</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>K</given-names>
</name>
<name>
<surname>T&#xf6;rnroos</surname> <given-names>M</given-names>
</name>
<name>
<surname>Jokela</surname> <given-names>M</given-names>
</name>
<name>
<surname>Pulkki-R&#xe5;back</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>Five-factor personality traits and sleep: Evidence from two population-based cohort studies</article-title>. <source>Health Psychol</source>. (<year>2014</year>) <volume>33</volume>:<page-range>1214&#x2013;23</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/hea0000105</pub-id>, PMID: <pub-id pub-id-type="pmid">25133841</pub-id></citation></ref>
<ref id="B61">
<label>61</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zimmer</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>&#x201c;But the data is already public&#x201d;: On the ethics of research in Facebook</article-title>. <source>Ethics Inf Technol</source>. (<year>2010</year>) <volume>12</volume>:<page-range>313&#x2013;25</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10676-010-9227-5</pub-id>
</citation></ref>
<ref id="B62">
<label>62</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mikal</surname> <given-names>JP</given-names>
</name>
<name>
<surname>Hurst</surname> <given-names>S</given-names>
</name>
<name>
<surname>Conway</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Ethical issues in using Twitter for public health surveillance and research: Developing a taxonomy of ethical concepts from the research literature</article-title>. <source>J Med Internet Res</source>. (<year>2016</year>) <volume>18</volume>:<fpage>e218</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2196/jmir.5597</pub-id>, PMID: <pub-id pub-id-type="pmid">25533619</pub-id></citation></ref>
<ref id="B63">
<label>63</label>
<citation citation-type="web">
<person-group person-group-type="author">
<collab>American Psychological Association</collab>
</person-group>. <article-title>Guidelines for the practice of telepsychology</article-title> (<year>2013</year>). Available online at: <uri xlink:href="https://www.apa.org/practice/guidelines/telepsychology">https://www.apa.org/practice/guidelines/telepsychology</uri> (Accessed <access-date>June 29, 2025</access-date>).</citation></ref>
<ref id="B64">
<label>64</label>
<citation citation-type="web">
<person-group person-group-type="author">
<collab>British Psychological Society</collab>
</person-group>. <article-title>Ethics guidelines for internet-mediated research (inf206/04.2017)</article-title> (<year>2017</year>). Available online at: <uri xlink:href="https://www.bps.org.uk/news-and-policy">https://www.bps.org.uk/news-and-policy</uri> (Accessed <access-date>June 29, 2025</access-date>).</citation></ref>
<ref id="B65">
<label>65</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>H&#xfc;lsheger</surname> <given-names>UR</given-names>
</name>
<name>
<surname>Alberts</surname> <given-names>HJEM</given-names>
</name>
<name>
<surname>Feinholdt</surname> <given-names>A</given-names>
</name>
<name>
<surname>Lang</surname> <given-names>JWB</given-names>
</name>
</person-group>. <article-title>Benefits of mindfulness at work: The role of mindfulness in emotion regulation, emotional exhaustion, and job satisfaction</article-title>. <source>J Appl Psychol</source>. (<year>2013</year>) <volume>98</volume>:<page-range>310&#x2013;25</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1037/a0031313</pub-id>, PMID: <pub-id pub-id-type="pmid">23276118</pub-id></citation></ref>
<ref id="B66">
<label>66</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Erzen</surname> <given-names>E</given-names>
</name>
<name>
<surname>Ozabaci</surname> <given-names>N</given-names>
</name>
</person-group>. <article-title>Effects of personality traits, social support and self-efficacy on predicting university adjustment</article-title>. <source>Front Psychol</source>. (<year>2023</year>) <volume>14</volume>:<elocation-id>1050</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpsyg.2023.1050</pub-id>
</citation></ref>
</ref-list>
</back>
</article>