<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Psychology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1664-1078</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyg.2026.1762573</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Measuring scientific creative thinking: development and validation of a process-oriented instrument</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Lu</surname>
<given-names>Huanhuan</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3303664"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mi</surname>
<given-names>Shuaishuai</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2652267"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Bi</surname>
<given-names>Hualin</given-names>
</name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3307930"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>School of Education, Shandong Women&#x2019;s University</institution>, <city>Jinan</city>, <state>Shandong</state>, <country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>School of Physics and Electronics, Shandong Normal University</institution>, <city>Jinan</city>, <state>Shandong</state>, <country country="cn">China</country></aff>
<aff id="aff3"><label>3</label><institution>College of Chemistry, Engineering and Materials Science, Shandong Normal University</institution>, <city>Jinan</city>, <state>Shandong</state>, <country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>&#x002A;</label>Correspondence: Hualin Bi, <email xlink:href="mailto:bihualin@sdnu.edu.cn">bihualin@sdnu.edu.cn</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-03">
<day>03</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>17</volume>
<elocation-id>1762573</elocation-id>
<history>
<date date-type="received">
<day>07</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>16</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>17</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2026 Lu, Mi and Bi.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Lu, Mi and Bi</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-03">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Scientific creative thinking (SCT) is a critical cognitive process that drives scientific discovery and innovation. To address the limitations of existing assessment tools in capturing its multi-stage, domain-specific nature, this study developed and validated the Scientific Creative Thinking Scale (SCTS). Grounded in an integrative psychological framework, the SCTS combines explicit indicators of divergent thinking with implicit theories of within-domain appropriateness. The scale employs three open-ended tasks based on real-world scientific scenarios to systematically assess the three core stages of SCT: problem identification, hypothesis construction, and experimental verification. Using a two-stage independent sample design with 401 tenth-grade students, the scale was rigorously validated. Exploratory factor analysis (<italic>n</italic>&#x202F;=&#x202F;182) employing Principal Axis Factoring (PAF) with parallel analysis extracted a stable three-factor structure, accounting for 70.189% of the total variance. Confirmatory factor analysis with an independent sample (<italic>n</italic>&#x202F;=&#x202F;219) confirmed the three-factor model with good fit indices (CFI&#x202F;=&#x202F;0.948, TLI&#x202F;=&#x202F;0.922, RMSEA&#x202F;=&#x202F;0.076, SRMR&#x202F;=&#x202F;0.032). The scale demonstrated robust reliability: internal consistency was satisfactory (Cronbach&#x2019;s <italic>&#x03B1;</italic>&#x202F;=&#x202F;0.87; McDonald&#x2019;s <italic>&#x03C9;</italic>&#x202F;=&#x202F;0.89), and inter-rater reliability was excellent (ICC&#x202F;&#x2265;&#x202F;0.95). Composite reliability for each dimension exceeded 0.86, and average variance extracted exceeded 0.67, indicating good convergent validity. The Fornell-Larcker criterion was met, as the square root of AVE for each dimension exceeded its correlations with other factors, supporting discriminant validity. Additionally, the SCTS total score showed a significant positive correlation with science academic achievement (<italic>&#x03C1;</italic>&#x202F;=&#x202F;0.55, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.001), providing preliminary evidence for criterion-related validity. This study offers a process-oriented, psychometrically sound instrument for measuring SCT, laying a methodological foundation for future research on its cognitive mechanisms, individual differences, and developmental trajectories.</p>
</abstract>
<kwd-group>
<kwd>cognitive process</kwd>
<kwd>instrument development</kwd>
<kwd>process-oriented assessment</kwd>
<kwd>psychometrics</kwd>
<kwd>scientific creative thinking</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This work was supported by the 2024 Key Planning Project of Educational Research from the Chinese Society of Education (Grant No. 202416299817A): Research on the Practical Path of Cultivating Higher-Order Chemical Thinking from the Perspective of Core Competency, and additionally by the Scientific Research Fund for High-level Talents at Shandong Women&#x2019;s University (Grant No. 2023RCYJ15).</funding-statement>
</funding-group>
<counts>
<fig-count count="1"/>
<table-count count="9"/>
<equation-count count="0"/>
<ref-count count="47"/>
<page-count count="11"/>
<word-count count="8875"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Educational Psychology</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Contemporary human society is confronted with a series of complex challenges, including climate change, public health crises, artificial intelligence ethics, and energy sustainability. These challenges are often characterized by their cross-disciplinary boundaries, uncertainty, and intricate structures (<xref ref-type="bibr" rid="ref13">Clark and Wallace, 2015</xref>; <xref ref-type="bibr" rid="ref37">Steiner, 2025</xref>). Addressing such problems requires individuals not only to integrate information and perspectives from diverse disciplines but also to propose solutions that transcend conventional approaches, and ultimately to translate these ideas into concrete, actionable plans. The core of Scientific Creative Thinking (SCT) lies precisely in generating high-quality, original, and elegant solutions to such complex, novel, and ill-defined scientific problems (<xref ref-type="bibr" rid="ref27">Mumford et al., 2012</xref>; <xref ref-type="bibr" rid="ref6">Ayas and Sak, 2014</xref>). Therefore, SCT not only serves as the core cognitive foundation of individual scientific creativity but also constitutes a fundamental competence for addressing global societal challenges, driving technological progress, and fostering sustainable social development (<xref ref-type="bibr" rid="ref38">Steiner et al., 2015</xref>; <xref ref-type="bibr" rid="ref33">Saleh and Brem, 2023</xref>).</p>
<p>From a cognitive psychology perspective, scientific creativity is far from a vague, holistic concept; it is a decomposable, multi-stage cognitive process. A central methodological challenge, however, lies in externalizing and objectively measuring this complex internal mental activity. The lack of precise measurement tools constrains both the assessment of individual differences in scientific creative potential and deeper investigation into the fundamental question of how creativity emerges. Therefore, developing a theoretically grounded, process-oriented assessment tool with sound psychometric properties is not merely an applied need, but foundational work essential for advancing cognitive theories of creativity and bridging the gap between neural mechanisms and observable behavior.</p>
<p>Despite significant advances in creativity research (<xref ref-type="bibr" rid="ref9">Beghetto and Kaufman, 2010</xref>; <xref ref-type="bibr" rid="ref42">Treffinger et al., 2001</xref>), measurement tools specifically designed for SCT remain relatively scarce. Existing instruments exhibit two primary limitations. First, regarding process completeness, most tools fail to systematically cover the core cognitive stages of scientific creative activity. Domain-general instruments, such as the Torrance Tests of Creative Thinking (TTCT) (<xref ref-type="bibr" rid="ref41">Torrance, 1974</xref>), possess sound psychometric properties. However, their abstract tasks are detached from authentic scientific inquiry practices and thus struggle to capture the distinctive thinking characteristics inherent to the scientific domain, raising concerns about their ecological and construct validity (<xref ref-type="bibr" rid="ref46">Zeng et al., 2011</xref>). While domain-specific tests represent an improvement, they still exhibit limitations. Early instruments, such as the tasks designed by <xref ref-type="bibr" rid="ref17">Hu and Adey (2002)</xref> (e.g., &#x201C;unusual uses,&#x201D; &#x201C;product improvement&#x201D;), did not adequately simulate the authentic research processes through which scientists systematically explore natural phenomena. Subsequent instruments have deepened aspects such as hypothesis generation and experimental design (<xref ref-type="bibr" rid="ref32">Sak and Ayas, 2013</xref>; <xref ref-type="bibr" rid="ref5">Atesgoz and Sak, 2021</xref>; <xref ref-type="bibr" rid="ref45">Yurt, 2025</xref>) and have introduced advances in assessment techniques (<xref ref-type="bibr" rid="ref43">Weng et al., 2025</xref>). However, they have generally overlooked the critical front-end stage of problem identification (<xref ref-type="bibr" rid="ref14">Einstein and Infeld, 1938</xref>). Research indicates that problem-finding ability may be even more strongly correlated with creativity than problem-solving; problem finding is not only a key component of the creative process but can also be reliably assessed (<xref ref-type="bibr" rid="ref11">Chand and Runco, 1993</xref>). An ideal assessment instrument should encompass all critical stages of the creative process (<xref ref-type="bibr" rid="ref46">Zeng et al., 2011</xref>).</p>
<p>Second, regarding assessment dimensions, existing instruments inadequately capture the core creativity element of appropriateness (<xref ref-type="bibr" rid="ref32">Sak and Ayas, 2013</xref>; <xref ref-type="bibr" rid="ref5">Atesgoz and Sak, 2021</xref>; <xref ref-type="bibr" rid="ref45">Yurt, 2025</xref>; <xref ref-type="bibr" rid="ref43">Weng et al., 2025</xref>). The scoring systems of these tools either treat appropriateness merely as a preliminary screening threshold for response plausibility or as a localized feature of a specific stage within SCT. They fail to recognize appropriateness as a core dimension that permeates and profoundly influences the entire scientific creative process. However, within the scientific context, &#x201C;appropriateness&#x201D; carries a richer meaning extending beyond general &#x201C;plausibility.&#x201D; It encompasses the research value of the problem, the testability of the hypothesis, the fundamental fit of the explanation, and the sophistication of the method. Judgments on these elements are highly dependent on the implicit norms and knowledge systems embedded within the scientific community.</p>
<p>To address these research gaps, this study aims to develop and validate the SCTS grounded in an explicit process model, from the perspectives of cognitive psychology and psychometrics. Compared to existing instruments, the SCTS offers three main improvements. First, framed around the complete scientific creative process, it formally incorporates problem identification as a core assessment component. Second, it elevates appropriateness to a core dimension parallel to novelty, operationalizing it based on the specific scientific creative process. Third, it enhances ecological validity by using authentic scientific scenarios as a thread, constructing task prototypes around fundamental scientific principles that require participants to engage in coherent creative thinking activities. In summary, the SCTS aims to provide an assessment approach for measuring SCT that offers greater process completeness and contextual relevance.</p>
<p>Based on this, the central research question this study seeks to answer is: What empirical evidence exists for the reliability and validity of the developed SCTS?</p>
</sec>
<sec id="sec2">
<label>2</label>
<title>Theoretical foundation</title>
<p>This study is grounded in the established scholarly consensus that defines &#x201C;creativity&#x201D; as the ability to produce outcomes that are both novel and appropriate (<xref ref-type="bibr" rid="ref40">Sternberg and Lubart, 1996</xref>; <xref ref-type="bibr" rid="ref29">Piffer, 2012</xref>; <xref ref-type="bibr" rid="ref30">Plucker et al., 2004</xref>). Scientific creativity, specifically, refers to the capacity to generate novel ideas or products that are relevant and scientifically useful within a given context (<xref ref-type="bibr" rid="ref6">Ayas and Sak, 2014</xref>). Building on this foundation, the present study operationally defines SCT as the structured cognitive process of exploring and understanding the natural world, aimed at generating solutions to problems that are both novel (unique, unconventional) and appropriate (consistent with scientific norms, logically rigorous, and testable). The construction of the assessment framework is informed by the following core theoretical pillars.</p>
<sec id="sec3">
<label>2.1</label>
<title>Domain specificity and the hierarchical nature of creativity</title>
<p>Research indicates that the manifestation and assessment of creativity are significantly domain-dependent (<xref ref-type="bibr" rid="ref8">Baer, 1998</xref>; <xref ref-type="bibr" rid="ref35">Silvia et al., 2009</xref>). This specificity is primarily evidenced in three ways. First, creative thinking is highly reliant on a domain-specific knowledge base. The organization, accessibility, and fluent application of this knowledge profoundly influence the generation and quality of creative outputs (<xref ref-type="bibr" rid="ref1">Alexander, 1992</xref>; <xref ref-type="bibr" rid="ref16">Feldhusen, 2006</xref>; <xref ref-type="bibr" rid="ref25">Mayer, 2006</xref>). Second, creative activities in different domains systematically demand distinct psychological characteristics and dominant cognitive modes. For instance, scientific creativity emphasizes logical reasoning and empirical verification, whereas artistic creativity relies more on esthetic perception and emotional expression (<xref ref-type="bibr" rid="ref21">Kind and Kind, 2007</xref>); this difference is also reflected in the personality traits of creative individuals (<xref ref-type="bibr" rid="ref16">Feldhusen, 2006</xref>). Third, cognitive neuroscience provides mechanistic evidence for domain specificity. For example, while scientific and artistic creativity share some foundational neural networks, they specifically activate brain regions associated with logical reasoning and problem-driven processing (e.g., cingulate gyrus) and those related to novelty-seeking and perceptual information processing (e.g., temporal lobe), respectively (<xref ref-type="bibr" rid="ref34">Shen et al., 2010</xref>). Therefore, effective measurement of scientific creativity must be grounded in its unique domain-specific norms, knowledge systems, and cognitive logic.</p>
<p>Simultaneously, creative performance exists at different levels of maturity and recognition. <xref ref-type="bibr" rid="ref20">Kaufman and Beghetto (2009)</xref> Four C model provides a key framework here, notably by articulating the concept of &#x201C;mini-c&#x201D; creativity&#x2014;the novel and personally meaningful interpretations constructed by individuals during learning and experience. The SCTS developed in this study is designed to measure precisely this developmental cognitive process, corresponding to the &#x201C;mini-c&#x201D; level as exhibited during scientific problem-solving. This focus ensures the tool&#x2019;s sensitivity to intrinsic, nascent creative thinking activities rather than solely to mature, publicly acknowledged creative products. Accordingly, SCTS tasks are not designed to simulate high-difficulty scientific discovery but use authentic, relatable scenarios to elicit learners&#x2019; scientific inquiry, thereby tapping into the personalized creative potential within their thought processes.</p>
</sec>
<sec id="sec4">
<label>2.2</label>
<title>A three-stage cognitive process model of scientific creative thinking</title>
<p>Scientific creativity is fundamentally a structured, domain-specific form of complex problem-solving. It involves systematic cognitive exploration within a defined &#x201C;problem space,&#x201D; employing various strategies to transform an initial problem state into a desired goal state (<xref ref-type="bibr" rid="ref36">Simon, 1977</xref>). Synthesizing analyses of scientific discovery (<xref ref-type="bibr" rid="ref24">Mansfield and Busse, 1981</xref>; <xref ref-type="bibr" rid="ref22">Klahr and Dunbar, 1988</xref>; <xref ref-type="bibr" rid="ref10">Bliersbach and Reiners, 2017</xref>), this study proposes a three-stage SCT process model, deconstructing the continuous flow of creative thought into observable and assessable cognitive units:</p>
<p>
<list list-type="bullet">
<list-item>
<p>Problem Identification. This stage requires the thinker to detect anomalies, contradictions, gaps in knowledge, or potential, underexplored research value within complex natural or experimental phenomena with high sensitivity and insight. The core cognitive task is to precisely refine and define these vague perceptions or initial curiosities into clear, specific, and investigable scientific questions. This stage reflects cognitive sensitivity and insightfulness.</p>
</list-item>
<list-item>
<p>&#x00B7;Hypothesis Construction. Based on the identified problem, the thinker needs to mobilize their existing knowledge base, scientific theoretical frameworks, intuitive hunches, or cross-domain analogies to generate one or more speculative explanations or solutions&#x2014;that is, scientific hypotheses&#x2014;that possess explanatory power and are, in principle, testable. This stage embodies the generative, associative, and explanatory aspects of thinking.</p>
</list-item>
<list-item>
<p>Experimental Verification. The thinker designs and rigorously implements corresponding empirical testing plans. This typically involves carefully constructed experiments but can also extend to systematic observation, computer simulation, and other scientific methods. This stage emphasizes the critical, logical, and empirically-oriented nature of thinking.</p>
</list-item>
</list>
</p>
</sec>
<sec id="sec5">
<label>2.3</label>
<title>Implicit theories of creativity</title>
<p>To construct a comprehensive framework for assessing SCT, particularly to capture its indispensable &#x201C;appropriateness&#x201D; dimension, this study introduces implicit theories of creativity as a core theoretical basis. This theory posits that within a specific domain (e.g., science), knowledgeable practitioners (e.g., scientists or science teachers) can make stable and valid judgments about the quality of creative products based on their internalized, shared standards and consensus regarding &#x201C;what constitutes good creative work in that domain&#x201D; (<xref ref-type="bibr" rid="ref39">Sternberg, 1985</xref>). This provides the methodological foundation for this study&#x2019;s assessment of &#x201C;appropriateness.&#x201D; Based on this theory, the SCTS establishes &#x201C;appropriateness&#x201D; as a core, judgeable construct that permeates all stages of SCT. In the scientific context, its connotation is specifically manifested as research value, essence, testability, and effectiveness. This ensures the assessment attends not only to the novelty and quantity of ideas but also to their conformity with the internal logic and norms of scientific inquiry, thereby enhancing the domain-specific explanatory power and ecological validity of the measurement tool.</p>
</sec>
</sec>
<sec id="sec6">
<label>3</label>
<title>Conceptual framework</title>
<p>Based on the three-stage cognitive process model of SCT, this study constructed an integrative conceptual framework (<xref ref-type="fig" rid="fig1">Figure 1</xref>). This framework aims to systematically elucidate the core constitutive dimensions of SCT and the principles underlying its assessment, integrating explicit indicators of divergent thinking with implicit criteria of scientific appropriateness. Specifically, the divergent thinking indicators, derived from the classic theory of Guilford and others, are used to quantify the generative characteristics of thinking outputs (such as fluency and flexibility). The scientific appropriateness criteria, grounded in domain-specific implicit theories, are applied through qualitative judgments by knowledgeable raters to assess the fitness of thinking products with scientific logic and empirical norms.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Conceptual framework of scientific creative thinking.</p>
</caption>
<graphic xlink:href="fpsyg-17-1762573-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Diagram illustrating a cyclic process with three main stages: problem identification, hypothesis construction, and experimental verification, each linked by arrows and associated with evaluation criteria listed beside each transition.</alt-text>
</graphic>
</fig>
<p>Concretely, the framework is organized around the following three stages and their core dimensions:</p>
<p>
<list list-type="bullet">
<list-item>
<p>In the Problem Identification stage, the core dimensions include: (1) Uniqueness, which refers to proposing questions with a frequency of occurrence below 10% among all participants (referring to the definition by <xref ref-type="bibr" rid="ref19">Hu and Han, 2006</xref>). Due to differences in the phenomenological features and scientific principles underlying the three task scenarios, the questions posed by students are context-specific, therefore, uniqueness is calculated separately for each scenario and is not aggregated across scenarios; (2) Value, judged by raters based on implicit theory, focusing on whether the question is purposefully clear, conducive to critical inquiry, and touches the essence of the phenomenon, serving as the core indicator of appropriateness for this stage; and (3) Quantity of Questions, directly reflecting the fluency of thinking.</p>
</list-item>
<list-item>
<p>In the Hypothesis Construction stage, the core dimensions include: (1) Essentiality, meaning whether the hypothesis aims to explain the core internal mechanism of the problem, judged by raters as a key manifestation of appropriateness in this stage; (2) Verifiability, referring to whether the hypothesis can, in principle, be tested through experiment or observation, also a key dimension of appropriateness; and (3) Quantity of Hypotheses, reflecting the flexibility of thinking.</p>
</list-item>
<list-item>
<p>In the Experimental Verification stage, the core dimensions include: (1) Effectiveness, meaning whether the designed plan can logically and rigorously test the target hypothesis, judged by raters as constituting the core of appropriateness for this stage; (2) Elaboration, assessing whether the plan is clear, specific, operational, and contains well-defined variables and control steps; and (3) Quantity of Verification Methods, used to measure the fluency of solution generation.</p>
</list-item>
</list>
</p>
</sec>
<sec id="sec7">
<label>4</label>
<title>Research method</title>
<sec id="sec8">
<label>4.1</label>
<title>Instrument development</title>
<p>Based on the conceptual framework of SCT, this study employed open-ended questions for assessment. Participants were presented with a thought-provoking, real-world problem scenario and asked to complete a response encompassing problem identification, hypothesis construction, and experimental verification. The design of such creative problem-solving tasks adhered to two key principles: first, the scenario must be related to curriculum standards to ensure the relevance of the assessment to students&#x2019; science learning experiences; second, the scenario itself must not be the central focus of any instructional unit to prevent the creativity measurement from devolving into a knowledge test (<xref ref-type="bibr" rid="ref15">Enger and Yager, 1998</xref>).</p>
<p>Guided by these principles, this study designed three core open-ended task scenarios to elicit and assess the key cognitive processes of SCT. All selected scenarios were drawn from everyday life and closely linked to fundamental scientific principles, aiming to ensure ecological validity while avoiding direct testing of specific scientific knowledge.</p>
<p>Scenario 1, &#x201C;Candle Combustion,&#x201D; involves a widely recognized phenomenon encompassing multiple scientific concepts such as combustion conditions, changes in states of matter, chemical reactions, and gas composition. It provides participants with an open-structured platform for multi-faceted exploration.</p>
<p>Scenario 2, &#x201C;Apple Discoloration,&#x201D; is based on the common phenomenon of enzymatic browning (the browning of a cut apple surface in air). The process implies a wealth of investigable scientific questions, effectively stimulating conjecture and testing regarding the underlying chemical and biological mechanisms.</p>
<p>Scenario 3, &#x201C;Steamed Bun Fermentation,&#x201D; concretizes microbial activity and chemical changes by presenting differences in dough state under varying fermentation conditions. It involves biological and chemical principles of the fermentation process, offering participants another authentic, relatable, and deeply investigable problem space.</p>
<p>For each scenario, participants sequentially completed three continuous cognitive tasks: (1) Problem Identification: based on the presented scenario, list all scientific questions of interest, then independently select the one deemed most valuable for research as the core for subsequent thinking; (2) Hypothesis Construction: for the chosen problem, propose as many possible explanations as possible and formulate testable hypotheses; (3) Experimental Verification: select one of the proposed hypotheses and design a specific, operational experimental plan to verify its plausibility. Given the study&#x2019;s focus on measuring the cognitive process of SCT and the practical constraints of large-scale testing, the &#x201C;Experimental Verification&#x201D; section focused on the conception and design of the experimental plan, not involving subsequent steps such as hands-on operation, data collection, or analysis.</p>
</sec>
<sec id="sec9">
<label>4.2</label>
<title>Scoring rubric</title>
<p>The scoring for this study was based on the fundamental principle of the Consensual Assessment Technique, whereby experts familiar with a specific domain can make independent and reliable subjective judgments about the novelty and appropriateness of creative products based on their internalized creativity standards (<xref ref-type="bibr" rid="ref2">Amabile, 1982</xref>). However, because assessing &#x201C;appropriateness&#x201D; in scientific contexts involves more complex domain-specific judgments, this study introduced a structured rater training component on top of the classic technique. The focus of the training was to establish a unified understanding among raters regarding the operational definitions of core constructs like &#x201C;research value&#x201D; and &#x201C;essence,&#x201D; rather than prescribing specific answers. This approach aimed to maintain judgments grounded in professional implicit consensus while enhancing inter-rater consistency, thereby achieving a balance between ecological validity and measurement reliability.</p>
<p>During the process of frequency calculation and scoring, responses that were semantically equivalent (i.e., expressed in different wording but referring to the same scientific question) were consolidated by the raters. Specifically, two raters first independently conducted preliminary coding for each response, then reached a consensus through discussion to identify responses addressing the same question in the following cases: (1) responses using different sentence structures but conveying the same core inquiry (e.g., &#x201C;Why does the apple turn yellow?&#x201D; and &#x201C;What is the reason for the apple turning yellow?&#x201D;); (2) responses posing detailed follow-up questions about the same phenomenon that essentially target the same underlying mechanism (e.g., &#x201C;Why does it start turning yellow from the middle?&#x201D; and &#x201C;Whether the discoloration begins at the center?&#x201D;). In cases of disagreement, a third subject matter expert was invited to provide arbitration, ensuring the accuracy of frequency statistics and the consistency of scoring.</p>
</sec>
<sec id="sec10">
<label>4.3</label>
<title>Pilot testing and scale revision</title>
<p>This stage involved a systematic examination of the initial version of the SCTS through a small-scale pilot test. The purpose was to evaluate item quality, scoring procedures, and preliminary validity, leading to subsequent revisions.</p>
<sec id="sec11">
<label>4.3.1</label>
<title>Pilot sample and procedure</title>
<p>The pilot testing involved 43 tenth-grade students from a key high school in a city in Shandong Province. Following the test, retrospective interviews were conducted with a subset of students. The interviews employed a &#x201C;think-aloud&#x201D; method, requiring students to verbally report their thought processes while completing each task scenario, including: how they understood the scenario description, how they identified problems, the basis on which they formulated hypotheses, and how they conceived experimental designs. The interviews were audio-recorded and subsequently transcribed. Two researchers independently analyzed the transcripts to confirm the inherent alignment between students&#x2019; responses and the constructs the scale intended to measure. Additionally, item analysis was conducted on the pilot data to examine the scale&#x2019;s comprehensibility, feasibility, and item quality.</p>
</sec>
<sec id="sec12">
<label>4.3.2</label>
<title>Pilot results and revision</title>
<sec id="sec13">
<label>4.3.2.1</label>
<title>Face validity and item quality</title>
<p>The think-aloud protocols provided evidence for the scale&#x2019;s face validity from the perspective of students&#x2019; interpretation and cognition of the task scenarios. Interview results indicated that all students accurately understood the scientific content and task requirements of the three scenarios, with no misinterpretation or ambiguity regarding the instructions. During the problem identification stage, students&#x2019; thinking primarily revolved around the potential mechanisms underlying the observed phenomena. In the hypothesis construction and experimental verification stages, students were able to reason based on their existing scientific knowledge, and their thinking pathways were largely consistent with the three-stage theoretical model. Taken together, these findings suggest that the instrument possesses strong face validity as perceived by the target population. Additionally, 98% of students completed all three scenarios within 45&#x202F;min, indicating that the time allocation for the test was reasonable.</p>
<p>Item analysis indicated the items demonstrated sufficient variability (standard deviations ranging from 0.89 to 1.21), and all item-total correlations reached moderate to high levels (<italic>r</italic>&#x202F;=&#x202F;0.42&#x2013;0.68), suggesting good item discrimination.</p>
</sec>
<sec id="sec14">
<label>4.3.2.2</label>
<title>Content validity</title>
<p>To examine the scale&#x2019;s content validity, four experts (two university professors of science education and two experienced secondary school science teachers) were invited to evaluate it, employing a combination of quantitative and qualitative methods.</p>
<p>For the quantitative assessment, experts used a 5-point Likert scale (1&#x202F;=&#x202F;&#x201C;Very inadequate&#x201D;&#x202F;~&#x202F;5&#x202F;=&#x202F;&#x201C;Very adequate&#x201D;) to rate scenario appropriateness (i.e., whether the three scenarios could effectively measure SCT) and task structure validity (i.e., whether the three-tiered &#x201C;Problem Identification&#x2014;Hypothesis Construction&#x2014;Experimental Verification&#x201D; structure accurately reflected the target construct). All dimension scores averaged above 4.0, indicating experts deemed the scale to have good content representativeness.</p>
<p>Fleiss&#x2019; Kappa coefficient was further used to assess inter-expert rating consistency. Following the criteria proposed by <xref ref-type="bibr" rid="ref47">Zuehlke et al. (2009)</xref>, the Fleiss&#x2019; Kappa coefficient in this study was 0.798, falling within the 0.6&#x2013;0.8 range, indicating a high level of agreement among experts (see <xref ref-type="table" rid="tab1">Table 1</xref>).</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Fleiss&#x2019; kappa test results for expert ratings.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Fleiss&#x2019; <italic>&#x03BA;</italic></th>
<th align="center" valign="top"><italic>SE</italic></th>
<th align="center" valign="top"><italic>z</italic></th>
<th align="center" valign="top"><italic>p</italic></th>
<th align="center" valign="top">95% <italic>CI</italic></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">0.798</td>
<td align="char" valign="middle" char=".">0.17</td>
<td align="char" valign="middle" char=".">4.79</td>
<td align="char" valign="middle" char=".">&#x003C; 0.001</td>
<td align="center" valign="middle">[0.74, 0.85]</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The qualitative assessment involved collecting experts&#x2019; specific suggestions for improving the clarity of item descriptions and structural rationality through open-ended questions, providing crucial guidance for subsequent revision.</p>
</sec>
<sec id="sec15">
<label>4.3.2.3</label>
<title>Inter-rater reliability check</title>
<p>To examine the operability of the scoring criteria, two trained raters (both with backgrounds in science education) independently scored 30 pilot responses. Results showed intraclass correlation coefficients (ICCs) of 0.87 for the Problem Identification dimension, 0.83 for Hypothesis Construction, and 0.85 for Experimental Verification. This indicates the scoring criteria were clear and feasible, with good inter-rater reliability.</p>
</sec>
<sec id="sec16">
<label>4.3.2.4</label>
<title>Scale revision</title>
<p>Integrating feedback from student pilot testing and optimization suggestions from expert review, the initial scale was revised. Revisions primarily focused on optimizing the instructions and item descriptions, and the scoring guide was updated accordingly, culminating in the final SCTS (<xref ref-type="supplementary-material" rid="SM1">Supplementary Appendix 1</xref>) and its revised scoring rubric (see <xref ref-type="table" rid="tab2">Table 2</xref>).</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Scoring rubric for the scientific creative thinking scale (revised version).</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Task</th>
<th align="center" valign="top">Score</th>
<th align="left" valign="top">Behavioral description</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top" rowspan="4">Problem identification</td>
<td align="center" valign="top">3</td>
<td align="left" valign="top">Proposes &#x2265;2 unique questions demonstrating research value.</td>
</tr>
<tr>
<td align="center" valign="top">2</td>
<td align="left" valign="top">Proposes 1 unique question demonstrating research value.</td>
</tr>
<tr>
<td align="center" valign="top">1</td>
<td align="left" valign="top">Proposes a question with either uniqueness or research value (but not both).</td>
</tr>
<tr>
<td align="center" valign="top">0</td>
<td align="left" valign="top">Questions lack both uniqueness and research value.</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="4">Hypothesis construction</td>
<td align="center" valign="top">3</td>
<td align="left" valign="top">Generates &#x2265;2 substantive hypotheses that are empirically testable.</td>
</tr>
<tr>
<td align="center" valign="top">2</td>
<td align="left" valign="top">Generates 1 substantive hypothesis that is empirically testable.</td>
</tr>
<tr>
<td align="center" valign="top">1</td>
<td align="left" valign="top">Hypothesis is either substantive or testable (but not both).</td>
</tr>
<tr>
<td align="center" valign="top">0</td>
<td align="left" valign="top">Hypotheses are neither substantive nor testable.</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="4">Experimental verification</td>
<td align="center" valign="top">3</td>
<td align="left" valign="top">Designs &#x2265;2 elaborate and valid verification plans.</td>
</tr>
<tr>
<td align="center" valign="top">2</td>
<td align="left" valign="top">Designs 1 elaborate and valid verification plan.</td>
</tr>
<tr>
<td align="center" valign="top">1</td>
<td align="left" valign="top">Plan is valid but not elaborate, or elaborate but invalid.</td>
</tr>
<tr>
<td align="center" valign="top">0</td>
<td align="left" valign="top">Plans are neither valid nor elaborate.</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Operational definitions: (1) Unique questions are those generated by fewer than 10% of participants. (2) Valuable questions exhibit thoughtfulness or criticality and are amenable to further investigation. (3) Essential hypotheses address the core mechanism of the problem, independent of their factual correctness. (4) Testable hypotheses are those verifiable through specific empirical procedures. (5) Valid plans are designs capable of logically and rigorously testing the target hypothesis. (6) Elaborated plans are specific and operable, featuring clear steps, controlled variables, and concrete procedures.</p>
</table-wrap-foot>
</table-wrap>
</sec>
</sec>
</sec>
<sec id="sec17">
<label>4.4</label>
<title>Formal testing</title>
<sec id="sec18">
<label>4.4.1</label>
<title>Formal sample and procedure</title>
<p>This study employed a two-stage sampling design to conduct exploratory factor analysis (EFA) and confirmatory factor analysis (CFA) of the scale, respectively. The EFA sample consisted of tenth-grade students recruited from three provinces in China: Zhejiang (eastern China), Shandong (northern China), and Jilin (northeastern China). A total of 189 scales were distributed, with 186 returned. After excluding four invalid responses, the final valid sample comprised 182 participants (valid response rate: 96%). Participants&#x2019; ages ranged from 16 to 17&#x202F;years, including 94 females (51.6%) and 88 males (48.4%). The CFA sample was recruited separately from the same grade level (tenth grade) in Shandong Province. A total of 230 students participated, yielding 219 valid questionnaires (valid response rate: 95%). The age distribution of this sample was consistent with the EFA sample (16&#x2013;17&#x202F;years), comprising 112 females (51.1%) and 107 males (48.9%).</p>
<p>The scale was administered in a paper-and-pencil format in group settings to avoid systematic biases potentially associated with online surveys (<xref ref-type="bibr" rid="ref44">Wright, 2005</xref>). The administration was conducted during regular class hours with permission from the schools and relevant teachers. Classroom science teachers or homeroom teachers supervised the sessions to ensure a consistent testing environment. Each student independently completed the scale, which contained three scenario-based tasks. The time allotted for each task was 15&#x202F;min, resulting in a total completion time of 45&#x202F;min. To mitigate social desirability bias, students were explicitly informed that there were no &#x201C;correct answers&#x201D; for the tasks, that all responses would be kept strictly confidential and used solely for academic research purposes, and that their individual answers would not be disclosed. Although class identifiers were included for administrative purposes, students were encouraged to respond based on their genuine thoughts and to work independently.</p>
</sec>
<sec id="sec19">
<label>4.4.2</label>
<title>Scoring procedure</title>
<p>To ensure scoring consistency, the two raters received systematic training on the revised scoring guide prior to formal scoring. Subsequently, 30 responses (approximately 16% of the sample) were randomly selected for independent pilot scoring. Following this, a consensus meeting was held, focusing specifically on responses where scoring discrepancies were &#x2265;1 point. Raters articulated their reasoning for their scores, and consensus was reached through discussion, interpretation, and clarification of the scoring criteria. This iterative &#x201C;independent pilot scoring&#x2013;consensus meeting&#x201D; process was repeated, each time using a new random sample of no fewer than 20 responses, until the intraclass correlation coefficient [ICC(2,1)] calculated for two consecutive iterations was &#x2265;0.70, indicating an acceptable level of inter-rater agreement had been achieved. Subsequently, the raters independently performed the formal scoring for all 401 valid responses based on the finalized scoring rules. To illustrate the scoring criteria and enhance transparency, Appendix 2 presents annotated response exemplars for the Apple Discoloration scenario, including verbatim student responses and the rationale for each assigned score.</p>
</sec>
<sec id="sec20">
<label>4.4.3</label>
<title>Data analysis</title>
<p>To comprehensively evaluate the psychometric properties of the scale, data analyses were conducted from the perspectives of reliability and validity. Reliability analyses included: assessing the internal consistency of the total scale and each scenario-specific subscale using Cronbach&#x2019;s <italic>&#x03B1;</italic> coefficient and McDonald&#x2019;s <italic>&#x03C9;</italic> coefficient; and evaluating the scoring consistency of two raters across the three core dimensions using the intraclass correlation coefficient (ICC). Validity analyses included: examining the underlying factor structure of the scale through Exploratory Factor Analysis (EFA)&#x2014;employing Principal Axis Factoring (PAF) for factor extraction, utilizing Promax oblique rotation, and supplementing with parallel analysis to determine the number of factors to retain; further testing the robustness and model fit of this structure using Confirmatory Factor Analysis (CFA) with an independent sample; and examining criterion-related validity by analyzing Spearman&#x2019;s rank correlations between the total scale score, scenario-specific scores, and students&#x2019; science academic achievement. Data analyses were conducted using SPSS 25.0 and AMOS 26.0 software.</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="sec21">
<label>5</label>
<title>Results</title>
<sec id="sec22">
<label>5.1</label>
<title>Descriptive statistics and item quality</title>
<p>Descriptive statistical analyses were conducted on the test data. Each item was scored on a 4-point scale ranging from 0 to 3, yielding a theoretical total score range of 0&#x2013;27 for the SCTS. In the present sample, students&#x2019; actual scores ranged from 3 to 25, with a mean score of 13.45 (SD&#x202F;=&#x202F;5.38), and the score distribution approximated normality. Item means ranged from 1.19 to 2.09 (out of a maximum of 3), with standard deviations ranging from 0.87 to 1.20. The proportions of participants scoring the minimum (0) or maximum (3) on any item were both below 10%, indicating no significant floor or ceiling effects and suggesting that the items possess good discriminatory power.</p>
</sec>
<sec id="sec23">
<label>5.2</label>
<title>Reliability</title>
<sec id="sec24">
<label>5.2.1</label>
<title>Internal consistency reliability</title>
<p>The SCTS demonstrated good internal consistency overall (Cronbach&#x2019;s <italic>&#x03B1;</italic>&#x202F;=&#x202F;0.87; McDonald&#x2019;s <italic>&#x03C9;</italic>&#x202F;=&#x202F;0.89). In the Cronbach&#x2019;s &#x03B1; analysis, item-total correlation coefficients for all items ranged from 0.42 to 0.68, indicating that each item effectively reflected the measurement objectives of the total scale. To verify the consistency of measurement across different scenario-based tasks, we calculated the reliability of the scenario-specific subscales using both Cronbach&#x2019;s &#x03B1; and McDonald&#x2019;s &#x03C9; coefficients. As shown in <xref ref-type="table" rid="tab3">Table 3</xref>, the &#x03B1; coefficients for the three scenario subscales ranged from 0.75 to 0.82, and the &#x03C9; coefficients ranged from 0.76 to 0.85, all exceeding the acceptable threshold of 0.70. These results indicate that the scale possesses good internal consistency reliability.</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Reliability of scenario-specific subscales.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Scenario</th>
<th align="center" valign="top">&#x03B1;</th>
<th align="center" valign="top">&#x03C9;</th>
<th align="center" valign="top">Items</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Candle combustion</td>
<td align="char" valign="middle" char=".">0.75</td>
<td align="char" valign="middle" char=".">0.77</td>
<td align="center" valign="middle">3</td>
</tr>
<tr>
<td align="left" valign="middle">Apple discoloration</td>
<td align="char" valign="middle" char=".">0.82</td>
<td align="char" valign="middle" char=".">0.85</td>
<td align="center" valign="middle">3</td>
</tr>
<tr>
<td align="left" valign="middle">Steamed bun fermentation</td>
<td align="char" valign="middle" char=".">0.75</td>
<td align="char" valign="middle" char=".">0.76</td>
<td align="center" valign="middle">3</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>&#x03B1;, Cronbach&#x2019;s alpha coefficient; &#x03C9;, McDonald&#x2019;s omega coefficient.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec25">
<label>5.2.2</label>
<title>Inter-rater reliability</title>
<p>The intraclass correlation coefficient ICC (2,1) under a two-way random-effects model was calculated to assess inter-rater reliability. As shown in <xref ref-type="table" rid="tab4">Table 4</xref>, the ICC values for the three dimensions ranged from 0.95 to 0.97, all exceeding the &#x201C;good&#x201D; threshold of 0.75 (<xref ref-type="bibr" rid="ref12">Cicchetti, 1994</xref>), indicating excellent inter-rater agreement and that the scoring criteria were clear and reliably implemented.</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Intraclass correlations for inter-rater reliability by dimension.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Dimension</th>
<th align="center" valign="top"><italic>ICC</italic></th>
<th align="center" valign="top">95% <italic>CI</italic></th>
<th align="center" valign="top"><italic>p</italic></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Problem identification</td>
<td align="char" valign="middle" char=".">0.95</td>
<td align="center" valign="middle">[0.91, 0.97]</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Hypothesis construction</td>
<td align="char" valign="middle" char=".">0.95</td>
<td align="center" valign="middle">[0.93, 0.97]</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Experimental verification</td>
<td align="char" valign="middle" char=".">0.97</td>
<td align="center" valign="middle">[0.95, 0.98]</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>ICC, intraclass correlation coefficient; Model: absolute-agreement, two-way random-effects (ICC[2,1]).</p>
</table-wrap-foot>
</table-wrap>
</sec>
</sec>
<sec id="sec26">
<label>5.3</label>
<title>Validity</title>
<sec id="sec27">
<label>5.3.1</label>
<title>Construct validity</title>
<p>Exploratory Factor Analysis (EFA). Exploratory factor analysis was conducted using the first subsample (<italic>n</italic>&#x202F;=&#x202F;182). The suitability of the data for factor analysis was examined, yielding a Kaiser-Meyer-Olkin (KMO) measure of sampling adequacy of 0.796 and a significant Bartlett&#x2019;s test of sphericity (&#x03C7;<sup>2</sup>&#x202F;=&#x202F;1095.26, df&#x202F;=&#x202F;36, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.001), indicating that the data were appropriate for factor analysis. Principal Axis Factoring (PAF) was employed for factor extraction. Given the theoretical expectation of associations among the three dimensions, Promax oblique rotation was used to allow for correlations among factors (<xref ref-type="bibr" rid="ref9001">Montag and Walla, 2016</xref>). To determine the number of factors to retain, multiple criteria were employed. The Kaiser-Guttman criterion indicated that the first three factors had eigenvalues greater than 1.0; the scree plot revealed a distinct inflection point after the third factor, after which the trend leveled off; additionally, Parallel Analysis was conducted as a more robust standard (<xref ref-type="bibr" rid="ref9002">Hayton et al., 2004</xref>). Based on 1,000 randomly generated datasets, the observed eigenvalues were compared against the 95th percentile eigenvalues from the random data. The results showed that the eigenvalues for the first three factors exceeded their corresponding random counterparts, while the eigenvalue for the fourth factor fell below the random criterion, thus providing stable support for a three-factor structure. The three extracted factors cumulatively accounted for 70.189% of the total variance (see <xref ref-type="table" rid="tab5">Table 5</xref>).</p>
<table-wrap position="float" id="tab5">
<label>Table 5</label>
<caption>
<p>Total variance explained by principal axis factoring.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Factor</th>
<th align="center" valign="top" colspan="3">Initial eigenvalues</th>
<th align="center" valign="top" colspan="3">Extraction sums of squared loadings</th>
<th align="center" valign="top">Rotation sums of squared loadings</th>
</tr>
<tr>
<th align="center" valign="top">Total</th>
<th align="center" valign="top">% of variance</th>
<th align="center" valign="top">Cumulative %</th>
<th align="center" valign="top">Total</th>
<th align="center" valign="top">% of variance</th>
<th align="center" valign="top">Cumulative %</th>
<th align="center" valign="top">Total</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">1</td>
<td align="char" valign="middle" char=".">3.920</td>
<td align="char" valign="middle" char=".">43.556</td>
<td align="char" valign="middle" char=".">43.556</td>
<td align="char" valign="middle" char=".">3.124</td>
<td align="char" valign="middle" char=".">34.711</td>
<td align="char" valign="middle" char=".">34.711</td>
<td align="char" valign="middle" char=".">2.735</td>
</tr>
<tr>
<td align="left" valign="middle">2</td>
<td align="char" valign="middle" char=".">1.315</td>
<td align="char" valign="middle" char=".">14.611</td>
<td align="char" valign="middle" char=".">58.167</td>
<td align="char" valign="middle" char=".">1.874</td>
<td align="char" valign="middle" char=".">20.822</td>
<td align="char" valign="middle" char=".">55.533</td>
<td align="char" valign="middle" char=".">2.388</td>
</tr>
<tr>
<td align="left" valign="middle">3</td>
<td align="char" valign="middle" char=".">1.082</td>
<td align="char" valign="middle" char=".">12.022</td>
<td align="char" valign="middle" char=".">70.189</td>
<td align="char" valign="middle" char=".">1.319</td>
<td align="char" valign="middle" char=".">14.656</td>
<td align="char" valign="middle" char=".">70.189</td>
<td align="char" valign="middle" char=".">1.194</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Extraction Method: Principal Axis Factoring. Rotation Method: Promax with Kaiser Normalization. Parallel analysis (1,000 iterations, 95th percentile) confirmed the retention of three factors. Rotation converged in 5 iterations.</p>
</table-wrap-foot>
</table-wrap>
<p>The rotated factor pattern matrix (see <xref ref-type="table" rid="tab6">Table 6</xref>) revealed that all nine items demonstrated factor loadings above 0.78 on their corresponding primary factors, with no significant cross-loadings, indicating a clear factor structure. The three factors corresponded, respectively, to the theoretical model&#x2019;s dimensions: &#x201C;Problem Identification&#x201D; (Items 1, 4, and 7), &#x201C;Hypothesis Construction&#x201D; (Items 2, 5, and 8), and &#x201C;Experimental Verification&#x201D; (Items 3, 6, and 9).</p>
<table-wrap position="float" id="tab6">
<label>Table 6</label>
<caption>
<p>Rotated factor pattern matrix from Promax rotation.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Item</th>
<th align="center" valign="top">Factor 1</th>
<th align="center" valign="top">Factor 2</th>
<th align="center" valign="top">Factor 3</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Q1</td>
<td align="char" valign="top" char=".">0.898</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Q4</td>
<td align="char" valign="top" char=".">0.847</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Q7</td>
<td align="char" valign="top" char=".">0.885</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Q2</td>
<td/>
<td align="char" valign="top" char=".">0.807</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Q5</td>
<td/>
<td align="char" valign="top" char=".">0.812</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Q8</td>
<td/>
<td align="char" valign="top" char=".">0.785</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Q3</td>
<td/>
<td/>
<td align="char" valign="top" char=".">0.915</td>
</tr>
<tr>
<td align="left" valign="middle">Q6</td>
<td/>
<td/>
<td align="char" valign="top" char=".">0.906</td>
</tr>
<tr>
<td align="left" valign="middle">Q9</td>
<td/>
<td/>
<td align="char" valign="top" char=".">0.887</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Extraction Method: Principal Axis Factoring. Rotation Method: Promax with Kaiser Normalization.</p>
</table-wrap-foot>
</table-wrap>
<p>The correlations among factors ranged from 0.462 to 0.523 (see <xref ref-type="table" rid="tab7">Table 7</xref>), indicating moderate to strong positive relationships among the three factors. These intercorrelations support the use of oblique rotation and suggest that, while the dimensions are empirically distinct, they represent related aspects of a broader construct (<xref ref-type="bibr" rid="ref26">Mostafa et al., 2025</xref>). The strongest correlation was observed between Problem Identification and Hypothesis Construction (<italic>r</italic>&#x202F;=&#x202F;0.523), suggesting that these two dimensions may be mutually reinforcing. Experimental Verification showed slightly lower correlations with the other two factors (r ranging from 0.462 to 0.487), indicating a greater degree of distinctiveness for this dimension.</p>
<table-wrap position="float" id="tab7">
<label>Table 7</label>
<caption>
<p>Factor correlation matrix from Promax rotation.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Factor</th>
<th align="center" valign="top">Problem identification</th>
<th align="center" valign="top">Hypothesis construction</th>
<th align="center" valign="top">Experimental verification</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Problem identification</td>
<td align="center" valign="middle">1</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Hypothesis construction</td>
<td align="center" valign="middle">0.523&#x002A;&#x002A;</td>
<td align="center" valign="middle">1</td>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Experimental verification</td>
<td align="center" valign="middle">0.487&#x002A;&#x002A;</td>
<td align="center" valign="middle">0.462&#x002A;&#x002A;</td>
<td align="center" valign="middle">1</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>&#x002A;&#x002A;<italic>p</italic>&#x202F;&#x003C;&#x202F;0.01.</p>
</table-wrap-foot>
</table-wrap>
<p>Confirmatory Factor Analysis (CFA). Confirmatory factor analysis was conducted using the second independent subsample (<italic>n</italic>&#x202F;=&#x202F;219). Based on the theoretical framework, the nine observed indicators (Q1&#x2013;Q9) were specified to load onto three latent variables: Problem Identification, Hypothesis Construction, and Experimental Verification. The model fit results are presented in <xref ref-type="table" rid="tab8">Table 8</xref>. The goodness-of-fit indices indicated that the three-factor model fit the data well: &#x03C7;<sup>2</sup>/df&#x202F;=&#x202F;3.009, which is below the recommended threshold of 5; CFI&#x202F;=&#x202F;0.948 and TLI&#x202F;=&#x202F;0.922, both exceeding the 0.90 criterion; RMSEA&#x202F;=&#x202F;0.076, falling below the acceptable level of 0.08; and SRMR&#x202F;=&#x202F;0.032, well below the 0.80 threshold. All fit indices met acceptable standards, demonstrating that the three-factor model exhibited good fit with the data.</p>
<table-wrap position="float" id="tab8">
<label>Table 8</label>
<caption>
<p>Fit indices for the CFA.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Fit indices</th>
<th align="center" valign="top">&#x03C7;<sup>2</sup></th>
<th align="center" valign="top">df</th>
<th align="center" valign="top">&#x03C7;<sup>2</sup>/df</th>
<th align="center" valign="top">GFI</th>
<th align="center" valign="top">AGFI</th>
<th align="center" valign="top">CFI</th>
<th align="center" valign="top">TLI</th>
<th align="center" valign="top">RMSEA</th>
<th align="center" valign="top">SRMR</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Value</td>
<td align="char" valign="middle" char=".">72.227</td>
<td align="center" valign="middle">24</td>
<td align="center" valign="middle">3.009</td>
<td align="char" valign="middle" char=".">0.910</td>
<td align="char" valign="middle" char=".">0.832</td>
<td align="char" valign="middle" char=".">0.948</td>
<td align="char" valign="middle" char=".">0.922</td>
<td align="center" valign="middle">0.076</td>
<td align="char" valign="middle" char=".">0.032</td>
</tr>
<tr>
<td align="left" valign="middle">Criteria of fit indices</td>
<td/>
<td/>
<td align="center" valign="middle">&#x003C;3 is excellent; 3&#x2013;5 is good</td>
<td align="char" valign="middle" char=".">&#x003E;0.90</td>
<td align="char" valign="middle" char=".">&#x003E;0.90</td>
<td align="char" valign="middle" char=".">&#x003E;0.90</td>
<td align="char" valign="middle" char=".">&#x003E;0.90</td>
<td align="center" valign="middle">&#x003C;0.05 is excellent; 0.05&#x2013;0.08 is acceptable</td>
<td align="char" valign="middle" char=".">&#x003C;0.05</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec28">
<label>5.3.2</label>
<title>Convergent validity and discriminant validity</title>
<p>Composite reliability (CR) and average variance extracted (AVE) were calculated based on factor loadings. The results showed that CR values for all dimensions exceeded the recommended threshold of 0.70 (<xref ref-type="bibr" rid="ref31">Raykov, 1997</xref>): Problem Identification CR&#x202F;=&#x202F;0.9035, Hypothesis Construction CR&#x202F;=&#x202F;0.8622, Experimental Verification CR&#x202F;=&#x202F;0.8605. AVE values all exceeded the 0.50 threshold (<xref ref-type="bibr" rid="ref28">Nunnally and Bernstein, 1994</xref>): Problem Identification AVE&#x202F;=&#x202F;0.7575, Hypothesis Construction AVE&#x202F;=&#x202F;0.6776, Experimental Verification AVE&#x202F;=&#x202F;0.673. These results indicate that the scale possesses good convergent validity.</p>
<p>Discriminant validity concerns the extent to which items measuring different constructs are relatively uncorrelated (<xref ref-type="bibr" rid="ref18">Hu and Bi, 2025</xref>). The square root of AVE for each factor (Problem Identification &#x221A;0.7575&#x202F;=&#x202F;0.870; Hypothesis Construction &#x221A;0.6776&#x202F;=&#x202F;0.823; Experimental Verification &#x221A;0.673&#x202F;=&#x202F;0.820) exceeded its correlations with the other factors, satisfying the Fornell-Larcker criterion. This indicates that the scale demonstrates good discriminant validity.</p>
</sec>
<sec id="sec29">
<label>5.3.3</label>
<title>Criterion validity</title>
<p>Students&#x2019; science academic achievement was employed as an external criterion to examine its Spearman&#x2019;s rank correlation with the total SCTS score. Given that the three task scenarios in the scale were all grounded in chemical principles, students&#x2019; scores on a standardized school-administered chemistry examination from the most recent end-of-semester assessment were selected as the criterion measure. This examination was conducted approximately 4 weeks prior to the SCTS administration and was not specifically designed for this study. The tests were developed by experienced chemistry teachers and reviewed by subject matter experts. To account for differences in examination difficulty across schools, raw scores were converted to within-school z-scores, thereby rendering all students&#x2019; scores comparable on a common scale. As shown in <xref ref-type="table" rid="tab9">Table 9</xref>, the total scale score demonstrated a significant positive correlation with the transformed achievement scores (<italic>&#x03C1;</italic>&#x202F;=&#x202F;0.55, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.001). Scores on each scenario-specific subscale also showed significant, moderate positive correlations with achievement scores (&#x03C1; ranging from 0.50 to 0.57, all <italic>p</italic>&#x202F;&#x003C;&#x202F;0.001), providing preliminary evidence for the criterion-related validity of the scale.</p>
<table-wrap position="float" id="tab9">
<label>Table 9</label>
<caption>
<p>Correlation between academic achievement and scientific creative thinking performance.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Measure</th>
<th align="center" valign="top">&#x03C1;</th>
<th align="center" valign="top"><italic>p</italic></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Candle combustion</td>
<td align="char" valign="middle" char=".">0.50</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Apple discoloration</td>
<td align="char" valign="middle" char=".">0.57</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Steamed bun fermentation</td>
<td align="char" valign="middle" char=".">0.55</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Total scale</td>
<td align="char" valign="middle" char=".">0.55</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Spearman&#x2019;s &#x03C1; reported. All <italic>p</italic>-values are two-tailed.</p>
</table-wrap-foot>
</table-wrap>
</sec>
</sec>
</sec>
<sec id="sec30">
<label>6</label>
<title>Discussion, limitations, and future directions</title>
<p>Guided by a three-stage cognitive model and integrating explicit and implicit assessment approaches, this study developed and initially validated the SCTS. The scale operationalizes SCT as a sequential process involving problem identification, hypothesis construction, and experimental verification. Empirical evidence indicates that the SCTS possesses sound psychometric properties, offering a novel assessment pathway and an empirical foundation for understanding the cognitive architecture of scientific creativity.</p>
<p>In terms of reliability, the SCTS demonstrated excellent properties. The internal consistency reliability of the total scale was good (<italic>&#x03B1;</italic>&#x202F;=&#x202F;0.87, <italic>&#x03C9;</italic>&#x202F;=&#x202F;0.89), and the reliabilities of each scenario-specific subscale also reached acceptable levels (&#x03B1;&#x202F;=&#x202F;0.75&#x2013;0.82, &#x03C9;&#x202F;=&#x202F;0.76&#x2013;0.85). These results indicate that the items reliably measure the latent construct of &#x201C;scientific creative thinking.&#x201D; Crucially, through systematic rater training and consensus-building procedures, exceptionally high inter-rater agreement was achieved for all three core cognitive dimensions (ICC&#x202F;&#x2265;&#x202F;0.95). This outcome holds significant methodological importance: it suggests that by designing domain-specific, structured tasks combined with a standardized implicit judgment process, the objectivity and reliability of subjective scoring for complex cognitive constructs can be effectively enhanced. This addresses the longstanding challenges faced by traditional divergent thinking tests regarding predictive and ecological validity (<xref ref-type="bibr" rid="ref46">Zeng et al., 2011</xref>). This study also provides a reference model for measuring domain-embedded higher-order thinking skills, one that balances ecological validity with psychometric rigor.</p>
<p>Regarding construct validity, exploratory factor analysis employing Principal Axis Factoring (PAF) with Promax oblique rotation, supplemented by parallel analysis to determine the number of factors to retain, robustly supported a three-factor structure, accounting for 70.189% of the total variance. All items demonstrated factor loadings exceeding 0.78 on their corresponding factors, indicating a clear factor structure that aligned precisely with the theoretical framework. Confirmatory factor analysis conducted with an independent sample further confirmed the adequate fit of the three-factor model (CFI&#x202F;=&#x202F;0.948, TLI&#x202F;=&#x202F;0.922, RMSEA&#x202F;=&#x202F;0.076, SRMR&#x202F;=&#x202F;0.032). Inter-factor correlations ranged from 0.46 to 0.52, reflecting moderate associations and indicating that the SCTS successfully operationalizes SCT as a multidimensional structure comprising interrelated yet distinct dimensions. These findings provide empirical support for the cognitive theory that conceptualizes scientific discovery as a systematic search across hypothesis and experiment spaces (<xref ref-type="bibr" rid="ref22">Klahr and Dunbar, 1988</xref>), thereby offering psychometric evidence for the perspective that scientific creativity represents a domain-specific, structured cognitive process.</p>
<p>Regarding convergent and discriminant validity, the composite reliability (CR) for each dimension exceeded 0.86, and the average variance extracted (AVE) for each dimension exceeded 0.67, indicating that the scale possesses good convergent validity. The square root of the AVE for each factor (ranging from 0.82 to 0.87) was greater than its correlations with the other factors, satisfying the Fornell-Larcker criterion and further confirming the discriminant validity of the scale.</p>
<p>For criterion-related validity, the total SCTS score showed a moderate positive correlation with students&#x2019; academic achievement in science. This aligns with the theoretical expectation that domain knowledge provides a foundation for creative thinking (<xref ref-type="bibr" rid="ref4">Anwar and Aness, 2012</xref>), offering preliminary evidence for the scale&#x2019;s criterion validity.</p>
<p>It should be noted that the assessment in this study was conducted sequentially across the three stages of problem identification, hypothesis construction, and experimental verification, and that students&#x2019; performance may exhibit systematic differences across these stages. This variability does not represent measurement error but rather reflects the stage-specific characteristics of the SCT process. The cognitive tasks at each stage differ in nature: problem identification emphasizes observation and questioning, hypothesis construction relies on association and reasoning, and experimental verification stresses logical and operational design. Individuals possess different strengths across these cognitive components, reflecting the heterogeneous structure of scientific creativity (<xref ref-type="bibr" rid="ref17">Hu and Adey, 2002</xref>). Furthermore, the degree of openness and difficulty varies across stages; the problem identification stage imposes a higher cognitive load, whereas the hypothesis and verification stages involve relatively more structured tasks (<xref ref-type="bibr" rid="ref23">Lin and Lien, 2013</xref>). Therefore, this study treats the scores from the three stages as independent indicators reflecting distinct sub-constructs and does not advocate for simple summation or cross-stage comparisons. Future research could employ cognitive interviewing, eye-tracking, or other methods to further investigate differences in cognitive strategies across stages, or conduct task difficulty equalization to more precisely differentiate stage effects from individual differences.</p>
<p>The core theoretical contribution of this study lies in proposing an integrative assessment framework. The SCTS is not merely a transplantation of general creativity indicators into the science domain. Instead, it attempts a deep integration of explicit indicators of cognitive products with implicit judgments of domain appropriateness. Traditional divergent thinking tests primarily assess the novelty of products (e.g., fluency, originality), while the assessment of &#x201C;appropriateness&#x201D; or &#x201C;effectiveness&#x201D; is often superficial. Building on Sternberg&#x2019;s implicit theory, this study recognizes that judgments of &#x201C;appropriateness&#x201D; in scientific creation are highly dependent on internalized domain norms. Therefore, it adopted and refined the Consensual Assessment Technique, allowing raters to provide comprehensive judgments on aspects like &#x201C;research value,&#x201D; &#x201C;essence,&#x201D; and &#x201C;effectiveness&#x201D; based on their implicit professional consensus. This methodological integration enables the SCTS to capture both the novelty and appropriateness dimensions of creativity simultaneously, offering conceptual and methodological reference for measuring domain-specific creativity that requires balancing &#x201C;breakthrough&#x201D; with &#x201C;compliance.&#x201D; Furthermore, by anchoring abstract scientific creativity in the specific cognitive sequence of &#x201C;problem identification&#x2014;hypothesis construction&#x2014;experimental verification,&#x201D; it provides an operational, testable theoretical model, facilitating future empirical research on related cognitive mechanisms.</p>
<p>Several limitations of this study should be acknowledged. First, the sample was limited to Chinese secondary school students; thus, the cross-cultural and cross-age generalizability of the findings requires further validation. Second, while the study examined internal consistency and inter-rater reliability, evidence for cross-time stability (test&#x2013;retest reliability) was not assessed. Third, due to sample size constraints and the lack of sufficiently large and balanced subgroups, we were unable to test for measurement invariance across key demographic groups such as gender and school type. This limits our ability to confirm that the SCTS measures the same constructs in the same way across these populations. Fourth, although the significant correlation between SCTS scores and science academic achievement (<italic>&#x03C1;</italic>&#x202F;=&#x202F;0.55) provides preliminary evidence for criterion-related validity, this finding should be interpreted with caution, as prior academic achievement and cognitive ability were not controlled for as potential confounding variables. Fifth, while the three task scenarios were designed to approximate real-life situations, they may still carry certain cultural specificities (e.g., the steamed bun fermentation scenario may be less familiar in some cultural contexts).</p>
<p>Future research should address these limitations in several ways. First, the psychometric properties of the SCTS should be further examined in more diverse and representative samples, employing longitudinal designs to assess cross-time stability and utilizing stratified sampling to conduct multi-group confirmatory factor analyses for testing measurement invariance. Second, future studies should include control variables such as prior academic achievement and cognitive ability to examine the incremental validity of the SCTS. Additionally, developing more culturally adaptable scenario banks or tasks targeting different scientific sub-domains, along with employing multiple criterion measures and multi-method approaches, will help to further enrich the validity evidence for the scale.</p>
<p>Looking ahead, the SCTS can serve as a foundational tool for exploring a range of deeper questions. For example, employing cognitive neuroscience methods to investigate the brain activity patterns corresponding to the three thinking stages and their dynamic interactions; examining the relationships between SCT and classic personality/cognitive variables such as openness, need for cognition, and executive functions; or using longitudinal studies to track its developmental trajectory and key influencing factors. Such work will not only deepen the understanding of SCT itself but also help integrate it more systematically into the broader landscape of individual differences and cognitive psychology.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec31">
<title>Data availability statement</title>
<p>The datasets presented in this article are not readily available because the datasets generated and analyzed during the current study are not publicly available due to ethical and privacy restrictions. The primary data consist of written, open-ended responses from minor participants (secondary school students). Furthermore, the informed consent obtained from participants and their guardians did not include authorization for public data deposition. De-identified, aggregated data that underpin the findings reported in this manuscript are available from the corresponding author (Prof. Hualin Bi) upon reasonable request. Requests to access the datasets should be directed to Hualin Bi, <email xlink:href="mailto:bihualin@sdnu.edu.cn">bihualin@sdnu.edu.cn</email>.</p>
</sec>
<sec sec-type="ethics-statement" id="sec32">
<title>Ethics statement</title>
<p>The studies involving humans were approved by the Institutional Review Board of Shandong Normal University. The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation in this study was provided by the participants&#x2019; legal guardians/next of kin.</p>
</sec>
<sec sec-type="author-contributions" id="sec33">
<title>Author contributions</title>
<p>HL: Conceptualization, Data curation, Investigation, Methodology, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. SM: Formal analysis, Validation, Writing &#x2013; review &#x0026; editing. HB: Funding acquisition, Project administration, Resources, Supervision, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="COI-statement" id="sec34">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec35">
<title>Generative AI statement</title>
<p>The author(s) declared that Generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec36">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec37">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fpsyg.2026.1762573/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fpsyg.2026.1762573/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Supplementary_file_1.pdf" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Supplementary_file_2.pdf" id="SM2" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Alexander</surname><given-names>P. A.</given-names></name></person-group> (<year>1992</year>). <article-title>Domain knowledge: evolving themes and emerging concerns</article-title>. <source>Educ. Psychol.</source> <volume>27</volume>, <fpage>33</fpage>&#x2013;<lpage>51</lpage>. doi: <pub-id pub-id-type="doi">10.1207/s15326985ep2701_4</pub-id></mixed-citation></ref>
<ref id="ref2"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Amabile</surname><given-names>T. M.</given-names></name></person-group> (<year>1982</year>). <article-title>Social psychology of creativity: a consensual assessment technique</article-title>. <source>J. Pers. Soc. Psychol.</source> <volume>43</volume>, <fpage>997</fpage>&#x2013;<lpage>1013</lpage>. doi: <pub-id pub-id-type="doi">10.1037/0022-3514.43.5.997</pub-id></mixed-citation></ref>
<ref id="ref4"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Anwar</surname><given-names>M. N.</given-names></name> <name><surname>Aness</surname><given-names>M.</given-names></name></person-group> (<year>2012</year>). <article-title>An examination of the relationship between creative thinking and academic achievements of secondary school students</article-title>. <source>Int. Interdiscip. J. Educ.</source> <volume>1</volume>, <fpage>1</fpage>&#x2013;<lpage>4</lpage>. doi: <pub-id pub-id-type="doi">10.36752/1764-001-003-001</pub-id></mixed-citation></ref>
<ref id="ref5"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Atesgoz</surname><given-names>N. N.</given-names></name> <name><surname>Sak</surname><given-names>U.</given-names></name></person-group> (<year>2021</year>). <article-title>Test of scientific creativity animations for children: development and validity study</article-title>. <source>Think. Skills Creat.</source> <volume>40</volume>:<fpage>100818</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tsc.2021.100818</pub-id></mixed-citation></ref>
<ref id="ref6"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ayas</surname><given-names>M. B.</given-names></name> <name><surname>Sak</surname><given-names>U.</given-names></name></person-group> (<year>2014</year>). <article-title>Objective measure of scientific creativity: psychometric validity of the creative scientific ability test</article-title>. <source>Think. Skills Creat.</source> <volume>13</volume>, <fpage>195</fpage>&#x2013;<lpage>205</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tsc.2014.06.001</pub-id></mixed-citation></ref>
<ref id="ref8"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Baer</surname><given-names>J.</given-names></name></person-group> (<year>1998</year>). <article-title>The case for domain specificity of creativity</article-title>. <source>Creat. Res. J.</source> <volume>11</volume>, <fpage>173</fpage>&#x2013;<lpage>177</lpage>. doi: <pub-id pub-id-type="doi">10.1207/s15326934crj1102_7</pub-id></mixed-citation></ref>
<ref id="ref9"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Beghetto</surname><given-names>R. A.</given-names></name> <name><surname>Kaufman</surname><given-names>J. C.</given-names></name></person-group> (<year>2010</year>). <source>Nurturing creativity in the classroom</source>. <publisher-loc>Cambridge</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>.</mixed-citation></ref>
<ref id="ref10"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bliersbach</surname><given-names>M.</given-names></name> <name><surname>Reiners</surname><given-names>C. S.</given-names></name></person-group> (<year>2017</year>). <article-title>Kreativit&#x00E4;t und Chemie?</article-title> <source>Chem. Unserer Zeit.</source> <volume>51</volume>, <fpage>324</fpage>&#x2013;<lpage>331</lpage>. doi: <pub-id pub-id-type="doi">10.1002/ciuz.201700796</pub-id></mixed-citation></ref>
<ref id="ref11"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chand</surname><given-names>I.</given-names></name> <name><surname>Runco</surname><given-names>M. A.</given-names></name></person-group> (<year>1993</year>). <article-title>Problem finding skills as components in the creative process</article-title>. <source>Pers. Individ. Dif.</source> <volume>14</volume>, <fpage>155</fpage>&#x2013;<lpage>162</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0191-8869(93)90185-6</pub-id></mixed-citation></ref>
<ref id="ref12"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cicchetti</surname><given-names>D. V.</given-names></name></person-group> (<year>1994</year>). <article-title>Guidelines, criteria, and rules of thumb for evaluating normed and standardized assessment instruments in psychology</article-title>. <source>Psychol. Assess.</source> <volume>6</volume>, <fpage>284</fpage>&#x2013;<lpage>290</lpage>. doi: <pub-id pub-id-type="doi">10.1037/1040-3590.6.4.284</pub-id></mixed-citation></ref>
<ref id="ref13"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Clark</surname><given-names>S. G.</given-names></name> <name><surname>Wallace</surname><given-names>R. L.</given-names></name></person-group> (<year>2015</year>). <article-title>Integration and interdisciplinarity: concepts, frameworks, and education</article-title>. <source>Policy. Sci.</source> <volume>48</volume>, <fpage>233</fpage>&#x2013;<lpage>255</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11077-015-9210-4</pub-id></mixed-citation></ref>
<ref id="ref14"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Einstein</surname><given-names>A.</given-names></name> <name><surname>Infeld</surname><given-names>L.</given-names></name></person-group> (<year>1938</year>). <source>The evolution of physics</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Simon &#x0026; Schuster</publisher-name>.</mixed-citation></ref>
<ref id="ref15"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Enger</surname><given-names>K. E.</given-names></name> <name><surname>Yager</surname><given-names>R. E.</given-names></name></person-group> (<year>1998</year>). <source>The Iowa assessment handbook</source>. <publisher-loc>Iowa City, IA</publisher-loc>: <publisher-name>University of Iowa, Science Education Center</publisher-name>.</mixed-citation></ref>
<ref id="ref16"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Feldhusen</surname><given-names>J. F.</given-names></name></person-group> (<year>2006</year>). &#x201C;<chapter-title>The role of the knowledge base in creative thinking</chapter-title>&#x201D; in <source>Creativity and reason in cognitive development</source>. eds. <person-group person-group-type="editor"><name><surname>Kaufman</surname><given-names>J. C.</given-names></name> <name><surname>Baer</surname><given-names>J.</given-names></name></person-group> (<publisher-loc>Cambridge</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>), <fpage>137</fpage>&#x2013;<lpage>144</lpage>.</mixed-citation></ref>
<ref id="ref9002"><mixed-citation><person-group person-group-type="author"><name><surname>Hayton</surname><given-names>J. C.</given-names></name> <name><surname>Allen</surname><given-names>D. G.</given-names></name> <name><surname>Scarpello</surname><given-names>V.</given-names></name></person-group> (<year>2004</year>). <article-title>Factor retention decisions in exploratory factor analysis: A tutorial on parallel analysis</article-title>. <source>Organizational Research Methods</source>, <volume>7</volume>, <fpage>191</fpage>&#x2013;<lpage>205</lpage>. doi: <pub-id pub-id-type="doi">10.1177/1094428104263675</pub-id></mixed-citation></ref>
<ref id="ref17"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname><given-names>W.</given-names></name> <name><surname>Adey</surname><given-names>P.</given-names></name></person-group> (<year>2002</year>). <article-title>A scientific creativity test for secondary school students</article-title>. <source>Int. J. Sci. Educ.</source> <volume>24</volume>, <fpage>389</fpage>&#x2013;<lpage>403</lpage>. doi: <pub-id pub-id-type="doi">10.1080/09500690110098912</pub-id></mixed-citation></ref>
<ref id="ref18"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname><given-names>X.</given-names></name> <name><surname>Bi</surname><given-names>H.</given-names></name></person-group> (<year>2025</year>). <article-title>Exploring and validating the componential model of students' scientific critical thinking in science education</article-title>. <source>Think. Skills Creat.</source> <volume>55</volume>:<fpage>101695</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tsc.2024.101695</pub-id></mixed-citation></ref>
<ref id="ref19"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname><given-names>W.</given-names></name> <name><surname>Han</surname><given-names>Q.</given-names></name></person-group> (<year>2006</year>). <article-title>A developmental study on primary school students' creative scientific question-asking ability</article-title>. <source>Psychol. Sci.</source> <volume>29</volume>, <fpage>944</fpage>&#x2013;<lpage>946</lpage>. doi: <pub-id pub-id-type="doi">10.16719/j.cnki.1671-6981.2006.04.044</pub-id></mixed-citation></ref>
<ref id="ref20"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kaufman</surname><given-names>J. C.</given-names></name> <name><surname>Beghetto</surname><given-names>R. A.</given-names></name></person-group> (<year>2009</year>). <article-title>Beyond big and little: the four c model of creativity</article-title>. <source>Rev. Gen. Psychol.</source> <volume>13</volume>, <fpage>1</fpage>&#x2013;<lpage>12</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0013688</pub-id></mixed-citation></ref>
<ref id="ref21"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kind</surname><given-names>P. M.</given-names></name> <name><surname>Kind</surname><given-names>V.</given-names></name></person-group> (<year>2007</year>). <article-title>Creativity in science education: perspectives and challenges for developing school science</article-title>. <source>Stud. Sci. Educ.</source> <volume>43</volume>, <fpage>1</fpage>&#x2013;<lpage>37</lpage>. doi: <pub-id pub-id-type="doi">10.1080/03057260708560225</pub-id></mixed-citation></ref>
<ref id="ref22"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Klahr</surname><given-names>D.</given-names></name> <name><surname>Dunbar</surname><given-names>K.</given-names></name></person-group> (<year>1988</year>). <article-title>Dual space search during scientific reasoning</article-title>. <source>Cogn. Sci.</source> <volume>12</volume>, <fpage>1</fpage>&#x2013;<lpage>48</lpage>. doi: <pub-id pub-id-type="doi">10.1207/s15516709cog1201_1</pub-id></mixed-citation></ref>
<ref id="ref23"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname><given-names>W.-L.</given-names></name> <name><surname>Lien</surname><given-names>Y.-W.</given-names></name></person-group> (<year>2013</year>). <article-title>The different role of working memory in open-ended versus closed-ended creative problem solving: a dual-process theory account</article-title>. <source>Creat. Res. J.</source> <volume>25</volume>, <fpage>85</fpage>&#x2013;<lpage>96</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10400419.2013.752249</pub-id></mixed-citation></ref>
<ref id="ref24"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Mansfield</surname><given-names>R. S.</given-names></name> <name><surname>Busse</surname><given-names>T. V.</given-names></name></person-group> (<year>1981</year>). <source>The psychology of creativity and discovery: scientists and their work</source>. <publisher-loc>Chicago, IL</publisher-loc>: <publisher-name>Nelson-Hall</publisher-name>.</mixed-citation></ref>
<ref id="ref25"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Mayer</surname><given-names>R. E.</given-names></name></person-group> (<year>2006</year>). &#x201C;<chapter-title>The role of domain knowledge in creative problem solving</chapter-title>&#x201D; in <source>Creativity and reason in cognitive development</source>. eds. <person-group person-group-type="editor"><name><surname>Kaufman</surname><given-names>J. C.</given-names></name> <name><surname>Baer</surname><given-names>J.</given-names></name></person-group> (<publisher-loc>Cambridge</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>), <fpage>145</fpage>&#x2013;<lpage>158</lpage>.</mixed-citation></ref>
<ref id="ref9001"><mixed-citation><person-group person-group-type="author"><name><surname>Montag</surname><given-names>C.</given-names></name> <name><surname>Walla</surname><given-names>P.</given-names></name></person-group> (<year>2016</year>). <article-title>Carpe diem instead of losing your social mind: Beyond digital addiction and why we all suffer from digital overuse</article-title>. <source>Cogent Psychology</source>,  <volume>3</volume>:<fpage>1157281</fpage>. doi: <pub-id pub-id-type="doi">10.1080/23311908.2016.1157281</pub-id></mixed-citation></ref>
<ref id="ref26"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mostafa</surname><given-names>M. M.</given-names></name> <name><surname>Ibrahim</surname><given-names>A. R.</given-names></name> <name><surname>Nemt-allah</surname><given-names>M. A.</given-names></name> <name><surname>Arafa</surname><given-names>S. Z.</given-names></name> <name><surname>Hassan</surname><given-names>A. A.</given-names></name> <name><surname>Helali</surname><given-names>M. M.</given-names></name></person-group> (<year>2025</year>). <article-title>Development and psychometric validation of the brain rot scale: measuring digital content overconsumption among generation alpha and generation Z</article-title>. <source>Eur. J. Investig. Health Psychol. Educ.</source> <volume>15</volume>:<fpage>262</fpage>. doi: <pub-id pub-id-type="doi">10.3390/ejihpe15120262</pub-id>, <pub-id pub-id-type="pmid">41440168</pub-id></mixed-citation></ref>
<ref id="ref27"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mumford</surname><given-names>M. D.</given-names></name> <name><surname>Medeiros</surname><given-names>K. E.</given-names></name> <name><surname>Partlow</surname><given-names>P. J.</given-names></name></person-group> (<year>2012</year>). <article-title>Creative thinking: processes, strategies, and knowledge</article-title>. <source>J. Creat. Behav.</source> <volume>46</volume>, <fpage>30</fpage>&#x2013;<lpage>47</lpage>. doi: <pub-id pub-id-type="doi">10.1002/jocb.003</pub-id></mixed-citation></ref>
<ref id="ref28"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Nunnally</surname><given-names>J. C.</given-names></name> <name><surname>Bernstein</surname><given-names>I. H.</given-names></name></person-group> (<year>1994</year>). <source>Psychometric theory</source>. <edition>3rd</edition> <italic>Edn</italic>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>McGraw-Hill</publisher-name>.</mixed-citation></ref>
<ref id="ref29"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Piffer</surname><given-names>D.</given-names></name></person-group> (<year>2012</year>). <article-title>Can creativity be measured? An attempt to clarify the notion of creativity and general directions for future research</article-title>. <source>Think. Skills Creat.</source> <volume>7</volume>, <fpage>258</fpage>&#x2013;<lpage>264</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tsc.2012.04.009</pub-id></mixed-citation></ref>
<ref id="ref30"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Plucker</surname><given-names>J.</given-names></name> <name><surname>Beghetto</surname><given-names>R. A.</given-names></name> <name><surname>Dow</surname><given-names>G.</given-names></name></person-group> (<year>2004</year>). <article-title>Why isn't creativity more important to educational psychologists? Potential, pitfalls, and future directions in creativity research</article-title>. <source>Educ. Psychol.</source> <volume>39</volume>, <fpage>83</fpage>&#x2013;<lpage>96</lpage>. doi: <pub-id pub-id-type="doi">10.1207/s15326985ep3902_1</pub-id></mixed-citation></ref>
<ref id="ref31"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Raykov</surname><given-names>T.</given-names></name></person-group> (<year>1997</year>). <article-title>Estimation of composite reliability for congeneric measures</article-title>. <source>Appl. Psychol. Meas.</source> <volume>21</volume>, <fpage>173</fpage>&#x2013;<lpage>184</lpage>. doi: <pub-id pub-id-type="doi">10.1177/01466216970212006</pub-id></mixed-citation></ref>
<ref id="ref32"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sak</surname><given-names>U.</given-names></name> <name><surname>Ayas</surname><given-names>M. B.</given-names></name></person-group> (<year>2013</year>). <article-title>Creative scientific ability test (C-SAT): a new measure of scientific creativity</article-title>. <source>Psychol. Test Assess. Model.</source> <volume>55</volume>, <fpage>316</fpage>&#x2013;<lpage>329</lpage>. doi: <pub-id pub-id-type="doi">10.1037/t72324-000</pub-id></mixed-citation></ref>
<ref id="ref33"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Saleh</surname><given-names>R.</given-names></name> <name><surname>Brem</surname><given-names>A.</given-names></name></person-group> (<year>2023</year>). <article-title>Creativity for sustainability: an integrative literature review</article-title>. <source>J. Clean. Prod.</source> <volume>388</volume>:<fpage>135848</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jclepro.2023.135848</pub-id></mixed-citation></ref>
<ref id="ref34"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shen</surname><given-names>W.</given-names></name> <name><surname>Wang</surname><given-names>Y.</given-names></name> <name><surname>Liu</surname><given-names>C.</given-names></name></person-group> (<year>2010</year>). <article-title>The neural basis of artistic creativity</article-title>. <source>Adv. Psychol. Sci.</source> <volume>18</volume>, <fpage>1520</fpage>&#x2013;<lpage>1528</lpage>.</mixed-citation></ref>
<ref id="ref35"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Silvia</surname><given-names>P. J.</given-names></name> <name><surname>Kaufman</surname><given-names>J. C.</given-names></name> <name><surname>Pretz</surname><given-names>J. E.</given-names></name></person-group> (<year>2009</year>). <article-title>Is creativity domain-specific? Latent class models of creative accomplishments and creative self-descriptions</article-title>. <source>Psychol. Aesthet. Creat. Arts</source> <volume>3</volume>, <fpage>139</fpage>&#x2013;<lpage>148</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0014940</pub-id></mixed-citation></ref>
<ref id="ref36"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Simon</surname><given-names>H. A.</given-names></name></person-group> (<year>1977</year>). <source>Models of discovery</source>. <publisher-loc>Dordrecht</publisher-loc>: <publisher-name>D. Reidel</publisher-name>.</mixed-citation></ref>
<ref id="ref37"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Steiner</surname><given-names>G.</given-names></name></person-group> (<year>2025</year>). &#x201C;<chapter-title>Transdisciplinarity for mastering poly-crises by mutual learning between science and practice</chapter-title>&#x201D; in <source>Transdisciplinary thinking and acting: fundamentals and perspectives</source>. ed. <person-group person-group-type="editor"><name><surname>Sch&#x00FC;z</surname><given-names>M.</given-names></name></person-group> (<publisher-loc>Berlin</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>155</fpage>&#x2013;<lpage>182</lpage>.</mixed-citation></ref>
<ref id="ref38"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Steiner</surname><given-names>G.</given-names></name> <name><surname>Risopoulos</surname><given-names>F.</given-names></name> <name><surname>Mulej</surname><given-names>M.</given-names></name></person-group> (<year>2015</year>). <article-title>Social responsibility and citizen-driven innovation in sustainably mastering global socio-economic crises</article-title>. <source>Syst. Res. Behav. Sci.</source> <volume>32</volume>, <fpage>160</fpage>&#x2013;<lpage>167</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sres.2255</pub-id></mixed-citation></ref>
<ref id="ref39"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sternberg</surname><given-names>R. J.</given-names></name></person-group> (<year>1985</year>). <article-title>Implicit theories of intelligence, creativity, and wisdom</article-title>. <source>J. Pers. Soc. Psychol.</source> <volume>49</volume>, <fpage>607</fpage>&#x2013;<lpage>627</lpage>. doi: <pub-id pub-id-type="doi">10.1037/0022-3514.49.3.607</pub-id></mixed-citation></ref>
<ref id="ref40"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sternberg</surname><given-names>R. J.</given-names></name> <name><surname>Lubart</surname><given-names>T. I.</given-names></name></person-group> (<year>1996</year>). <article-title>Investing in creativity</article-title>. <source>Am. Psychol.</source> <volume>51</volume>, <fpage>677</fpage>&#x2013;<lpage>688</lpage>. doi: <pub-id pub-id-type="doi">10.1037/0003-066X.51.7.677</pub-id></mixed-citation></ref>
<ref id="ref41"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Torrance</surname><given-names>E. P.</given-names></name></person-group> (<year>1974</year>). <source>The Torrance tests of creative thinking: Norms-technical manual research edition</source>. <publisher-loc>Princeton, NJ</publisher-loc>: <publisher-name>Personnel Press</publisher-name>.</mixed-citation></ref>
<ref id="ref42"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Treffinger</surname><given-names>D.</given-names></name> <name><surname>Young</surname><given-names>G.</given-names></name> <name><surname>Selby</surname><given-names>E.</given-names></name> <name><surname>Shepardson</surname><given-names>C.</given-names></name></person-group> (<year>2001</year>). &#x201C;<chapter-title>Definition and characteristics of creativity and creative thinking</chapter-title>&#x201D; in <source>Creative learning today</source>. ed. <person-group person-group-type="editor"><name><surname>Treffinger</surname><given-names>D.</given-names></name></person-group> (<publisher-loc>Sarasota, FL</publisher-loc>: <publisher-name>Centre for Creative Learning</publisher-name>).</mixed-citation></ref>
<ref id="ref43"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Weng</surname><given-names>W.</given-names></name> <name><surname>Liu</surname><given-names>C.</given-names></name> <name><surname>Zhao</surname><given-names>G.</given-names></name> <name><surname>Song</surname><given-names>L.</given-names></name> <name><surname>Zhang</surname><given-names>X.</given-names></name></person-group> (<year>2025</year>). <article-title>Intelligent assessment of scientific creativity by integrating data augmentation and pseudo-labeling</article-title>. <source>Information</source> <volume>16</volume>:<fpage>785</fpage>. doi: <pub-id pub-id-type="doi">10.3390/info16090785</pub-id></mixed-citation></ref>
<ref id="ref44"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wright</surname><given-names>K. B.</given-names></name></person-group> (<year>2005</year>). <article-title>Researching internet-based populations: advantages and disadvantages of online survey research, online questionnaire authoring software packages, and web survey services</article-title>. <source>J. Comput.-Mediat. Commun.</source> <volume>10</volume>:<fpage>JCMC1034</fpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1083-6101.2005.tb00259.x</pub-id></mixed-citation></ref>
<ref id="ref45"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yurt</surname><given-names>E.</given-names></name></person-group> (<year>2025</year>). <article-title>The creative problem-solving skills test: development and initial validation</article-title>. <source>Int. J. Educ. Math. Sci. Technol.</source> <volume>13</volume>, <fpage>761</fpage>&#x2013;<lpage>790</lpage>. doi: <pub-id pub-id-type="doi">10.46328/ijemst.4711</pub-id></mixed-citation></ref>
<ref id="ref46"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zeng</surname><given-names>L.</given-names></name> <name><surname>Proctor</surname><given-names>R. W.</given-names></name> <name><surname>Salvendy</surname><given-names>G.</given-names></name></person-group> (<year>2011</year>). <article-title>Can traditional divergent thinking tests be trusted in measuring and predicting real-world creativity?</article-title> <source>Creat. Res. J.</source> <volume>23</volume>, <fpage>24</fpage>&#x2013;<lpage>37</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10400419.2011.545713</pub-id></mixed-citation></ref>
<ref id="ref47"><mixed-citation publication-type="confproc"><person-group person-group-type="author"><name><surname>Zuehlke</surname><given-names>D.</given-names></name> <name><surname>Geweniger</surname><given-names>T.</given-names></name> <name><surname>Heimann</surname><given-names>U.</given-names></name> <name><surname>Villmann</surname><given-names>T.</given-names></name></person-group>. (<year>2009</year>). <chapter-title>Fuzzy Fleiss-kappa for comparison of fuzzy classifiers</chapter-title>. In <conf-name>Proceedings of the 17th European Symposium on Artificial Neural Networks (ESANN) (Bruges)</conf-name> Bruges, Belgium: d-side publications, <fpage>443</fpage>&#x2013;<lpage>448</lpage>.</mixed-citation></ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0001"><p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1137920/overview">S&#x00ED;lvio Manuel da Rocha Brito</ext-link>, Polytechnic Institute of Tomar (IPT), Portugal</p></fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0002"><p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3202615/overview">Abdul Wahid</ext-link>, Universitas Muhammadiyah Makassar, Indonesia</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3371908/overview">Firdaus Firdaus</ext-link>, Universitas Sains Al-Qur&#x2019;an, Indonesia</p></fn>
</fn-group>
</back>
</article>