<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" dtd-version="1.3" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Educ.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Education</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Educ.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2504-284X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/feduc.2026.1749760</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Development of a multidimensional questionnaire on students&#x00027; perceived authenticity in science learning contexts</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Senel</surname> <given-names>Deniz C.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3092146"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Sch&#x000FC;ttler</surname> <given-names>Tobias</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Ertl</surname> <given-names>Bernhard</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/404686"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Watzka</surname> <given-names>Bianca</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<uri xlink:href="https://loop.frontiersin.org/people/2166883"/>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Didactics of Physics and Technology, RWTH Aachen University</institution>, <city>Aachen</city>, <country country="de">Germany</country></aff>
<aff id="aff2"><label>2</label><institution>DLR_School_Lab, German Aerospace Center (DLR)</institution>, <city>We&#x000DF;ling</city>, <country country="de">Germany</country></aff>
<aff id="aff3"><label>3</label><institution>Learning and Teaching with Media, Institute of Education, Universit&#x000E4;t der Bundeswehr M&#x000FC;nchen</institution>, <city>Neubiberg</city>, <country country="de">Germany</country></aff>
<author-notes>
<corresp id="c001"><label>&#x0002A;</label>Correspondence: Deniz C. Senel, <email xlink:href="mailto:senel@physik.rwth-aachen.de">senel@physik.rwth-aachen.de</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-13">
<day>13</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>11</volume>
<elocation-id>1749760</elocation-id>
<history>
<date date-type="received">
<day>19</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>13</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>14</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2026 Senel, Sch&#x000FC;ttler, Ertl and Watzka.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Senel, Sch&#x000FC;ttler, Ertl and Watzka</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-13">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Authentic learning environments are recognized as effective for increasing students&#x00027; interest and engagement in science education. However, the development and improvement of such environments are constrained by the absence of robust and comprehensive measurement tools for students&#x00027; perceptions of authenticity. Existing instruments often do not capture the multidimensional nature of authenticity. More recently, researchers have developed questionnaires that operationalize authenticity as a multidimensional construct in educational contexts. Yet, even these instruments do not address all theoretically relevant aspects of authenticity identified in established models. In this study, we therefore develop and validate a new questionnaire designed to measure students&#x00027; perceived authenticity in learning settings. The questionnaire comprises six dimensions: <italic>location, instructor, innovation, methods, materials</italic>, and <italic>content</italic>. Data were collected from <italic>N</italic> = 146 secondary school students at an out-of-school laboratory in Germany and analyzed using confirmatory factor analysis. The results indicate a six-factor solution aligned with the hypothesized model, with internal consistencies exceeding 0.75 for five of the six scales. The resulting instrument provides a more precise tool for assessing students&#x00027; perceptions of authenticity, facilitating a more accurate evaluation of authentic learning environments in science education and supporting the development of interventions to enhance authenticity in instructional design.</p></abstract>
<kwd-group>
<kwd>confirmatory factor analysis</kwd>
<kwd>disciplinary authenticity</kwd>
<kwd>instrument development</kwd>
<kwd>perceived authenticity</kwd>
<kwd>questionnaire validation</kwd>
<kwd>science communication</kwd>
</kwd-group>
<funding-group>
<award-group id="gs1">
<funding-source id="sp1">
<institution-wrap>
<institution>Deutsche Forschungsgemeinschaft</institution>
<institution-id institution-id-type="doi" vocab="open-funder-registry" vocab-identifier="10.13039/open_funder_registry">10.13039/501100001659</institution-id>
</institution-wrap>
</funding-source>
</award-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. We thank the Deutsche Forschungsgemeinschaft (German Research Foundation, DFG) for support through the Research Unit FOR 5599 on structured magnetic elastomers, project no. 511114185, via DFG grant reference no. WA 5276/1-1.</funding-statement>
</funding-group>
<counts>
<fig-count count="1"/>
<table-count count="7"/>
<equation-count count="0"/>
<ref-count count="65"/>
<page-count count="16"/>
<word-count count="12497"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>STEM Education</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<label>1</label>
<title>Introduction</title>
<p>Authenticity has become a central concept in science education, serving both as a guiding principle for designing learning environments and as a means to enhance students&#x00027; interest and engagement in science (<xref ref-type="bibr" rid="B19">Habig and Gupta, 2021</xref>). In response to critiques of traditional instruction, which often features tasks with procedural clarity and predetermined outcomes (<xref ref-type="bibr" rid="B11">Chinn and Malhotra, 2002</xref>), researchers have advocated for more authentic learning experiences that are intended to bridge the gap between science-based school activities and scientific practice (<xref ref-type="bibr" rid="B56">Schwartz et al., 2004</xref>).</p>
<p>Although authenticity is a widely used term in science education, it remains complex and multifaceted (<xref ref-type="bibr" rid="B1">Anker-Hansen and Andr&#x000E9;e, 2019</xref>). Various research domains highlight different aspects, including disciplinary realism, professional practice, real-world authenticity, and personal authenticity (<xref ref-type="bibr" rid="B34">Lee and Butler, 2003</xref>; <xref ref-type="bibr" rid="B64">Watkins et al., 2012</xref>; <xref ref-type="bibr" rid="B62">van Vorst et al., 2015</xref>; <xref ref-type="bibr" rid="B30">Kapon et al., 2018</xref>; <xref ref-type="bibr" rid="B53">Schriebl et al., 2023</xref>). A domain-oriented perspective conceptualizes authenticity (so-called &#x0201C;disciplinary authenticity&#x0201D;) as the extent to which learning environments mirror the epistemic, procedural, and contextual characteristics of actual scientific practice (<xref ref-type="bibr" rid="B2">Betz, 2018</xref>; <xref ref-type="bibr" rid="B59">Sommer et al., 2018</xref>). Building on this framework, <xref ref-type="bibr" rid="B16">Finger et al. (2022</xref>) conceptualize authenticity as a continuum from simplified tasks to complex, open-ended representations of professional practice. This study adopts this perspective and draws on the definition provided by <xref ref-type="bibr" rid="B42">Nachtigall et al. (2022</xref>, p. 1482), who, based primarily on seminal work by <xref ref-type="bibr" rid="B23">Herrington and Oliver (2000</xref>), describe authentic learning settings as &#x0201C;characterized by learners, who collaboratively try to solve a complex and ill-structured real-world problem through self-directed inquiry and investigation [...] together with practitioners or experts, in a real-world or professional setting, [...] using materials and tools that are either typically also applied by practitioners or are used in daily life.&#x0201D;</p>
<p>While this definition sets a high-level ideal of authentic learning, it is important to clarify that authenticity in science education does not require direct participation in professional research or immersion in real scientific institutions. Rather, authenticity can be meaningfully achieved through pedagogically designed representations of scientific practice&#x02014;by approximating core features such as epistemic openness, procedural reasoning, and the use of authentic tools or data within the constraints of school and outreach settings (<xref ref-type="bibr" rid="B3">Betz et al., 2016</xref>; <xref ref-type="bibr" rid="B48">Roth, 1995</xref>). Students do not need to generate novel scientific knowledge to experience learning as authentic. In this sense, learning is considered authentic when it reflects the routines, tools, and complexity of scientific work (<xref ref-type="bibr" rid="B6">Braund and Reiss, 2006</xref>).</p>
<p>However, authenticity is not only a property of learning environments but also emerges through the interaction between the learner and the learning context itself (<xref ref-type="bibr" rid="B26">Honebein et al., 1993</xref>; <xref ref-type="bibr" rid="B42">Nachtigall et al., 2022</xref>). As <xref ref-type="bibr" rid="B20">Habig et al. (2018</xref>) argue, students&#x00027; perceptions are not only influenced by features of the learning environment but are also shaped by their prior knowledge, beliefs and representations of science. This implies that even well-designed environments may not be perceived as authentic by all learners.</p>
<sec>
<label>1.1</label>
<title>Authenticity as a multidimensional construct</title>
<p>To conceptually capture the interaction between learner characteristics and environmental design features, (<xref ref-type="bibr" rid="B3">Betz et al. 2016</xref>) proposed a multidimensional model of authenticity in science communication (see <xref ref-type="fig" rid="F1">Figure 1</xref>). The model outlines how perceived authenticity emerges through a process called <italic>authentication</italic>, in which objectively authentic features of a learning environment are interpreted through the lens of the learner&#x00027;s individual characteristics, such as prior knowledge, interest, epistemological beliefs or experience. The model consists of five elements: (a) <italic>personal characteristics</italic>; (b) <italic>characteristics of the learning setting</italic>; (c) <italic>authentication through interaction</italic>; (d) <italic>an individual feeling of authenticity</italic>; and (e) <italic>its effects</italic>. These are organized into three conceptual parts: input (Part 1), interaction (Part 2), and output (Part 3).</p>
<fig position="float" id="F1">
<label>Figure 1</label>
<caption><p>Conceptual model of perceived authenticity in science education, based on the theoretical framework by <xref ref-type="bibr" rid="B3">Betz et al. (2016</xref>). It illustrates how authenticity emerges through the interaction between individual learner characteristics <bold>(a)</bold> and features of the learning environment <bold>(b)</bold>. This interaction <bold>(c)</bold> results in an individual perception of authenticity <bold>(d)</bold>, which in turn may affect motivational, cognitive, and behavioral outcomes <bold>(e)</bold>.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="feduc-11-1749760-g0001.tif">
<alt-text content-type="machine-generated">Conceptual diagram summarizing how personal characteristics and learning setting characteristics interact through an authentication process to shape individual perceptions of authenticity. These perceptions can result in affective, behavioral, and cognitive learning outcomes.</alt-text>
</graphic>
</fig>
<p>In the first part (input), a learner with their <italic>personal dispositions and characteristics</italic> (a) interacts with a <italic>learning setting and its design features</italic> (b). This interaction determines whether a student perceives the situation as authentic. The model identifies key dimensions of instructional design that act as cues for perceived authenticity, including <italic>location, instructors, methods, materials, content</italic>, and <italic>innovation</italic>. These features can be varied to convey more or less authenticity depending on the domain. Empirical studies show that physical materials (<xref ref-type="bibr" rid="B46">Peacock, 1997</xref>; <xref ref-type="bibr" rid="B38">Mierwald et al., 2018</xref>) and the learning location (<xref ref-type="bibr" rid="B55">Sch&#x000FC;ttler et al., 2021</xref>) often play particularly salient roles. Recent findings by <xref ref-type="bibr" rid="B24">Hohrath et al. (2024</xref>) further support these dimensions: In interviews following an experimental project day, students referred to authenticity cues such as location, instructor and materials when describing what they considered authentic research. In the second part (interaction), the two inputs (a) and (b) converge into the element <italic>authentication</italic> (c), describing how learners evaluate and interpret authenticity through their own dispositions, resulting in <italic>an individual perception of authenticity</italic> (d). In the final part (output), this perception may lead to various <italic>affective, cognitive</italic>, and <italic>behavioral effects</italic> (e), such as situational interest, motivation, changes in beliefs and the development of domain-specific competencies.</p>
</sec>
<sec>
<label>1.2</label>
<title>Relevance of assessing learners&#x00027; perceived authenticity</title>
<p>Beyond its conceptual relevance, learners&#x00027; perceived authenticity plays a central role in explaining the effects of authentic learning environments. A comprehensive review by <xref ref-type="bibr" rid="B42">Nachtigall et al. (2022</xref>), synthesizing 50 experimental and quasi-experimental studies, demonstrates that authentically designed learning settings frequently yield positive motivational and cognitive outcomes, such as increased situational interest, motivation, engagement, and learning performance. The results of this review suggest that authentic learning environments tend to foster motivational outcomes&#x02014;particularly situational interest&#x02014;more consistently than cognitive learning outcomes. For example, rich real-world materials and contexts are effective in triggering learners&#x00027; curiosity and engagement, as they are perceived as meaningful and relevant. At the same time, these same features may affect cognitive learning if the complexity of authentic materials exceeds learners&#x00027; processing capacities or if instructional guidance is insufficient. Consequently, authenticity-related gains in interest do not automatically translate into improved conceptual understanding. Rather, cognitive outcomes appear to depend on how different aspects of authenticity are realized and supported through instruction. This further underscores the importance of distinguishing between different dimensions of perceived authenticity when examining their effects on motivational vs. cognitive learning outcomes.</p>
<p>Empirical studies further substantiate this differentiation by demonstrating that specific dimensions of learners&#x00027; perceived authenticity are associated with motivational and cognitive learning outcomes in distinct ways (<xref ref-type="bibr" rid="B40">Nachtigall and Rummel, 2021</xref>). With regard to the authenticity of the method, <xref ref-type="bibr" rid="B24">Hohrath et al. (2024</xref>) showed that learners&#x00027; perceived method authenticity was positively related to knowledge acquisition, indicating that this dimension can directly support cognitive learning under appropriate instructional conditions. In contrast, the authenticity of the instructor appears to primarily affect motivational outcomes: <xref ref-type="bibr" rid="B21">Hagenk&#x000F6;tter et al. (2024</xref>) demonstrated that perceived instructor authenticity was associated with triggered situational interest, whereas no significant effects on knowledge outcomes were observed. A similar pattern emerges for material-related authenticity: <xref ref-type="bibr" rid="B65">Zachrich et al. (2024</xref>) reported that perceived authenticity of materials in the context of history education was associated with increased engagement and interest, while effects on cognitive learning outcomes were more variable. More evidence is provided by <xref ref-type="bibr" rid="B55">Sch&#x000FC;ttler et al. (2021</xref>), who showed that the authenticity of laboratory equipment selectively affected epistemic components of situational interest and learners&#x00027; perceived relevance of the learning content, whereas emotional and value-related interest components were less consistently influenced. With regard to location-related authenticity, <xref ref-type="bibr" rid="B55">Sch&#x000FC;ttler et al. (2021</xref>) demonstrated that perceived authenticity of the learning site positively influenced students&#x00027; situational interest and relevance perceptions during visits to out-of-school science laboratories, a finding consistent with earlier work by <xref ref-type="bibr" rid="B2">Betz (2018</xref>). In contrast, findings regarding knowledge acquisition are inconsistent: <xref ref-type="bibr" rid="B51">Scharfenberg et al. (2007</xref>) reported a positive effect of the learning location, whereas no positive effects were found by <xref ref-type="bibr" rid="B29">Itzek-Greulich et al. (2015</xref>). When it comes to the perceived authenticity of content and innovation in particular, empirical evidence remains scarce, as these aspects have rarely been examined as learners&#x00027; perceptions and instead often remain subsumed under broader design characteristics.</p>
<p>Conclusively, while empirical studies have begun to disentangle the effects of different dimensions of authenticity, empirical evidence on the effects of perceived authenticity remains fragmented, thereby motivating a multidimensional assessment approach.</p>
<p>This differentiated relationship between learners&#x00027; perceived authenticity and motivational vs. cognitive learning outcomes is also consistent with the previously described theoretical model of authenticity by <xref ref-type="bibr" rid="B3">Betz et al. (2016</xref>). In this model, perceived authenticity is conceptualized as a central mediating variable through which design elements of authentic learning environments influence learning processes and outcomes. In particular, the model assumes that authenticity primarily operates by enhancing learners&#x00027; engagement, relevance perceptions, and motivation, which may subsequently, but not necessarily, support cognitive learning. The empirically observed pattern of robust motivational effects but more variable cognitive outcomes aligns with this assumption (<xref ref-type="bibr" rid="B42">Nachtigall et al., 2022</xref>). It suggests that perceived authenticity may constitute a necessary but not sufficient condition for cognitive learning, which additionally depends on instructional support, task structure, and cognitive load. From this perspective, the present focus on learners&#x00027; perceived authenticity and its multidimensional assessment provides an important empirical basis for further examining and refining the mechanisms proposed in the model by (<xref ref-type="bibr" rid="B3">Betz et al. 2016</xref>).</p>
</sec>
<sec>
<label>1.3</label>
<title>Instruments for measuring authenticity</title>
<p>Despite the growing consensus on the multidimensionality of authenticity, as demonstrated by recent frameworks (e.g., <xref ref-type="bibr" rid="B2">Betz, 2018</xref>; <xref ref-type="bibr" rid="B43">Nachtigall et al., 2024</xref>; <xref ref-type="bibr" rid="B59">Sommer et al., 2018</xref>), this perspective has only gradually been reflected in empirical research. Earlier studies typically employed one-dimensional measures, such as global ratings or single items, to assess perceived authenticity (e.g., <xref ref-type="bibr" rid="B14">Engeln, 2004</xref>; <xref ref-type="bibr" rid="B45">Pawek, 2009</xref>; <xref ref-type="bibr" rid="B44">Nicaise et al., 2000</xref>). More recent studies have aimed to develop instruments that better reflect the multidimensional nature of authenticity by linking it to design elements of learning environments, such as <italic>location</italic> (<xref ref-type="bibr" rid="B54">Schriebl et al., 2021</xref>; <xref ref-type="bibr" rid="B55">Sch&#x000FC;ttler et al., 2021</xref>), <italic>instructional format and design</italic> (<xref ref-type="bibr" rid="B61">Sv&#x000E4;rd et al., 2024</xref>), and <italic>tools or materials</italic> (<xref ref-type="bibr" rid="B46">Peacock, 1997</xref>; <xref ref-type="bibr" rid="B55">Sch&#x000FC;ttler et al., 2021</xref>). Yet, many of these instruments assess only isolated aspects of authenticity or merge distinct dimensions into broader factors, thus failing to capture its full complexity.</p>
<p>A first validated multidimensional attempt was made by <xref ref-type="bibr" rid="B16">Finger et al. (2022</xref>), who developed a questionnaire to capture perceived authenticity in out-of-school settings. Their instrument, also known as FEWAW<xref ref-type="fn" rid="fn0003"><sup>1</sup></xref>, is based on the framework by <xref ref-type="bibr" rid="B3">Betz et al. (2016</xref>) and serves as the starting point for the present study. However, their confirmatory factor analysis did not support the proposed five-factor model. Instead, <italic>materials</italic> and <italic>methods</italic> collapsed into one factor (<italic>approach</italic>, &#x0201C;Vorgehen&#x0201D; in FEWAW). Furthermore, the instrument excluded the theoretically relevant dimension of <italic>content</italic>. Taken together, these findings motivated an extension of the original FEWAW instrument to differentiate six theoretically grounded dimensions of perceived authenticity, namely <italic>location, instructor, materials, methods, innovation</italic>, and <italic>content</italic> (see <xref ref-type="fig" rid="F1">Figure 1</xref>).</p>
</sec>
<sec>
<label>1.4</label>
<title>Aims and research questions</title>
<p>Based on theoretical considerations and previous empirical findings, the aims of this study are to develop and validate an extended multidimensional instrument for assessing perceived authenticity in science education. To address this, the following questions (RQs) guide our research:</p>
<list list-type="bullet">
<list-item><p>RQ1 (factorial structure): Does the adapted and extended version of the FEWAW questionnaire reflect a six-factor structure corresponding to the dimensions of <italic>location, instructor, materials, methods, innovation</italic>, and <italic>content</italic>?</p></list-item>
<list-item><p>RQ2 (psychometric properties): To what extent does the revised instrument demonstrate psychometric quality across key dimensions of scale validation?</p></list-item>
</list>
<list list-type="bullet">
<list-item><p>RQ2.1 (internal consistency): Do all the scales show sufficient internal consistency (e.g., McDonald&#x00027;s &#x003C9;&#x02265;0.70), indicating reliable measurement of each construct?</p></list-item>
<list-item><p>RQ2.2 (discriminant validity): Are all dimensions empirically distinguishable, as indicated by latent correlations below 0.80 (<xref ref-type="bibr" rid="B9">Cheung et al., 2024</xref>) and Heterotrait-Monotrait (HTMT) ratios of correlations below 0.85 (<xref ref-type="bibr" rid="B22">Henseler et al., 2015</xref>)?</p></list-item>
<list-item><p>RQ2.3 (convergent validity): Are the scales positively and significantly correlated with theoretically related constructs such as general authenticity and is the Average Variance Extracted (AVE) for each dimension 0.50 or greater (<xref ref-type="bibr" rid="B18">Fornell and Larcker, 1981</xref>)?</p></list-item>
<list-item><p>RQ2.4 (measurement invariance): Does the instrument yield comparable scores across different learner groups, as shown by measurement invariance?</p></list-item>
</list>
</sec>
</sec>
<sec id="s2">
<label>2</label>
<title>Methods</title>
<p>In the following, we will first describe the development of the instrument, then outline the sample and the setting in which this study took place and finally present the procedures used for data analysis.</p>
<sec>
<label>2.1</label>
<title>Instrument development</title>
<sec>
<label>2.1.1</label>
<title>Approach for a new multidimensional instrument on authenticity</title>
<p>In this study, we aim to develop and evaluate a refined set of scales that distinguishes key components of disciplinary authenticity, drawing on the authenticity framework proposed by <xref ref-type="bibr" rid="B3">Betz et al. (2016</xref>). The resulting instrument comprises six theoretically derived dimensions: <italic>location, instructor, materials, methods, innovation</italic>, and the newly introduced dimension <italic>content</italic>. To address issues of conceptual overlap and insufficient discrimination, the definitions for the <italic>materials</italic> and <italic>methods</italic> scales were revised and a new definition was created for <italic>content</italic>, while the original definitions for <italic>location, instructor</italic>, and <italic>innovation</italic> were mostly retained. In addition, each dimension is explicitly differentiated from other related dimensions to ensure conceptual clarity and to avoid overlap in interpretation. As the original definitions were formulated in German, the following section provides English translations of all six dimensions, including the revised and newly developed ones.</p>
<p><italic>Location</italic> refers to the physical context surrounding the learning setting. This dimension captures how authentically students perceive the buildings, rooms and places visited. It also includes locations beyond student laboratories, such as botanical gardens, excavation sites or research vessels (<xref ref-type="bibr" rid="B6">Braund and Reiss, 2006</xref>). A location is considered authentic if it is actually or potentially used for scientific work (<xref ref-type="bibr" rid="B55">Sch&#x000FC;ttler et al., 2021</xref>). This dimension differs from <italic>instructor, materials</italic>, and <italic>methods</italic> in that it focuses solely on the spatial characteristics of the learning setting rather than on the people, artifacts or procedures involved in scientific work.</p>
<p><italic>Instructor</italic> refers to individuals who take on a teaching or guiding role within the learning activity. This dimension reflects how authentically students perceive these individuals. Instructors are considered authentic if they work professionally as scientists and offer direct access to real scientific practices within their discipline (<xref ref-type="bibr" rid="B44">Nicaise et al., 2000</xref>).</p>
<p><italic>Innovation</italic> refers to the novelty of the research question or problem addressed. A question is considered authentic if it is embedded in ongoing, relevant research and allows students to contribute to its resolution. The more central the inquiry into something genuinely new is and the less existing knowledge is merely received or replicated, the more innovative the project is perceived to be (<xref ref-type="bibr" rid="B58">Sommer et al., 2020</xref>). This dimension differs from <italic>content</italic> in that it focuses on the epistemic novelty of the task rather than on the scientific relevance of the subject matter itself.</p>
<p><italic>Methods</italic> refer to the specific scientific procedures used to investigate a research question. This dimension reflects the extent to which students perceive their working process as scientific. A method is considered authentic when it aligns with the standards of disciplinary inquiry and is embedded in a systematic process of knowledge generation. Typical examples include experimentation, modeling, simulation, data analysis or observation (<xref ref-type="bibr" rid="B4">Bolger et al., 2021</xref>). Although there is a pluralism of methods within scientific disciplines, in most cases, only one of these methods is focused on in educational contexts. This dimension differs from <italic>materials</italic> in that it concerns the scientific procedures themselves rather than the physical artifacts used to carry them out.</p>
<p><italic>Materials</italic> refer to all objects that students interact with during the activity, excluding instructional materials. This dimension reflects how authentic students perceive these materials. Materials are considered authentic when they originate from scientific research or closely resemble such materials in form, function and use, with minimal didactic simplification (<xref ref-type="bibr" rid="B59">Sommer et al., 2018</xref>). This includes both objects of investigation (e.g., soil samples, texts, interview transcripts) and instruments or visualizations that support real research (e.g., microscopes, measuring devices, simulations or lab software; <xref ref-type="bibr" rid="B57">Smetana and Bell, 2012</xref>). This dimension differs from <italic>methods</italic> in that it focuses on the physical artifacts used in scientific work and not on the procedural steps through which knowledge is generated.</p>
<p><italic>Content</italic> refers to the scientific topics, concepts or questions addressed during the learning activity. This dimension reflects how authentically students perceive the subject matter. Content is considered authentic when it relates to a real research topic in the discipline and has not been overly simplified or artificially constructed for instructional purposes (<xref ref-type="bibr" rid="B59">Sommer et al., 2018</xref>). This dimension differs from <italic>innovation</italic> in that it focuses on the relevance of the subject matter itself, not on the epistemic novelty or potential for generating new knowledge.</p>
<p>To clarify the conceptual refinements made to the original FEWAW instrument, it is necessary to specify how the present definitions differ from and expand upon those previously proposed by <xref ref-type="bibr" rid="B16">Finger et al. (2022</xref>).</p>
<p>In their version, <italic>materials</italic> were broadly defined as any non-instructional objects that students interact with, including objects of investigation (e.g., soil samples, texts) and research instruments (e.g., microscopes, indicator solutions). We mostly retained this two-part structure but made the criteria for authenticity more explicit by emphasizing the origin of the materials (i.e., from authentic scientific research) and their similarity in form, function and use to those typically found in scientific practice. Additionally, the definition was extended to include scientific visualizations and digital tools (e.g., simulations or laboratory software), which are widely used in science (<xref ref-type="bibr" rid="B57">Smetana and Bell, 2012</xref>).</p>
<p>Similarly, the original <italic>methods</italic> dimension referred to the scientific character of students&#x00027; activities and their participation in systematic inquiry. While the core idea was preserved, concrete examples of disciplinary procedures (e.g., experimenting, modeling and data analysis) were added to reflect the methodological diversity of scientific practice and to help learners identify what constitutes authentic scientific work (<xref ref-type="bibr" rid="B4">Bolger et al., 2021</xref>).</p></sec>
<sec>
<label>2.1.2</label>
<title>Item generation and refinement</title>
<p>The initial item pool was developed based on theoretically derived dimensions of perceived authenticity, using the FEWAW questionnaire by <xref ref-type="bibr" rid="B16">Finger et al. (2022</xref>) as the primary reference. Definitions for the dimensions <italic>location, instructor</italic>, and <italic>innovation</italic>, which showed empirical distinctiveness and acceptable mean values in the original study, were adopted with minor linguistic modifications for clarity and consistency. The original item sets for these three dimensions were retained to preserve continuity with the established scale structure. In contrast, new items were created for the <italic>methods, materials</italic>, and <italic>content</italic> dimensions according to the extended theoretical definitions. The <italic>content</italic> dimension, which was not included in the original instrument, was added to capture the perceived authenticity of scientific topics and disciplinary concepts (<xref ref-type="bibr" rid="B3">Betz et al., 2016</xref>).</p>
<p>To refine and validate the item pool, several iterative rounds of theoretical and linguistic review were conducted. A group of eight experts in science education, including professors, teachers, and doctoral students, as well as a group of five secondary school students, independently classified each item into one of the six dimensions of perceived authenticity. For this purpose, all participants were provided with the item pool and the corresponding dimensions. In addition to the classification task, students were asked to provide feedback on the linguistic comprehensibility of the items using an optional open-response format. Experts were additionally asked to evaluate item unidimensionality, that is, whether each item clearly reflected only one dimension or could plausibly be assigned to multiple dimensions. This qualitative feedback was incorporated into subsequent item revisions. Despite substantial inter-rater reliability (Fleiss&#x00027; &#x003BA;&#x0003E;0.85; <xref ref-type="bibr" rid="B33">Landis and Koch, 1977</xref>), several items required revision due to ambiguous or overlapping content.</p>
<p>Subsequent internal discussions focused on items that potentially reflected more than one dimension. For instance, several items in the <italic>materials</italic> and <italic>methods</italic> categories included implicit references to scientific instruments, also associated with the <italic>location</italic> dimension. To minimize anticipated side and cross-loadings, wording was refined to better represent the intended constructs. The conceptual distinction between <italic>content</italic> and <italic>innovation</italic> was also revisited, given the difficulty students may have in distinguishing novel scientific topics from those simply new to them.</p>
<p>Unlike the original FEWAW questionnaire, which used a response scale based on the perceived correctness of statements, the present version was designed to assess students&#x00027; subjective perceptions, aligning with the interpretative nature of perceived authenticity. Most items were formulated in the first-person perspective and used active constructions to encourage participants to draw on personal experiences rather than evaluate externally verifiable facts. A five-point Likert scale was implemented, ranging from &#x0201C;strongly disagree (1)&#x0201D; to &#x0201C;strongly agree (5).&#x0201D;</p></sec>
<sec>
<label>2.1.3</label>
<title>External validation criteria</title>
<p>To gather initial evidence for construct validity, selected external criteria theoretically related to specific aspects of perceived authenticity were included. Most validation scales were adapted from the original FEWAW study by <xref ref-type="bibr" rid="B16">Finger et al. (2022</xref>) with minor linguistic adjustments for stylistic consistency. These included measures of general authenticity (<xref ref-type="bibr" rid="B13">Damerau, 2012</xref>), authenticity of tasks (<xref ref-type="bibr" rid="B41">Nachtigall et al., 2018</xref>), perceived instructor expertise (<xref ref-type="bibr" rid="B28">Huber et al., 2009</xref>) and epistemological beliefs regarding the origin (<xref ref-type="bibr" rid="B32">Kremer, 2010</xref>) and changeability of knowledge (<xref ref-type="bibr" rid="B39">Moschner and Gruber, 2017</xref>).</p>
<p>Two additional short scales were included to reflect the extended model structure. To further validate the <italic>methods</italic> scale, an adapted version of a measure on participation in scientific practices based on the PISA framework and revised according to <xref ref-type="bibr" rid="B10">Chi et al. (2018</xref>) was used. It assesses engagement in core elements of scientific inquiry such as planning, conducting, and reflecting on experiments. For the <italic>materials</italic> scale, we included a scale adapted from <xref ref-type="bibr" rid="B55">Sch&#x000FC;ttler et al. (2021</xref>) capturing the perceived authenticity of laboratory equipment and scientific tools used during the program. A summary of all validation scales (<italic>N</italic> &#x0003D; 39 items) and descriptive statistics is presented in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Overview of external validation scales including the number of items, means (<italic>M</italic>), standard deviations (SD), and internal consistencies (&#x003B1;).</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Source</bold></th>
<th valign="top" align="left"><bold>Scale</bold></th>
<th valign="top" align="center"><bold>Items</bold></th>
<th valign="top" align="center"><bold><italic>M</italic></bold></th>
<th valign="top" align="center"><bold>SD</bold></th>
<th valign="top" align="center"><bold>&#x003B1;</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B13">Damerau (2012</xref>)</td>
<td valign="top" align="left">General authenticity</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">3.37</td>
<td valign="top" align="center">0.97</td>
<td valign="top" align="center">0.78</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B41">Nachtigall et al. (2018</xref>)</td>
<td valign="top" align="left">Task and material authenticity</td>
<td valign="top" align="center">9</td>
<td valign="top" align="center">3.03</td>
<td valign="top" align="center">0.69</td>
<td valign="top" align="center">0.78</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B28">Huber et al. (2009</xref>)</td>
<td valign="top" align="left">Instructor expertise</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">4.15</td>
<td valign="top" align="center">0.86</td>
<td valign="top" align="center">0.89</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B32">Kremer (2010</xref>)</td>
<td valign="top" align="left">Epistemological beliefs: origin</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">2.56</td>
<td valign="top" align="center">0.94</td>
<td valign="top" align="center">0.85</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B39">Moschner and Gruber (2017</xref>)</td>
<td valign="top" align="left">Epistemological beliefs: changeability</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">3.56</td>
<td valign="top" align="center">0.68</td>
<td valign="top" align="center">0.74</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B10">Chi et al. (2018</xref>)</td>
<td valign="top" align="left">Participation in scientific practices</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">3.40</td>
<td valign="top" align="center">0.74</td>
<td valign="top" align="center">0.70</td>
</tr>
<tr>
<td valign="top" align="left"><xref ref-type="bibr" rid="B55">Sch&#x000FC;ttler et al. (2021</xref>)</td>
<td valign="top" align="left">Perceived authenticity of lab equipment</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">2.98</td>
<td valign="top" align="center">0.96</td>
<td valign="top" align="center">0.83</td>
</tr></tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec>
<label>2.2</label>
<title>Sample and setting</title>
<p>A total of <italic>N</italic> &#x0003D; 146 secondary school students participated in this study. The sample included 55 students (37.7%) from 10th grade and 68 (46.6%) from 11th grade. In terms of gender, 79 participants (54.1%) identified as male, 65 (44.5%) as female and 2 (1.4%) as diverse. The average age was 16.42 years (SD &#x0003D; 1.36).</p>
<p>Data collection took place between June and July 2025 at the DLR_School_Lab, an out-of-school science lab in Germany. The full-day extracurricular program engaged school classes in activities related to aerospace research, including flight simulation, infrared technology, robotics programming and satellite data analysis. The program followed a non-linear, station-based structure and covered a broad spectrum of topics under the overarching theme of &#x0201C;aeronautics and space.&#x0201D;</p>
<p>To ensure standardized administration, instructors received written guidelines outlining the procedure. Students were informed that the questionnaire was part of a scientific study investigating their impressions of authentic learning environments in the out-of-school lab. Participation was voluntary and students were assured that their responses would be anonymized and used exclusively for research and quality-improvement purposes. As part of the general admission process for the out-of-school program, written parental consent for participation in research-related evaluation activities had already been obtained. In addition, students received an information sheet explaining the purpose of the study. The study was conducted in accordance with the ethical standards approved by the Ethics Committee of Otto-von-Guericke University Magdeburg.</p>
<p>The questionnaire was administered in paper-and-pencil format and completed within approximately 30 minutes, directly after the final session of the program.</p>
</sec>
<sec>
<label>2.3</label>
<title>Data analysis</title>
<sec>
<label>2.3.1</label>
<title>Data preprocessing</title>
<p>All statistical analyses were conducted in R (RStudio version 2025.05.0, Build 496) using psychometric packages including <monospace>lavaan</monospace> (<xref ref-type="bibr" rid="B47">Rosseel, 2012</xref>). As the data were collected using a pencil-and-paper format, responses were digitized independently by two researchers. To assess data entry accuracy, each researcher independently re-digitized a subset of 15 questionnaires originally entered by the other, resulting in a total of 30 double-coded questionnaires. This procedure yielded excellent inter-rater agreement (Cohen&#x00027;s &#x003BA; &#x0003D; 0.998). Questionnaires with extensive missing data or implausible response patterns&#x02014;such as uniformly selecting the same option across scales or other typical indicators of careless responding (<xref ref-type="bibr" rid="B37">Meade and Craig, 2012</xref>)&#x02014;were excluded, resulting in a cleaned dataset of <italic>N</italic> &#x0003D; 130 valid cases. The full R script used for all data preprocessing steps and statistical analyses is provided as <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref> to this article.</p>
<p>Overall, 1.67% of item responses were missing and considered missing at random. Prior to model estimation, univariate and multivariate distributions were examined. Most items exhibited acceptable skewness and kurtosis, yet Mardia&#x00027;s test indicated significant multivariate skewness (<italic>b</italic><sub>1<italic>p</italic></sub> &#x0003D; 851.72, <italic>p</italic> &#x0003C; 0.001) but no excess kurtosis (<italic>b</italic><sub>2<italic>p</italic></sub> &#x0003D; 1838.57, <italic>p</italic> &#x0003D; 0.44), suggesting moderate deviations from normality (<xref ref-type="bibr" rid="B17">Finney and DiStefano, 2006</xref>). Therefore, all confirmatory factor analyses (CFA) were estimated using full information maximum likelihood (FIML) with a robust maximum likelihood estimator (MLR), which accounts for both non-normality and missing data (<xref ref-type="bibr" rid="B35">Little and Rubin, 2002</xref>).</p></sec>
<sec>
<label>2.3.2</label>
<title>Confirmatory factor analysis and model optimization</title>
<p>The initial CFA model included all items from the six theoretically defined dimensions. Model evaluation was based on standard fit indices: Comparative Fit Index (CFI), Tucker-Lewis Index (TLI), Root Mean Square Error of Approximation (RMSEA, 90% CI), Standardized Root Mean Square Residual (SRMR) and the chi-square to degrees of freedom ratio (&#x003C7;<sup>2</sup>/df). Good model fit is typically indicated by CFI/TLI&#x0003E;0.95, SRMR &#x0003C; 0.08, RMSEA &#x0003C; 0.06 and &#x003C7;<sup>2</sup>/df &#x02264; 2 (<xref ref-type="bibr" rid="B27">Hu and Bentler, 1999</xref>; <xref ref-type="bibr" rid="B31">Kline, 2016</xref>; <xref ref-type="bibr" rid="B52">Schermelleh-Engel et al., 2003</xref>).</p>
<p>To optimize model fit, an iterative item reduction procedure was applied, consistent with recommended and common practice in CFA. The three established dimensions&#x02014;<italic>location, instructor</italic>, and <italic>innovation</italic>&#x02014;were locked to preserve comparability with the original FEWAW instrument (<xref ref-type="bibr" rid="B16">Finger et al., 2022</xref>). Items of the remaining dimensions (<italic>methods, materials, content</italic>) were evaluated in multiple steps using established CFA thresholds (<xref ref-type="bibr" rid="B7">Brown, 2015</xref>; <xref ref-type="bibr" rid="B31">Kline, 2016</xref>): (1) strong cross-loadings as indicated by high modification indices (MI &#x0003E;10); (2) low standardized loadings (&#x003BB; &#x0003C; 0.40); and (3) low explained variance (<italic>R</italic><sup>2</sup> &#x0003C; 0.30). After each modification step, the model was re-estimated and fit indices recalculated until no further exclusions were warranted.</p>
<p>The resulting model was then conceptually inspected for content redundancy, theoretical representativeness and comparable scale lengths. Additional items were removed where appropriate to further improve model fit while maintaining adequate construct coverage.</p></sec>
<sec>
<label>2.3.3</label>
<title>Reliability</title>
<p>Once satisfactory fit indices were achieved, internal consistency was evaluated using McDonald&#x00027;s &#x003C9; as a measure of scale reliability under heterogeneous factor loadings. In addition, Cronbach&#x00027;s &#x003B1; was reported to ensure comparability with the original FEWAW instrument (<xref ref-type="bibr" rid="B16">Finger et al., 2022</xref>), where scale reliability was evaluated using this coefficient. Following common conventions, values of &#x003C9;&#x02265;0.70 and &#x003B1;&#x02265;0.70 were considered indicative of acceptable reliability (<xref ref-type="bibr" rid="B5">Bortz and D&#x000F6;ring, 2015</xref>; <xref ref-type="bibr" rid="B36">McDonald, 1999</xref>; <xref ref-type="bibr" rid="B9">Cheung et al., 2024</xref>).</p></sec>
<sec>
<label>2.3.4</label>
<title>Discriminant and convergent validity</title>
<p>Furthermore, discriminant and convergent validity were also assessed. Discriminant validity was examined by inspecting the latent inter-factor correlations among the FEWAW dimensions, with all correlations remaining below the recommended threshold of <italic>r</italic> &#x0003D; 0.80, indicating adequate separation of the constructs. Additionally, discriminant validity was assessed using the Heterotrait&#x02013;Monotrait (HTMT) ratio of correlations, defined as the ratio of the average correlations between items of different constructs to the average correlations between items within the same construct. HTMT therefore reflects the extent to which two scales overlap in what they measure, with values at or below 0.85 indicating that the dimensions are empirically separable (<xref ref-type="bibr" rid="B22">Henseler et al., 2015</xref>; <xref ref-type="bibr" rid="B9">Cheung et al., 2024</xref>). Convergent validity was evaluated by correlating latent factor scores with external validation scales to confirm theoretically expected relationships (<xref ref-type="bibr" rid="B7">Brown, 2015</xref>). In addition, the Average Variance Extracted (AVE) was examined for each dimension, with values of at least 0.50 indicating that a latent construct explains more variance in its indicators than is due to measurement error (<xref ref-type="bibr" rid="B18">Fornell and Larcker, 1981</xref>).</p></sec>
<sec>
<label>2.3.5</label>
<title>Measurement invariance</title>
<p>Finally, to test group equivalence, measurement invariance was examined for gender and grade level using a stepwise comparison of configural, metric, and scalar models. Following <xref ref-type="bibr" rid="B8">Chen (2007</xref>), changes of &#x00394;CFI &#x02264; 0.01 and &#x00394;RMSEA &#x02264; 0.015 were used as invariance criteria.</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="s3">
<label>3</label>
<title>Results</title>
<p>In the subsequent sections, we present the results of the confirmatory factor analysis addressing RQ1, followed by the evaluation of the psychometric properties addressing RQ2 and its sub-questions (RQ2.1&#x02013;RQ2.4).</p>
<sec>
<label>3.1</label>
<title>Confirmatory factor analysis (RQ1)</title>
<p>The model evaluation proceeded in three distinct stages of item refinement, each aimed at improving factorial validity while maintaining theoretical coverage, following the procedure described in Section 2.3.2. <xref ref-type="table" rid="T2">Table 2</xref> summarizes the evolution of model fit statistics across these steps.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Model fit statistics for different item sets across CFA iterations.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Model version</bold></th>
<th valign="top" align="center"><bold>No. of items</bold></th>
<th valign="top" align="center"><bold>&#x003C7;<sup>2</sup></bold></th>
<th valign="top" align="center"><bold>df</bold></th>
<th valign="top" align="center"><bold>CFI</bold></th>
<th valign="top" align="center"><bold>TLI</bold></th>
<th valign="top" align="center"><bold>RMSEA</bold></th>
<th valign="top" align="center"><bold>SRMR</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Full item set (1)</td>
<td valign="top" align="center">42</td>
<td valign="top" align="center">1,200.54</td>
<td valign="top" align="center">804</td>
<td valign="top" align="center">0.837</td>
<td valign="top" align="center">0.825</td>
<td valign="top" align="center">0.062</td>
<td valign="top" align="center">0.079</td>
</tr>
<tr>
<td valign="top" align="left">After statistical trimming (2)</td>
<td valign="top" align="center">32</td>
<td valign="top" align="center">616.83</td>
<td valign="top" align="center">449</td>
<td valign="top" align="center">0.907</td>
<td valign="top" align="center">0.898</td>
<td valign="top" align="center">0.054</td>
<td valign="top" align="center">0.073</td>
</tr>
<tr>
<td valign="top" align="left">After conceptual trimming (3)</td>
<td valign="top" align="center">21</td>
<td valign="top" align="center">214.81</td>
<td valign="top" align="center">174</td>
<td valign="top" align="center">0.962</td>
<td valign="top" align="center">0.954</td>
<td valign="top" align="center">0.042</td>
<td valign="top" align="center">0.070</td>
</tr></tbody>
</table>
</table-wrap>
<p>(1) Full item set</p>
<p>The initial CFA comprised all 42 items from the six theoretically derived dimensions of perceived authenticity. The model demonstrated acceptable overall fit, &#x003C7;<sup>2</sup>(804) &#x0003D; 1, 200.54, CFI &#x0003D; 0.84, TLI &#x0003D; 0.83, RMSEA &#x0003D; 0.062, SRMR &#x0003D; 0.079, with most items showing clear primary loadings and only small cross-loadings. However, the questionnaire length proved impractical for educational settings such as school-based laboratory visits. In these contexts, time and cognitive load are limited and the administration of 42 items, alongside other possible instruments, was not feasible. This test-ecological consideration prompted the need for item reduction, which was carried out not due to model misfit but to increase the instrument&#x00027;s practical usability.</p>
<p>(2) Statistical trimming</p>
<p>Based on the aforementioned trimming criteria, a first reduction was conducted following predefined statistical thresholds. This step resulted in the removal of 10 items. The revised 32-item model showed considerably improved fit: &#x003C7;<sup>2</sup>(449) &#x0003D; 616.83, CFI &#x0003D; 0.91, TLI &#x0003D; 0.90, RMSEA &#x0003D; 0.054, SRMR &#x0003D; 0.073. All six dimensions remained covered and scale structures were preserved.</p>
<p>(3) Conceptual trimming</p>
<p>A subsequent manual trimming phase was conducted to enhance the conceptual clarity of the instrument. Even though the retained items were statistically reasonable, further inspection revealed cases of overlapping phrasing, marginal <italic>R</italic><sup>2</sup> values (just above 0.30) or overly narrow content. This final model achieved an excellent fit: &#x003C7;<sup>2</sup>(174) &#x0003D; 214.81, CFI &#x0003D; 0.96, TLI &#x0003D; 0.95, RMSEA &#x0003D; 0.042, SRMR &#x0003D; 0.070. Overall, the final model explained <italic>R</italic><sup>2</sup> &#x0003D; 0.55 of item variance.</p>
<p>The final confirmatory factor model comprised six correlated latent variables representing the theorized dimensions of perceived authenticity: <italic>content, innovation, materials, methods, location</italic>, and <italic>instructor</italic>. Each factor in the final model was measured by three to five items that had been retained through sequential statistical and conceptual trimming procedures. <xref ref-type="table" rid="T3">Table 3</xref> displays the item codes, wording, descriptive statistics, and standardized factor loadings (&#x003BB;). All indicators were specified as continuous variables and the model was estimated using MLR with FIML for missing data.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Final CFA model: scales, item codes, item wordings, descriptive statistics (M, SD), and standardized factor loadings (&#x003BB;).</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Scale</bold></th>
<th valign="top" align="left"><bold>Code</bold></th>
<th valign="top" align="left"><bold>Item wording</bold></th>
<th valign="top" align="center"><bold><italic>M</italic></bold></th>
<th valign="top" align="center"><bold>SD</bold></th>
<th valign="top" align="center"><bold>&#x003BB;<sub>C</sub></bold></th>
<th valign="top" align="center"><bold>&#x003BB;<sub>IN</sub></bold></th>
<th valign="top" align="center"><bold>&#x003BB;<sub>MA</sub></bold></th>
<th valign="top" align="center"><bold>&#x003BB;<sub>ME</sub></bold></th>
<th valign="top" align="center"><bold>&#x003BB;<sub>L</sub></bold></th>
<th valign="top" align="center"><bold>&#x003BB;<sub>I</sub></bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Content</td>
<td valign="top" align="left">AUC1</td>
<td valign="top" align="left">The content I encountered was based on real scientific research.</td>
<td valign="top" align="center">3.42</td>
<td valign="top" align="center">1.13</td>
<td valign="top" align="center">0.729</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUC2</td>
<td valign="top" align="left">The content reflected what researchers actually work on.</td>
<td valign="top" align="center">3.59</td>
<td valign="top" align="center">1.04</td>
<td valign="top" align="center">0.764</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUC6</td>
<td valign="top" align="left">The content seemed closely related to real scientific questions.</td>
<td valign="top" align="center">3.12</td>
<td valign="top" align="center">1.07</td>
<td valign="top" align="center">0.706</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUC9</td>
<td valign="top" align="left">I had the impression that the topics were genuine research topics.</td>
<td valign="top" align="center">3.29</td>
<td valign="top" align="center">1.14</td>
<td valign="top" align="center">0.710</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Innovation</td>
<td valign="top" align="left">AUIN1</td>
<td valign="top" align="left">I tried to discover something new for science.</td>
<td valign="top" align="center">2.17</td>
<td valign="top" align="center">1.24</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.525</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUIN2</td>
<td valign="top" align="left">I helped science answer an important question.</td>
<td valign="top" align="center">1.70</td>
<td valign="top" align="center">1.14</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.418</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUIN3</td>
<td valign="top" align="left">I contributed to answering a current research question.</td>
<td valign="top" align="center">2.18</td>
<td valign="top" align="center">1.24</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.824</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Materials</td>
<td valign="top" align="left">AUMA2</td>
<td valign="top" align="left">I worked with instruments similar to those used in research.</td>
<td valign="top" align="center">3.05</td>
<td valign="top" align="center">1.06</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.765</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUMA5</td>
<td valign="top" align="left">I used materials that are also used in real research.</td>
<td valign="top" align="center">3.11</td>
<td valign="top" align="center">1.17</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.818</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUMA7</td>
<td valign="top" align="left">The instruments felt like genuine research devices in their use.</td>
<td valign="top" align="center">3.12</td>
<td valign="top" align="center">1.19</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.707</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUMA9</td>
<td valign="top" align="left">I used materials typical of scientific research.</td>
<td valign="top" align="center">3.11</td>
<td valign="top" align="center">1.12</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.757</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUMA10</td>
<td valign="top" align="left">The measuring instruments felt largely unmodified for teaching.</td>
<td valign="top" align="center">2.98</td>
<td valign="top" align="center">1.23</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.711</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Methods</td>
<td valign="top" align="left">AUME5</td>
<td valign="top" align="left">I proceeded in the same way as one would in science.</td>
<td valign="top" align="center">2.55</td>
<td valign="top" align="center">1.05</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.763</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUME8</td>
<td valign="top" align="left">I proceeded as I imagine researchers would.</td>
<td valign="top" align="center">2.61</td>
<td valign="top" align="center">1.02</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.654</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUME9</td>
<td valign="top" align="left">The way I worked reminded me of scientific research.</td>
<td valign="top" align="center">2.97</td>
<td valign="top" align="center">1.10</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.772</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Location</td>
<td valign="top" align="left">AUL1</td>
<td valign="top" align="left">I was in a place where real research is conducted.</td>
<td valign="top" align="center">4.19</td>
<td valign="top" align="center">1.12</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.867</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUL2</td>
<td valign="top" align="left">I worked in a place where research takes place.</td>
<td valign="top" align="center">3.87</td>
<td valign="top" align="center">1.28</td>
<td valign="top" align="center">0.305<sup>a</sup></td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.378<sup>a</sup></td>
<td valign="top" align="center">0.331<sup>a</sup></td>
<td valign="top" align="center">0.697</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUL3</td>
<td valign="top" align="left">I was in an environment where research is done.</td>
<td valign="top" align="center">4.35</td>
<td valign="top" align="center">1.06</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.824</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Instructor</td>
<td valign="top" align="left">AUI1</td>
<td valign="top" align="left">I was supported by a real researcher today.</td>
<td valign="top" align="center">3.02</td>
<td valign="top" align="center">1.43</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.903</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUI2</td>
<td valign="top" align="left">A scientist personally introduced me to research today.</td>
<td valign="top" align="center">2.88</td>
<td valign="top" align="center">1.31</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.701</td>
</tr>
 <tr>
<td/>
<td valign="top" align="left">AUI3</td>
<td valign="top" align="left">The person leading the project was a scientist.</td>
<td valign="top" align="center">3.16</td>
<td valign="top" align="center">1.38</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.809</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p><sup>a</sup>Despite no cross-loadings being estimated in the final CFA model, modification indices for item AUL2 indicate the hypothetical magnitude of cross-loadings that would improve global model fit if cross-loadings were permitted.</p>
</table-wrap-foot>
</table-wrap>
<p>The retained items loaded clearly and substantially on their intended factors, with standardized factor loadings ranging from &#x003BB; &#x0003D; 0.42 to 0.90. In five of the six dimensions, all items exceeded &#x003BB;&#x0003E;0.60. An exception to this pattern emerged within the <italic>innovation</italic> scale, where two of the three items (AUIN1: &#x003BB; &#x0003D; 0.53; AUIN2: &#x003BB; &#x0003D; 0.42) exhibited comparatively lower loadings.</p>
<p>Furthermore, no cross-loadings were estimated in the final model to preserve discriminant clarity. However, the modification indices indicated a small number of cross-factor relations that would have emerged if cross-loadings had been permitted in the model estimation. As shown in <xref ref-type="table" rid="T3">Table 3</xref>, despite a clear primary loading of AUL2 on <italic>location</italic> (AUL), modification indices indicate potential cross-loadings on <italic>materials</italic> (MI &#x0003D; 20.41, &#x003BB; &#x0003D; 0.38), <italic>methods</italic> (MI &#x0003D; 17.96, &#x003BB; &#x0003D; 0.33), and <italic>content</italic> (MI &#x0003D; 11.05, &#x003BB; &#x0003D; 0.31).</p>
</sec>
<sec>
<label>3.2</label>
<title>Psychometric properties (RQ2)</title>
<p>In line with RQ2 and its sub-questions (RQ2.1&#x02013;RQ2.4), we examined four central aspects of the psychometric quality of the revised instrument: Internal consistency, discriminant validity, convergent validity, and measurement invariance. The corresponding results are presented in the following subsections.</p>
<sec>
<label>3.2.1</label>
<title>Reliability and validity (RQ2.1&#x02013;RQ2.3)</title>
<sec>
<label>3.2.1.1</label>
<title>Internal consistency</title>
<p>To assess the reliability of the FEWAW dimensions, internal consistencies were examined using McDonald&#x00027;s &#x003C9; and Cronbach&#x00027;s &#x003B1; (see <xref ref-type="table" rid="T4">Table 4</xref>). McDonald&#x00027;s &#x003C9; and Cronbach&#x00027;s &#x003B1; coefficients ranged from &#x003C9; &#x0003D; 0.64 (<italic>innovation</italic>) to &#x003C9; &#x0003D; 0.87 (<italic>materials</italic>) and from &#x003B1; &#x0003D; 0.63 (<italic>innovation</italic>) to &#x003B1; &#x0003D; 0.87 (<italic>materials</italic>), respectively. With both &#x003C9; and &#x003B1; values above 0.75 for five of the six FEWAW dimensions, internal consistency was generally acceptable (see Section 2.3.3). Only the <italic>innovation</italic> dimension fell below commonly accepted thresholds, pointing to limited reliability of this scale (<xref ref-type="bibr" rid="B5">Bortz and D&#x000F6;ring, 2015</xref>; <xref ref-type="bibr" rid="B36">McDonald, 1999</xref>; <xref ref-type="bibr" rid="B9">Cheung et al., 2024</xref>).</p>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Internal consistencies (&#x003C9;, &#x003B1;), means (M), standard deviations (SD), and intercorrelations of the FEWAW dimensions (lower triangle only).</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Dimension</bold></th>
<th valign="top" align="center"><bold>&#x003C9;</bold></th>
<th valign="top" align="center"><bold>&#x003B1;</bold></th>
<th valign="top" align="center"><bold><italic>M</italic></bold></th>
<th valign="top" align="center"><bold>SD</bold></th>
<th valign="top" align="center"><bold>Content</bold></th>
<th valign="top" align="center"><bold>Innovation</bold></th>
<th valign="top" align="center"><bold>Materials</bold></th>
<th valign="top" align="center"><bold>Methods</bold></th>
<th valign="top" align="center"><bold>Location</bold></th>
<th valign="top" align="center"><bold>Instructor</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Content</td>
<td valign="top" align="center">0.82</td>
<td valign="top" align="center">0.82</td>
<td valign="top" align="center">3.36</td>
<td valign="top" align="center">0.88</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Innovation</td>
<td valign="top" align="center">0.64</td>
<td valign="top" align="center">0.63</td>
<td valign="top" align="center">2.02</td>
<td valign="top" align="center">0.91</td>
<td valign="top" align="center">0.19<sup>&#x0002A;</sup></td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Materials</td>
<td valign="top" align="center">0.87</td>
<td valign="top" align="center">0.87</td>
<td valign="top" align="center">3.94</td>
<td valign="top" align="center">0.93</td>
<td valign="top" align="center">0.67<sup>&#x0002A;&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">0.30<sup>&#x0002A;&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Methods</td>
<td valign="top" align="center">0.78</td>
<td valign="top" align="center">0.78</td>
<td valign="top" align="center">2.71</td>
<td valign="top" align="center">0.87</td>
<td valign="top" align="center">0.52<sup>&#x0002A;&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">0.40<sup>&#x0002A;&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">0.68<sup>&#x0002A;&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Location</td>
<td valign="top" align="center">0.83</td>
<td valign="top" align="center">0.83</td>
<td valign="top" align="center">4.14</td>
<td valign="top" align="center">1.00</td>
<td valign="top" align="center">0.45<sup>&#x0002A;&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">0.02</td>
<td valign="top" align="center">0.41<sup>&#x0002A;&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">0.21<sup>&#x0002A;</sup></td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Instructor</td>
<td valign="top" align="center">0.85</td>
<td valign="top" align="center">0.84</td>
<td valign="top" align="center">3.03</td>
<td valign="top" align="center">1.21</td>
<td valign="top" align="center">0.32<sup>&#x0002A;&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">0.22<sup>&#x0002A;</sup></td>
<td valign="top" align="center">0.44<sup>&#x0002A;&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">0.29<sup>&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">0.31<sup>&#x0002A;&#x0002A;&#x0002A;</sup></td>
<td valign="top" align="center">&#x02013;</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>All <italic>p</italic>-values were adjusted using Holm&#x00027;s method (<xref ref-type="bibr" rid="B25">Holm, 1979</xref>) and significance is denoted by <sup>&#x0002A;</sup><italic>p</italic> &#x0003C; 0.05, <sup>&#x0002A;&#x0002A;</sup><italic>p</italic> &#x0003C; 0.01, <sup>&#x0002A;&#x0002A;&#x0002A;</sup><italic>p</italic> &#x0003C; 0.001.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<label>3.2.1.2</label>
<title>Discriminant validity</title>
<p>To examine the distinctiveness of the FEWAW dimensions, we first inspected latent inter-factor correlations (see Section 2.3.4). Following the effect size conventions proposed by <xref ref-type="bibr" rid="B12">Cohen (1988</xref>), correlations of |<italic>r</italic>|&#x02248;0.10 are interpreted as small, |<italic>r</italic>|&#x02248;0.30 as medium and |<italic>r</italic>|&#x02248;0.50 as large effects. In line with common CFA practices, inter-factor correlations below <italic>r</italic> &#x0003D; 0.80 are additionally considered indicative of discriminant validity (<xref ref-type="bibr" rid="B7">Brown, 2015</xref>). Inter-dimension correlations were largely consistent with theoretical expectations. Dimensions tied to the realism of scientific work&#x02014;<italic>content, materials</italic>, and <italic>methods</italic>&#x02014;were moderately to strongly related (e.g., <italic>r</italic> &#x0003D; 0.67 for <italic>content</italic>&#x02013;<italic>materials</italic>; <italic>r</italic> &#x0003D; 0.68 for <italic>materials</italic>&#x02013;<italic>methods</italic>). Particularly high correlations between <italic>materials</italic> and <italic>methods</italic> suggest that students perceived the way experiments were conducted and the materials used as closely intertwined, while mean ratings indicate that <italic>materials</italic> were overall perceived as more authentic than <italic>methods</italic>. The <italic>innovation</italic> dimension showed the weakest inter-dimension correlations, with associations ranging from <italic>r</italic> &#x0003D; 0.02 to 0.40 and the lowest overall mean (<italic>M</italic> &#x0003D; 2.02), whereas the highest mean was found for the <italic>location</italic> dimension (<italic>M</italic> &#x0003D; 4.14). As a complementary criterion, discriminant validity was further examined using the Heterotrait-Monotrait (HTMT) ratio of correlations (see Section 2.3.4). Most HTMT values remained below the recommended threshold of 0.85, indicating sufficient separation between the FEWAW dimensions (see <xref ref-type="table" rid="T5">Table 5</xref>). The highest ratios were observed between <italic>materials</italic> and <italic>methods</italic> (HTMT &#x0003D; 0.83) as well as between <italic>materials</italic> and <italic>content</italic> (HTMT &#x0003D; 0.79).</p>
<table-wrap position="float" id="T5">
<label>Table 5</label>
<caption><p>HTMT ratios for the FEWAW dimensions (lower triangle only).</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Dimension</bold></th>
<th valign="top" align="center"><bold>Content</bold></th>
<th valign="top" align="center"><bold>Innovation</bold></th>
<th valign="top" align="center"><bold>Materials</bold></th>
<th valign="top" align="center"><bold>Methods</bold></th>
<th valign="top" align="center"><bold>Location</bold></th>
<th valign="top" align="center"><bold>Instructor</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Content</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Innovation</td>
<td valign="top" align="center">0.28</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Materials</td>
<td valign="top" align="center">0.79</td>
<td valign="top" align="center">0.42</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Methods</td>
<td valign="top" align="center">0.64</td>
<td valign="top" align="center">0.58</td>
<td valign="top" align="center">0.83</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Location</td>
<td valign="top" align="center">0.55</td>
<td valign="top" align="center">0.11</td>
<td valign="top" align="center">0.49</td>
<td valign="top" align="center">0.28</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Instructor</td>
<td valign="top" align="center">0.37</td>
<td valign="top" align="center">0.34</td>
<td valign="top" align="center">0.51</td>
<td valign="top" align="center">0.36</td>
<td valign="top" align="center">0.37</td>
<td valign="top" align="center">&#x02013;</td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>Values below the recommended threshold of 0.85 indicate sufficient discriminant validity (<xref ref-type="bibr" rid="B22">Henseler et al., 2015</xref>).</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<label>3.2.1.3</label>
<title>Convergent validity</title>
<p>Convergent validity was evaluated using two complementary approaches (see Section 2.3.4). First, we correlated latent factor scores with theoretically related external validation scales (see <xref ref-type="table" rid="T6">Table 6</xref>) to assess whether the FEWAW dimensions align with constructs that are conceptually linked to authenticity. The dimensions <italic>content, materials</italic>, and <italic>methods</italic> showed the strongest and most consistent associations across general authenticity (<italic>r</italic> &#x0003D; 0.51&#x02013;0.57<sup>&#x0002A;&#x0002A;&#x0002A;</sup>), task and material authenticity (<italic>r</italic> &#x0003D; 0.47&#x02013;0.64<sup>&#x0002A;&#x0002A;&#x0002A;</sup>), participation in scientific practices (<italic>r</italic> &#x0003D; 0.39&#x02013;0.42<sup>&#x0002A;&#x0002A;&#x0002A;</sup>) and perceived authenticity of lab equipment (<italic>r</italic> &#x0003D; 0.46&#x02013;0.67<sup>&#x0002A;&#x0002A;&#x0002A;</sup>). The <italic>location</italic> and <italic>instructor</italic> scales showed medium but consistent associations, whereas <italic>innovation</italic> displayed a distinct profile, including a selective association with epistemological beliefs about the <italic>origin of knowledge</italic> (<italic>r</italic> &#x0003D; 0.32<sup>&#x0002A;&#x0002A;</sup>). Second, we examined the Average Variance Extracted (AVE) for each dimension, where values at or above 0.50 indicate that a latent construct explains more variance in its indicators than is due to measurement error (<xref ref-type="bibr" rid="B18">Fornell and Larcker, 1981</xref>). The results for each scale were AVE<sub>AUC</sub> &#x0003D; 0.528, AVE<sub>AUMA</sub> &#x0003D; 0.564, AVE<sub>AUME</sub> &#x0003D; 0.539, AVE<sub>AUL</sub> &#x0003D; 0.625, AVE<sub>AUI</sub> &#x0003D; 0.658, while AVE<sub>AUIN</sub> &#x0003D; 0.386 fell slightly below, indicating weaker convergence within this factor.</p>
<table-wrap position="float" id="T6">
<label>Table 6</label>
<caption><p>Correlations between FEWAW dimensions and external validation scales.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>External scale</bold></th>
<th valign="top" align="center"><bold>Content</bold></th>
<th valign="top" align="center"><bold>Innovation</bold></th>
<th valign="top" align="center"><bold>Materials</bold></th>
<th valign="top" align="center"><bold>Methods</bold></th>
<th valign="top" align="center"><bold>Location</bold></th>
<th valign="top" align="center"><bold>Instructor</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">General authenticity</td>
<td valign="top" align="center"><bold>0.56<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center">0.27</td>
<td valign="top" align="center"><bold>0.57<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.51<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.44<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.45<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
</tr>
<tr>
<td valign="top" align="left">Task and material authenticity</td>
<td valign="top" align="center"><bold>0.57<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.32<sup>&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.64<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.47<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.32<sup>&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.33<sup>&#x0002A;&#x0002A;</sup></bold></td>
</tr>
<tr>
<td valign="top" align="left">Instructor expertise</td>
<td valign="top" align="center"><bold>0.34<sup>&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center">&#x02212;0.06</td>
<td valign="top" align="center"><bold>0.35<sup>&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center">0.19</td>
<td valign="top" align="center"><bold>0.44<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center">0.15</td>
</tr>
<tr>
<td valign="top" align="left">Epistemological beliefs: origin</td>
<td valign="top" align="center">&#x02212;0.09</td>
<td valign="top" align="center"><bold>0.32<sup>&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center">0.08</td>
<td valign="top" align="center">0.06</td>
<td valign="top" align="center">&#x02212;0.08</td>
<td valign="top" align="center">0.22</td>
</tr>
<tr>
<td valign="top" align="left">Epistemological beliefs: changeability</td>
<td valign="top" align="center"><bold>0.36<sup>&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center">0.11</td>
<td valign="top" align="center"><bold>0.30<sup>&#x0002A;</sup></bold></td>
<td valign="top" align="center">0.22</td>
<td valign="top" align="center">0.25</td>
<td valign="top" align="center">0.09</td>
</tr>
<tr>
<td valign="top" align="left">Participation in scientific practices</td>
<td valign="top" align="center"><bold>0.39<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center">0.13</td>
<td valign="top" align="center"><bold>0.42<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.42<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.35<sup>&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center">0.18</td>
</tr>
<tr>
<td valign="top" align="left">Perceived authenticity of lab equipment</td>
<td valign="top" align="center"><bold>0.54<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center">0.16</td>
<td valign="top" align="center"><bold>0.67<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.46<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.34<sup>&#x0002A;&#x0002A;</sup></bold></td>
<td valign="top" align="center"><bold>0.44<sup>&#x0002A;&#x0002A;&#x0002A;</sup></bold></td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>All <italic>p</italic>-values were adjusted using Holm&#x00027;s method (<xref ref-type="bibr" rid="B25">Holm, 1979</xref>) and significance is denoted by <sup>&#x0002A;</sup><italic>p</italic> &#x0003C; 0.05, <sup>&#x0002A;&#x0002A;</sup><italic>p</italic> &#x0003C; 0.01, <sup>&#x0002A;&#x0002A;&#x0002A;</sup><italic>p</italic> &#x0003C; 0.001. Values in bold indicate at least moderate and significant correlations with <italic>r</italic>&#x0003E;0.30 and <sup>&#x0002A;</sup><italic>p</italic> &#x0003C; 0.05.</p>
</table-wrap-foot>
</table-wrap>
</sec>
</sec>
<sec>
<label>3.2.2</label>
<title>Measurement invariance (RQ2.4)</title>
<p>To evaluate the robustness of the final six-factor structure, measurement invariance was tested across gender and grade level (see Section 2.3.5). A sequence of multiple-group CFA models was estimated using robust MLR estimation, comparing configural, metric, and scalar models following the recommendations by (<xref ref-type="bibr" rid="B8">Chen 2007</xref>). A <italic>post hoc</italic> power analysis was conducted using G*Power (Version 3.1.9.7) to assess the statistical sensitivity of the test (<xref ref-type="bibr" rid="B15">Faul et al., 2009</xref>). Based on the sample size of <italic>N</italic> &#x0003D; 130 and assuming a medium effect size (<italic>w</italic> &#x0003D; 0.30), the analysis indicated sufficient statistical power (1&#x02212;&#x003B2; &#x0003D; 0.87) to detect deviations from measurement equivalence in two groups. Model comparisons were based on changes in CFI and RMSEA, complemented by the Satorra&#x02013;Bentler scaled &#x003C7;<sup>2</sup> difference test (<xref ref-type="bibr" rid="B50">Satorra and Bentler, 2001</xref>). The results are summarized in <xref ref-type="table" rid="T7">Table 7</xref>.</p>
<table-wrap position="float" id="T7">
<label>Table 7</label>
<caption><p>Model fit statistics for measurement invariance of the six-factor model across gender and grade level.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left"><bold>Model</bold></th>
<th valign="top" align="center"><bold>&#x003C7;<sup>2</sup></bold></th>
<th valign="top" align="center"><bold>df</bold></th>
<th valign="top" align="center"><bold>CFI</bold></th>
<th valign="top" align="center"><bold>TLI</bold></th>
<th valign="top" align="center"><bold>RMSEA</bold></th>
<th valign="top" align="center"><bold>SRMR</bold></th>
<th valign="top" align="center"><bold><italic>&#x00394;&#x003C7;</italic><sup>2</sup></bold></th>
<th valign="top" align="center"><bold><italic>&#x00394;df</italic></bold></th>
<th valign="top" align="center"><bold><italic>p</italic></bold></th>
</tr>
</thead>
<tbody>
<tr style="background-color:#dee1e1;">
<td valign="top" align="left" colspan="10"><bold>Measurement invariance (gender)</bold></td>
</tr>
<tr>
<td valign="top" align="left">Configural invariance</td>
<td valign="top" align="center">512.00</td>
<td valign="top" align="center">348</td>
<td valign="top" align="center">0.855</td>
<td valign="top" align="center">0.825</td>
<td valign="top" align="center">0.094</td>
<td valign="top" align="center">0.095</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Metric invariance</td>
<td valign="top" align="center">528.38</td>
<td valign="top" align="center">363</td>
<td valign="top" align="center">0.854</td>
<td valign="top" align="center">0.831</td>
<td valign="top" align="center">0.093</td>
<td valign="top" align="center">0.105</td>
<td valign="top" align="center">16.38</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">0.358</td>
</tr>
<tr>
<td valign="top" align="left">Scalar invariance</td>
<td valign="top" align="center">548.00</td>
<td valign="top" align="center">378</td>
<td valign="top" align="center">0.850</td>
<td valign="top" align="center">0.834</td>
<td valign="top" align="center">0.092</td>
<td valign="top" align="center">0.107</td>
<td valign="top" align="center">19.21</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">0.204</td>
</tr>
<tr style="background-color:#dee1e1;">
<td valign="top" align="left" colspan="10"><bold>Measurement invariance (grade)</bold></td>
</tr>
<tr>
<td valign="top" align="left">Configural invariance</td>
<td valign="top" align="center">539.00</td>
<td valign="top" align="center">348</td>
<td valign="top" align="center">0.814</td>
<td valign="top" align="center">0.775</td>
<td valign="top" align="center">0.109</td>
<td valign="top" align="center">0.100</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Metric invariance</td>
<td valign="top" align="center">552.00</td>
<td valign="top" align="center">363</td>
<td valign="top" align="center">0.816</td>
<td valign="top" align="center">0.787</td>
<td valign="top" align="center">0.106</td>
<td valign="top" align="center">0.109</td>
<td valign="top" align="center">14.34</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">0.500</td>
</tr>
<tr>
<td valign="top" align="left">Scalar invariance</td>
<td valign="top" align="center">560.00</td>
<td valign="top" align="center">378</td>
<td valign="top" align="center">0.823</td>
<td valign="top" align="center">0.803</td>
<td valign="top" align="center">0.102</td>
<td valign="top" align="center">0.110</td>
<td valign="top" align="center">8.68</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">0.894</td>
</tr></tbody>
</table>
</table-wrap>
<p>Across both gender and grade level, changes in fit indices were negligible (&#x00394;CFI &#x02264; 0.01, &#x00394;RMSEA &#x02264; 0.015) and all Satorra&#x02013;Bentler &#x003C7;<sup>2</sup> difference tests were non-significant (<italic>p</italic>&#x0003E;0.20). These results indicate that the six-factor model is scalar invariant across groups.</p>
<p>Building on these results, we conducted group comparisons of observed scale means using non-parametric Mann&#x02013;Whitney <italic>U</italic>-tests (<xref ref-type="bibr" rid="B5">Bortz and D&#x000F6;ring, 2015</xref>). Across all six dimensions, no statistically significant differences were found between male and female students. Holm-adjusted <italic>p</italic>-values ranged from <italic>p</italic><sub>Holm</sub> &#x0003D; 0.194 to <italic>p</italic><sub>Holm</sub> &#x0003D; 1.000, with effect sizes ranging from <italic>r</italic> &#x0003D; &#x02212;0.102 to <italic>r</italic> &#x0003D; 0.114, indicating negligible group differences (<xref ref-type="bibr" rid="B25">Holm, 1979</xref>). Comparisons between students of different grades yielded a similar pattern. Although descriptive medians suggested slightly higher authenticity ratings for lower grade students in the <italic>methods, materials</italic>, and <italic>location</italic> dimensions, none of these differences reached statistical significance after Holm correction (<italic>p</italic><sub>Holm</sub> &#x0003D; 0.450&#x02013;1.000). The corresponding effect sizes were consistently small, with values ranging from <italic>r</italic> &#x0003D; &#x02212;0.130 to <italic>r</italic> &#x0003D; 0.171. These findings suggest that, beyond measurement equivalence, perceptions of authenticity were consistent across gender and grade level in this sample.</p>
</sec>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<label>4</label>
<title>Discussion</title>
<p>The present study aimed to validate an extended version of the FEWAW questionnaire for measuring students&#x00027; perceived authenticity in educational settings. The revised instrument includes six scales: <italic>content, innovation, materials, methods, location</italic>, and <italic>instructor</italic>. The following section discusses the findings in the context of the research questions (RQ1&#x02013;RQ2.4), focusing on the factorial structure, internal consistency, discriminant, and convergent validity and measurement invariance.</p>
<sec>
<label>4.1</label>
<title>Factorial structure (RQ1)</title>
<p>Confirmatory factor analysis supported the proposed six-factor structure with acceptable-to-excellent global fit and robust loadings (see <xref ref-type="table" rid="T2">Tables 2</xref>, <xref ref-type="table" rid="T3">3</xref>). This adds to the literature that has long argued for a multi-faceted, relational construct of authenticity in science education (<xref ref-type="bibr" rid="B2">Betz, 2018</xref>; <xref ref-type="bibr" rid="B42">Nachtigall et al., 2022</xref>). In contrast to earlier validation results in which <italic>materials</italic> and <italic>methods</italic> merged into a single factor (<xref ref-type="bibr" rid="B16">Finger et al., 2022</xref>), the present results empirically distinguish these subdimensions. Theoretically, this separation echoes the distinction between the <italic>artefactual</italic> basis of science (instruments, samples, devices) and the <italic>procedural</italic> orchestration of scientific inquiry (planning, measuring, analyzing)&#x02014;a difference that is central to disciplinary authenticity (<xref ref-type="bibr" rid="B64">Watkins et al., 2012</xref>; <xref ref-type="bibr" rid="B34">Lee and Butler, 2003</xref>). Disentangling these aspects enables instructional designers and researchers to reason about how specific design elements (e.g., access to professional tools vs. engagement in scientific practices) affect learners&#x00027; authenticity perceptions. The improved separation is likely due to iterative item clarification and tighter semantic boundaries between dimensions. By reducing wording overlaps (e.g., items that implicitly referenced both tools and procedures) and prioritizing first-person, experience-near formulations, we possibly minimized cross-loadings that otherwise threaten discriminant validity.</p>
</sec>
<sec>
<label>4.2</label>
<title>Psychometric properties (RQ2)</title>
<p>Overall, the results provide promising evidence that the extended FEWAW instrument demonstrates satisfactory psychometric quality across central aspects of scale validation. The majority of scales showed solid internal consistencies and most dimensions were empirically distinguishable despite theoretically expected associations among some constructs (e.g., <italic>materials</italic>&#x02013;<italic>methods, content</italic>&#x02013;<italic>materials</italic>). The patterns of correlations with external validation measures further supported the convergent validity of the dimensions, particularly for <italic>materials, content</italic>, and <italic>methods</italic>, which emerged as the most robust and theoretically coherent indicators of perceived authenticity in our sample. At the same time, the weaker performance of the <italic>innovation</italic> scale points to conceptual and psychometric limitations that warrant reconsideration in future revisions of the instrument. With respect to measurement invariance, the results tentatively suggest that the instrument functions similarly across gender and grade level. However, given the limited sample size, these findings should be interpreted with caution. Taken together, the findings indicate that the revised FEWAW represents a psychometrically robust instrument, while also recognizing specific areas where further research is needed.</p>
<p>In the following, we discuss the results for each aspect of RQ2 in more detail, structured according to the four sub-questions on internal consistency (RQ2.1), discriminant validity (RQ2.2), convergent validity (RQ2.3), and measurement invariance (RQ2.4).</p>
<sec>
<label>4.2.1</label>
<title>Internal consistency (RQ2.1)</title>
<p>The final 21-item version achieved strong psychometric properties while maintaining broad construct coverage. The trimming strategy combined (a) statistical thresholds (factor loadings, item-level explained variance, and modification indices) with (b) conceptual trimming to remove redundancy and harmonize scale length. This two-step approach is consistent with recommendations in the measurement literature (<xref ref-type="bibr" rid="B7">Brown, 2015</xref>; <xref ref-type="bibr" rid="B31">Kline, 2016</xref>; <xref ref-type="bibr" rid="B5">Bortz and D&#x000F6;ring, 2015</xref>) and meets demands in time-constrained environments such as out-of-school labs, where additional measurement instruments are often administered.</p>
<p>Internal consistencies of the six scales ranged from &#x003C9; &#x0003D; 0.64 to 0.87 (see <xref ref-type="table" rid="T4">Table 4</xref>). Five of the six dimensions exceeded the commonly recommended threshold of &#x003C9;&#x02265;0.70, indicating solid reliability even with the reduced number of items. Cronbach&#x00027;s &#x003B1; values showed a comparable pattern, ranging from &#x003B1; &#x0003D; 0.63 to 0.87, with five of the six dimensions exceeding the commonly recommended threshold of &#x003B1;&#x02265;0.70. The highest reliability was observed for <italic>materials</italic> (&#x003C9; &#x0003D; 0.87, &#x003B1; &#x0003D; 0.87), followed by <italic>instructor, location</italic>, and <italic>content</italic> (all &#x003C9;&#x02265;0.82, &#x003B1;&#x02265;0.82). In comparison to <xref ref-type="bibr" rid="B16">Finger et al. (2022</xref>), who reported consistently high reliability values across all scales (&#x003B1;&#x02265;0.81), the present results are largely comparable&#x02014;with the exception of the <italic>innovation</italic> scale, which showed a noticeably lower internal consistency (&#x003C9; &#x0003D; 0.64, &#x003B1; &#x0003D; 0.63).</p>
<p>This result may be partially explained by the fact that the <italic>innovation</italic> scale, along with <italic>location</italic> and <italic>instructor</italic>, was retained without revision. Since these scales were locked for comparability, they could not be optimized or improved in the same way as the newly extended dimensions. We return to the consequences of this decision, especially with regard to the <italic>innovation</italic> dimension, in Section 4.2.3.</p></sec>
<sec>
<label>4.2.2</label>
<title>Discriminant validity (RQ2.2)</title>
<p>Inter-factor correlations for all factors remained below the conventional threshold of <italic>r</italic> &#x0003D; 0.80, generally indicating that the six dimensions capture distinct aspects of perceived authenticity. However, the magnitude of the intercorrelations between several dimensions, notably <italic>content</italic> and <italic>materials</italic> (<italic>r</italic> &#x0003D; 0.67) and <italic>materials</italic> and <italic>methods</italic> (<italic>r</italic> &#x0003D; 0.68), should be reviewed critically. High inter-factor correlations may raise questions regarding the discriminant validity of these dimensions and signal the potential existence of an overlying, higher-order factor. The association between <italic>materials</italic> and <italic>methods</italic>, for example, is theoretically coherent as disciplinary authenticity involves both access to the <italic>tools</italic> and engagement with the <italic>practices</italic> of the field. This overlap suggests that learners can and do differentiate between <italic>what</italic> they used and <italic>how</italic> they used it, yet the resulting correlations indicate that these facets are perceived as closely connected. Similarly, the strong link between <italic>content</italic> and <italic>materials</italic> may reflect the fact that authentic scientific content is typically embedded within the artifacts through which it is explored.</p>
<p>These patterns are reflected in the HTMT ratio of correlations, which provides a stricter indication of conceptual distinctiveness. Most HTMT values remained below the recommended threshold of 0.85 (<xref ref-type="bibr" rid="B22">Henseler et al., 2015</xref>; <xref ref-type="bibr" rid="B9">Cheung et al., 2024</xref>), supporting the separability of the majority of dimensions. However, elevated values were observed for the pairs <italic>content</italic>&#x02013;<italic>materials</italic> (HTMT &#x0003D; 0.79) and <italic>materials</italic>&#x02013;<italic>methods</italic> (HTMT &#x0003D; 0.83), indicating particularly close empirical associations. This suggests that while the dimensions are conceptually defined as distinct, they may not be fully separated in learners&#x00027; perceptions. One plausible explanation is the inherent structure of the learning activities in our sample. The tasks were designed such that the materials followed directly from the content and the methods naturally emerged from the available materials. For instance, activities on robotics (<italic>content</italic>) involved working with the robot itself (<italic>materials</italic>) and required the students to program (<italic>methods</italic>). This built-in sequencing may have made it difficult for learners to perceive these dimensions as clearly distinct from one another.</p>
<p>Future research should therefore investigate a hierarchical factor model to determine whether these dimensions are best represented as distinct yet strongly associated facets or as expressions of a broader, underlying construct. Despite these challenges, the intercorrelations and HTMT values remained below conventional thresholds, providing evidence for adequate empirical separability. The refined wording and the clear conceptual distinction between dimensions likely contributed to the overall acceptable statistical separation.</p></sec>
<sec>
<label>4.2.3</label>
<title>Convergent validity (RQ2.3)</title>
<p>The analyses of the correlations between FEWAW scales and external validation measures support the convergent validity of most dimensions. In particular, the scales <italic>materials, content</italic>, and <italic>methods</italic> showed the strongest associations with constructs that are theoretically aligned with key components of perceived authenticity such as general and task-specific authenticity, participation in scientific practices, and perceptions of lab equipment (e.g. <xref ref-type="bibr" rid="B13">Damerau, 2012</xref>; <xref ref-type="bibr" rid="B41">Nachtigall et al., 2018</xref>; <xref ref-type="bibr" rid="B55">Sch&#x000FC;ttler et al., 2021</xref>; <xref ref-type="bibr" rid="B10">Chi et al., 2018</xref>). These findings suggest that learners&#x00027; authenticity judgments are closely linked to material and procedural features of the learning environment, which appear to serve as salient cues for authenticity perception (<xref ref-type="bibr" rid="B55">Sch&#x000FC;ttler et al., 2021</xref>). This interpretation aligns with earlier research indicating that authenticity is often anchored in tangible characteristics of science education settings (<xref ref-type="bibr" rid="B6">Braund and Reiss, 2006</xref>; <xref ref-type="bibr" rid="B48">Roth, 1995</xref>).</p>
<p>Among these, <italic>materials</italic> and <italic>content</italic> stood out as the dimensions with the most pronounced and consistently high correlations across multiple external measures, suggesting that these two dimensions play a particularly central role in shaping students&#x00027; authenticity perceptions. From a theoretical perspective, both dimensions reflect foundational elements of scientific practice, namely the physical artifacts and the substantive focus of scientific inquiry.</p>
<p>The <italic>location</italic> and <italic>instructor</italic> scales were also positively associated with several external constructs, though their relationships were less pronounced. Both dimensions correlated moderately with general authenticity and perceived authenticity of lab equipment, while <italic>location</italic> additionally related to participation in scientific practices. These results point to a secondary role of spatial and interpersonal aspects in shaping perceived authenticity, possibly reflecting that these features are more context-sensitive and subject to variation in learners&#x00027; interpretations.</p>
<p>In contrast, the <italic>innovation</italic> scale displayed lower correlations with most external validation measures. Although it was modestly associated with task-related authenticity and epistemological beliefs about the origin of knowledge, it showed no meaningful correlation with other constructs we measured. This pattern is consistent with the relatively low AVE<sub>AUIN</sub> &#x0003D; 0.386, indicating weaker convergence of its items and providing an internal validity-based explanation for the selective and generally weaker external associations. Importantly, the weaker empirical performance reflects a deeper conceptual issue that arises when operationalizing <italic>innovation</italic> in formal learning contexts. While the present data does not allow for definitive conclusions about the underlying causes, a few considerations may help interpret the observed pattern.</p>
<p>Authenticity in formal learning settings typically involves a simulation of scientific practice rather than direct engagement in authentic research (<xref ref-type="bibr" rid="B3">Betz et al., 2016</xref>). Students&#x00027; perceptions of authenticity may therefore be bounded by their role expectations in school-based learning, as many see themselves as exploring existing ideas rather than generating new knowledge. Unlike the other dimensions, which are anchored in tangible cues such as physical materials, tools, spatial settings, or even instructors, <italic>innovation</italic> relies on learners&#x00027; subjective assessment of epistemic novelty. Such assessments draw on beliefs about who is entitled to create new scientific knowledge, making the construct inherently more complex than dimensions triggered directly by environmental features. This asymmetry is also reflected in the current item formulations, which adopt an &#x0201C;objective&#x0201D; perspective on scientific discovery (e.g., &#x0201C;I tried to discover something new for science,&#x0201D; &#x0201C;I contributed to answering a current research question&#x0201D;). These formulations implicitly assume a professional scientific role and therefore may exceed what students consider realistic within a classroom or an outreach setting. This interpretation aligns with prior research emphasizing that authenticity or student perceptions on epistemological beliefs depend not only on environmental features but also on learners&#x00027; epistemic role expectations (<xref ref-type="bibr" rid="B49">Sandoval, 2005</xref>; <xref ref-type="bibr" rid="B60">Stroupe, 2014</xref>; <xref ref-type="bibr" rid="B43">Nachtigall et al., 2024</xref>). In this view, <italic>innovation</italic> can be considered an outcome of how learners position themselves within these contexts.</p>
<p>The selective correlation with epistemological beliefs about the <italic>origin of knowledge</italic> further supports this explanation. Learners who have a broader view of who can generate scientific knowledge appear more likely to perceive their own activities as innovative. Conversely, students who believe that only professional scientists produce new knowledge may experience a mismatch between item wording and their perceived role, resulting in overall lower scores. This pattern is consistent with research showing that many students differentiate sharply between school science and professional science and attribute knowledge generation primarily to scientists rather than learners (<xref ref-type="bibr" rid="B63">Voitle et al., 2022</xref>). The absence of a corresponding relationship with beliefs about the <italic>changeability of knowledge</italic> suggests the importance of learners&#x00027; assumptions about who is allowed to generate new ideas. Taken together, these findings indicate that the subjective experience of <italic>innovation</italic> is constrained by role-based plausibility boundaries. Students may feel they can explore or test ideas, but not &#x0201C;discover something new for science.&#x0201D;</p>
<p>From a psychometric perspective, this conceptual misalignment helps explain the low AVE for the <italic>innovation</italic> scale and the lack of meaningful correlations with most external validation measures. It also clarifies why this dimension has shown weak performance in <xref ref-type="bibr" rid="B16">Finger et al. (2022</xref>). To improve both theoretical coherence and empirical functioning, future iterations of the scale may benefit from shifting toward a more learner-centered conceptualization of epistemic novelty, emphasizing personal discovery (&#x0201C;I explored something new to me&#x0201D;) and idea generation (&#x0201C;I was able to generate and test my own ideas&#x0201D;) rather than contributions to professional scientific knowledge. Such formulations would align more closely with authenticity as a subjective experience and be more consistent with the role expectations typically held by students in structured learning contexts.</p>
<p>Furthermore, the unexpectedly weak association between <italic>instructor</italic> and external ratings of instructor expertise should be noted. A plausible explanation lies in the specific wording of the items. The FEWAW scale refers to instructors as &#x0201C;real scientists,&#x0201D; invoking authenticity markers rooted in scientific identity and professional status. By contrast, the external validation scale refers to &#x0201C;our tutors&#x0201D; and emphasizes perceived competence rather than professional affiliation. Particularly in outreach contexts such as student labs, where instruction is often provided by university students or early-career staff, learners may recognize expertise without perceiving the instructors as authentic representatives of science.</p></sec>
<sec>
<label>4.2.4</label>
<title>Measurement invariance (RQ2.4)</title>
<p>The analysis provided initial evidence for scalar invariance across gender and grade level, suggesting that the six-factor structure functions equivalently across these groups. This indicates that the instrument allows for unbiased mean comparisons between male and female students as well as across grade levels.</p>
<p>Nevertheless, these findings must be viewed as preliminary. Given the small sample size (<italic>N</italic> &#x0003D; 130), the absence of significant differences does not conclusively confirm full invariance. Minor variations in the pattern of loadings or intercepts might remain undetected in small samples. Furthermore, as often observed in small-to-moderate samples, a slight deterioration of overall model fit occurred during the stepwise invariance testing. This pattern is well-documented as a sample-size-sensitive artifact rather than a substantive refutation of invariance (<xref ref-type="bibr" rid="B8">Chen, 2007</xref>). Accordingly, future research should validate the model structure with larger and more diverse datasets encompassing different school types, age groups, and disciplinary contexts. This could help assess the robustness of the FEWAW measurement model and to determine whether the observed factorial stability generalizes across sub-populations.</p>
</sec>
</sec>
</sec>
<sec id="s5">
<label>5</label>
<title>Limitations</title>
<p>While the present study offers important insights into the factorial structure and validity of the revised FEWAW instrument, several limitations must be acknowledged.</p>
<p>First, the generalizability of the results is limited by the specific context in which the data were collected. All participants took part in an extracurricular physics lab at a single institution in Germany. As a result, the findings may not generalize to other subject domains or other science learning contexts. Moreover, the sample consisted exclusively of students from schools in grades 10 and 11, which restricts conclusions about the instrument&#x00027;s applicability to other age groups.</p>
<p>Second, our study relied on a smaller and more context-specific sample. While this reflects the narrower goal of refining and validating selected dimensions rather than developing a new instrument from scratch, the reduced sample size limits generalizability&#x02014;particularly in confirmatory factor analysis and measurement invariance testing (<xref ref-type="bibr" rid="B7">Brown, 2015</xref>).</p>
<p>Third, although the <italic>innovation</italic> scale showed comparatively weaker psychometric performance, no qualitative or process-oriented data were collected to clarify how students interpreted these items. Consequently, the study cannot provide in-depth explanations for the low reliability and limited external associations of this scale. Future research should explore learners&#x00027; interpretations through cognitive interviews or think-aloud protocols to better understand the source of this mismatch.</p>
<p>Taken together, these limitations underscore the need for further validation studies with more diverse and larger samples, ideally across different school types, age groups and disciplinary contexts.</p></sec>
<sec id="s6">
<label>6</label>
<title>Conclusions and outlook</title>
<p>The present contribution provides a theoretically grounded, multidimensional instrument for assessing students&#x00027; perceived authenticity in educational settings. The six-factor structure was empirically confirmed, with good support for internal consistency, discriminant validity and scalar measurement invariance across gender and grade. The results highlight the need to view authenticity not as a unitary construct but as dependent on instructional context and learner characteristics (<xref ref-type="bibr" rid="B2">Betz, 2018</xref>; <xref ref-type="bibr" rid="B42">Nachtigall et al., 2022</xref>; <xref ref-type="bibr" rid="B53">Schriebl et al., 2023</xref>).</p>
<p>Future studies should validate the FEWAW structure in larger and more diverse samples (e.g., <italic>N</italic>&#x0003E;500) to assess the weighting and potential hierarchy among dimensions. This would help prioritize design elements and advance theory-driven instructional development.</p>
<p>Further research should also explore the predictive validity of the FEWAW dimensions. Investigating how perceived authenticity relates to motivational (e.g., situational interest), epistemological (e.g., beliefs about knowledge), and cognitive outcomes (e.g., learning gains) could demonstrate the instrument&#x00027;s practical utility and theoretical significance.</p>
<p>In sum, the revised questionnaire offers a concise and theoretically reliable instrument for assessing perceived authenticity in science education. It addresses prior concerns regarding construct overlap and establishes a foundation for future research and instructional design focused on authenticity.</p></sec>
</body>
<back>
<sec sec-type="data-availability" id="s7">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec sec-type="ethics-statement" id="s8">
<title>Ethics statement</title>
<p>The studies involving humans were approved by the Ethics Committee of the Otto von Guericke University Magdeburg (approval no. 98/23). The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation in this study was provided by the participants&#x00027; legal guardians/next of kin.</p>
</sec>
<sec sec-type="author-contributions" id="s9">
<title>Author contributions</title>
<p>DS: Conceptualization, Data curation, Formal analysis, Visualization, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing, Methodology. TS: Investigation, Writing &#x02013; review &#x00026; editing. BE: Formal analysis, Methodology, Writing &#x02013; review &#x00026; editing. BW: Conceptualization, Funding acquisition, Project administration, Supervision, Writing &#x02013; review &#x00026; editing, Methodology.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s11">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec sec-type="disclaimer" id="s12">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="s13">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/feduc.2026.1749760/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/feduc.2026.1749760/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.pdf" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Anker-Hansen</surname> <given-names>J.</given-names></name> <name><surname>Andr&#x000E9;e</surname> <given-names>M.</given-names></name></person-group> (<year>2019</year>). <article-title>In pursuit of authenticity in science education</article-title>. <source>Nord. Stud. Sci. Educ</source>. <volume>15</volume>, <fpage>498</fpage>&#x02013;<lpage>510</lpage>. doi: <pub-id pub-id-type="doi">10.5617/nordina.4723</pub-id></mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Betz</surname> <given-names>A.</given-names></name></person-group> (<year>2018</year>). <article-title>Der Einfluss der Lernumgebung auf die (wahrgenommene) Authentizit&#x000E4;t der linguistischen Wissenschaftsvermittlung und das situationale Interesse von Lernenden [The influence of the learning environment on learners&#x00027; (perceived) authenticity of science communication and on their situational interest]</article-title>. <source>Unterrichtswiss</source>. <volume>46</volume>, <fpage>261</fpage>&#x02013;<lpage>278</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s42010-018-0021-0</pub-id></mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Betz</surname> <given-names>A.</given-names></name> <name><surname>Flake</surname> <given-names>S.</given-names></name> <name><surname>Mierwald</surname> <given-names>M.</given-names></name> <name><surname>Vanderbeke</surname> <given-names>M.</given-names></name></person-group> (<year>2016</year>). <article-title>&#x0201C;Modelling authenticity in teaching and learning contexts: a contribution to theory development and empirical investigation of the construct,&#x0201D;</article-title> in <source>Transforming Learning, Empowering Learners: The International Conference of the Learning Sciences (ICLS) 2016, Vol. 2</source>, eds. C. K. Looi, J. L. Polman, U. Cress, and P. Reimann (Singapore: International Society of the Learning Sciences), <fpage>815</fpage>&#x02013;<lpage>818</lpage>.</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bolger</surname> <given-names>M. S.</given-names></name> <name><surname>Osness</surname> <given-names>J. B.</given-names></name> <name><surname>Gouvea</surname> <given-names>J. S.</given-names></name> <name><surname>Cooper</surname> <given-names>A. C.</given-names></name></person-group> (<year>2021</year>). <article-title>Supporting scientific practice through model-based inquiry: a students&#x00027;-eye view of grappling with data, uncertainty, and community in a laboratory experience</article-title>. <source>CBE Life Sci. Educ</source>. <volume>20</volume>:<fpage>ar59</fpage>. doi: <pub-id pub-id-type="doi">10.1187/cbe.21-05-0128</pub-id><pub-id pub-id-type="pmid">34678041</pub-id></mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bortz</surname> <given-names>J.</given-names></name> <name><surname>D&#x000F6;ring</surname> <given-names>N.</given-names></name></person-group> (<year>2015</year>). <source>Forschungsmethoden und Evaluation: F&#x000FC;r Human- und Sozialwissenschaftler [Research Methods and Evaluation: For Researchers in the Human and Social Sciences</source>]. Heidelberg: Springer.</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Braund</surname> <given-names>M.</given-names></name> <name><surname>Reiss</surname> <given-names>M.</given-names></name></person-group> (<year>2006</year>). <article-title>Towards a more authentic science curriculum: the contribution of out-of-school learning</article-title>. <source>Int. J. Sci. Educ</source>. <volume>28</volume>, <fpage>1373</fpage>&#x02013;<lpage>1388</lpage>. doi: <pub-id pub-id-type="doi">10.1080/09500690500498419</pub-id></mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Brown</surname> <given-names>T. A.</given-names></name></person-group> (<year>2015</year>). <source>Confirmatory Factor Analysis for Applied Research</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Guilford Press</publisher-name>.</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>F. F.</given-names></name></person-group> (<year>2007</year>). <article-title>Sensitivity of goodness of fit indices to lack of measurement invariance</article-title>. <source>Struct. Equ. Model</source>. <volume>14</volume>, <fpage>464</fpage>&#x02013;<lpage>504</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10705510701301834</pub-id></mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cheung</surname> <given-names>G. W.</given-names></name> <name><surname>Cooper-Thomas</surname> <given-names>H. D.</given-names></name> <name><surname>Lau</surname> <given-names>R. S.</given-names></name> <name><surname>Wang</surname> <given-names>L. C.</given-names></name></person-group> (<year>2024</year>). <article-title>Reporting reliability, convergent and discriminant validity with structural equation modeling: a review and best-practice recommendations</article-title>. <source>Asia Pac. J. Manag</source>. <volume>41</volume>, <fpage>745</fpage>&#x02013;<lpage>783</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10490-023-09871-y</pub-id></mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chi</surname> <given-names>S.</given-names></name> <name><surname>Liu</surname> <given-names>X.</given-names></name> <name><surname>Wang</surname> <given-names>Z.</given-names></name> <name><surname>Han</surname> <given-names>S. W.</given-names></name></person-group> (<year>2018</year>). <article-title>Moderation of the effects of scientific inquiry activities on low SES students&#x00027; PISA 2015 science achievement by school teacher support and disciplinary climate in science classroom across gender</article-title>. <source>Int. J. Sci. Educ</source>. <volume>40</volume>, <fpage>1284</fpage>&#x02013;<lpage>1304</lpage>. doi: <pub-id pub-id-type="doi">10.1080/09500693.2018.1476742</pub-id></mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chinn</surname> <given-names>C. A.</given-names></name> <name><surname>Malhotra</surname> <given-names>B. A.</given-names></name></person-group> (<year>2002</year>). <article-title>Epistemologically authentic inquiry in schools: a theoretical framework for evaluating inquiry tasks</article-title>. <source>Sci. Educ</source>. <volume>86</volume>, <fpage>175</fpage>&#x02013;<lpage>218</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sce.10001</pub-id></mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Cohen</surname> <given-names>J.</given-names></name></person-group> (<year>1988</year>). <source>Statistical Power Analysis for the Behavioral Sciences</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Routledge</publisher-name>.</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="thesis"><person-group person-group-type="author"><name><surname>Damerau</surname> <given-names>K.</given-names></name></person-group> (<year>2012</year>). <source>Molekulare und Zell-Biologie im Sch&#x000FC;lerlabor. Fachliche Optimierung und Evaluation der Wirksamkeit im BeLL Bio (Bergisches Lehr-Lern-Labor Biologie)</source> [<italic>Molecular and cellular biology in an out-of-school lab: subject-specific optimization and evaluation of effectiveness in the BeLL Bio</italic>] (Ph.D. thesis). Bergische Universit&#x000E4;t Wuppertal, Wuppertal, Germany.</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Engeln</surname> <given-names>K.</given-names></name></person-group> (<year>2004</year>). <source>Sch&#x000FC;lerlabors. Authentische, aktivierende Lernumgebungen als M&#x000F6;glichkeit, Interesse an Naturwissenschaften und Technik zu wecken [Out-of-School Labs: Authentic, Activating Learning Environments as a Means to Foster Interest in Science and Technology</source>]. Berlin: Logos Verlag Berlin.</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Faul</surname> <given-names>F.</given-names></name> <name><surname>Erdfelder</surname> <given-names>E.</given-names></name> <name><surname>Buchner</surname> <given-names>A.</given-names></name> <name><surname>Lang</surname> <given-names>A. G.</given-names></name></person-group> (<year>2009</year>). <article-title>Statistical power analyses using G*Power 3.1: tests for correlation and regression analyses</article-title>. <source>Behav. Res. Methods</source> <volume>41</volume>, <fpage>1149</fpage>&#x02013;<lpage>1160</lpage>. doi: <pub-id pub-id-type="doi">10.3758/BRM.41.4.1149</pub-id><pub-id pub-id-type="pmid">19897823</pub-id></mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Finger</surname> <given-names>L.</given-names></name> <name><surname>van den Bogaert</surname> <given-names>V.</given-names></name> <name><surname>Fleischer</surname> <given-names>J.</given-names></name> <name><surname>Raimann</surname> <given-names>J.</given-names></name> <name><surname>Sommer</surname> <given-names>K.</given-names></name> <name><surname>Wirth</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Das Sch&#x000FC;lerlabor als Ort authentischer Wissenschaftsvermittlung? Entwicklung und Validierung eines Fragebogens zur Erfassung der Authentizit&#x000E4;tswahrnehmung der Wissenschaftsvermittlung im Sch&#x000FC;lerlabor [Out-of-school labs as places of authentic science education? Development and validation of a questionnaire to assess the perceived authenticity of science education in out-of-school labs]</article-title>. <source>Z. Didakt. Naturwiss</source>. <volume>28</volume>:<fpage>2</fpage>. doi: <pub-id pub-id-type="doi">10.1007/s40573-022-00139-4</pub-id></mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Finney</surname> <given-names>S. J.</given-names></name> <name><surname>DiStefano</surname> <given-names>C.</given-names></name></person-group> (<year>2006</year>). <article-title>&#x0201C;Non-normal and categorical data in structural equation modeling,&#x0201D;</article-title> in <source>Structural Equation Modeling: A Second Course</source>, eds. G. R. Hancock, and R. O. Mueller (Charlotte, NC: Information Age Publishing), <fpage>269</fpage>&#x02013;<lpage>314</lpage>.</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fornell</surname> <given-names>C.</given-names></name> <name><surname>Larcker</surname> <given-names>D. F.</given-names></name></person-group> (<year>1981</year>). <article-title>Evaluating structural equation models with unobservable variables and measurement error</article-title>. <source>J. Mark. Res</source>. <volume>18</volume>, <fpage>39</fpage>&#x02013;<lpage>50</lpage>. doi: <pub-id pub-id-type="doi">10.1177/002224378101800104</pub-id></mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Habig</surname> <given-names>B.</given-names></name> <name><surname>Gupta</surname> <given-names>P.</given-names></name></person-group> (<year>2021</year>). <article-title>Authentic STEM research, practices of science, and interest development in an informal science education program</article-title>. <source>Int. J. STEM Educ</source>. <volume>8</volume>:<fpage>57</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s40594-021-00314-y</pub-id></mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Habig</surname> <given-names>S.</given-names></name> <name><surname>Blankenburg</surname> <given-names>J.</given-names></name> <name><surname>van Vorst</surname> <given-names>H.</given-names></name> <name><surname>Fechner</surname> <given-names>S.</given-names></name> <name><surname>Parchmann</surname> <given-names>I.</given-names></name> <name><surname>Sumfleth</surname> <given-names>E.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Context characteristics and their effects on students&#x00027; situational interest in chemistry</article-title>. <source>Int. J. Sci. Educ</source>. <volume>40</volume>, <fpage>1154</fpage>&#x02013;<lpage>1175</lpage>. doi: <pub-id pub-id-type="doi">10.1080/09500693.2018.1470349</pub-id></mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hagenk&#x000F6;tter</surname> <given-names>R.</given-names></name> <name><surname>Nachtigall</surname> <given-names>V.</given-names></name> <name><surname>Rolka</surname> <given-names>K.</given-names></name> <name><surname>Rummel</surname> <given-names>N.</given-names></name></person-group> (<year>2024</year>). <article-title>Model authenticity in learning mathematical experimentation: how students perceive and learn from scientist and peer models</article-title>. <source>Eur. J. Psychol. Educ</source>. <volume>39</volume>, <fpage>3301</fpage>&#x02013;<lpage>3324</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10212-024-00843-4</pub-id></mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Henseler</surname> <given-names>J.</given-names></name> <name><surname>Ringle</surname> <given-names>C. M.</given-names></name> <name><surname>Sarstedt</surname> <given-names>M.</given-names></name></person-group> (<year>2015</year>). <article-title>A new criterion for assessing discriminant validity in variance-based structural equation modeling</article-title>. <source>J. Acad. Mark. Sci</source>. <volume>43</volume>, <fpage>115</fpage>&#x02013;<lpage>135</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11747-014-0403-8</pub-id></mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Herrington</surname> <given-names>J.</given-names></name> <name><surname>Oliver</surname> <given-names>R.</given-names></name></person-group> (<year>2000</year>). <article-title>An instructional design framework for authentic learning environments</article-title>. <source>Educ. Technol. Res. Dev</source>. <volume>48</volume>, <fpage>23</fpage>&#x02013;<lpage>48</lpage>. doi: <pub-id pub-id-type="doi">10.1007/BF02319856</pub-id></mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hohrath</surname> <given-names>S.</given-names></name> <name><surname>A&#x000DF;mann</surname> <given-names>S.</given-names></name> <name><surname>Krabbe</surname> <given-names>H.</given-names></name> <name><surname>Opfermann</surname> <given-names>M.</given-names></name></person-group> (<year>2024</year>). <article-title>Students&#x00027; perceived authenticity and understanding of authentic research while experimenting in a non-formal learning setting</article-title>. <source>Eur. J. Psychol. Educ</source>. <volume>39</volume>, <fpage>3325</fpage>&#x02013;<lpage>3349</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10212-024-00810-z</pub-id></mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Holm</surname> <given-names>S.</given-names></name></person-group> (<year>1979</year>). <article-title>A simple sequentially rejective multiple test procedure</article-title>. <source>Scand. J. Stat</source>. <volume>6</volume>, <fpage>65</fpage>&#x02013;<lpage>70</lpage>.</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Honebein</surname> <given-names>P. C.</given-names></name> <name><surname>Duffy</surname> <given-names>T. M.</given-names></name> <name><surname>Fishman</surname> <given-names>B. J.</given-names></name></person-group> (<year>1993</year>). <article-title>&#x0201C;Constructivism and the design of learning environments: context and authentic activities for learning,&#x0201D;</article-title> in <source>Designing Environments for Constructive Learning</source>, eds. T. M. Duffy, J. Lowyck, D. H. Jonassen, and T. M. Welsh (<publisher-loc>Berlin</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>87</fpage>&#x02013;<lpage>108</lpage>. doi: <pub-id pub-id-type="doi">10.1007/978-3-642-78069-1_5</pub-id></mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>L.</given-names></name> <name><surname>Bentler</surname> <given-names>P. M.</given-names></name></person-group> (<year>1999</year>). <article-title>Cutoff criteria for fit indexes in covariance structure analysis: conventional criteria versus new alternatives</article-title>. <source>Struct. Equ. Model</source>. <volume>6</volume>, <fpage>1</fpage>&#x02013;<lpage>55</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10705519909540118</pub-id></mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Huber</surname> <given-names>F.</given-names></name> <name><surname>Vollhardt</surname> <given-names>K.</given-names></name> <name><surname>Meyer</surname> <given-names>F.</given-names></name></person-group> (<year>2009</year>). <article-title>Helden der Werbung? Eine Untersuchung der Relevanz von Werbefiguren f&#x000FC;r das Konsumentenverhalten</article-title>. <source>Mark. Z. Forsch. Prax</source>. <volume>31</volume>, <fpage>183</fpage>&#x02013;<lpage>196</lpage>. doi: <pub-id pub-id-type="doi">10.15358/0344-1369-2009-3-183</pub-id></mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Itzek-Greulich</surname> <given-names>H.</given-names></name> <name><surname>Flunger</surname> <given-names>B.</given-names></name> <name><surname>Vollmer</surname> <given-names>C.</given-names></name> <name><surname>Nagengast</surname> <given-names>B.</given-names></name> <name><surname>Rehm</surname> <given-names>M.</given-names></name> <name><surname>Trautwein</surname> <given-names>U.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Effects of a science center outreach lab on school students&#x00027; achievement&#x02014;are student lab visits needed when they teach what students can learn at school?</article-title> <source>Learn. Instr</source>. <volume>38</volume>, <fpage>43</fpage>&#x02013;<lpage>52</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.learninstruc.2015.03.003</pub-id></mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kapon</surname> <given-names>S.</given-names></name> <name><surname>Laherto</surname> <given-names>A.</given-names></name> <name><surname>Levrini</surname> <given-names>O.</given-names></name></person-group> (<year>2018</year>). <article-title>Disciplinary authenticity and personal relevance in school science</article-title>. <source>Sci. Educ</source>. <volume>102</volume>, <fpage>1077</fpage>&#x02013;<lpage>1106</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sce.21458</pub-id></mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Kline</surname> <given-names>R. B.</given-names></name></person-group> (<year>2016</year>). <source>Principles and Practice of Structural Equation Modeling</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Guilford Press</publisher-name>.</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="thesis"><person-group person-group-type="author"><name><surname>Kremer</surname> <given-names>K. H.</given-names></name></person-group> (<year>2010</year>). <source>Die Natur der Naturwissenschaften verstehen: Untersuchungen zur Struktur und Entwicklung von Kompetenzen in der Sekundarstufe I</source> [<italic>Understanding the nature of science: investigations into the structure and development of competencies in lower secondary education</italic>] (Ph.D. thesis). Universit&#x000E4;t Kassel, Fachbereich Mathematik und Naturwissenschaften, Kassel, Germany.</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Landis</surname> <given-names>J. R.</given-names></name> <name><surname>Koch</surname> <given-names>G. G.</given-names></name></person-group> (<year>1977</year>). <article-title>The measurement of observer agreement for categorical data</article-title>. <source>Biometrics</source> <volume>33</volume>, <fpage>159</fpage>&#x02013;<lpage>174</lpage>. doi: <pub-id pub-id-type="doi">10.2307/2529310</pub-id><pub-id pub-id-type="pmid">843571</pub-id></mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>H.-S.</given-names></name> <name><surname>Butler</surname> <given-names>N.</given-names></name></person-group> (<year>2003</year>). <article-title>Making authentic science accessible to students</article-title>. <source>Int. J. Sci. Educ</source>. <volume>25</volume>, <fpage>923</fpage>&#x02013;<lpage>948</lpage>. doi: <pub-id pub-id-type="doi">10.1080/09500690305023</pub-id></mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Little</surname> <given-names>R. J. A.</given-names></name> <name><surname>Rubin</surname> <given-names>D. B.</given-names></name></person-group> (<year>2002</year>). <source>Statistical Analysis with Missing Data</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Wiley</publisher-name>. doi: <pub-id pub-id-type="doi">10.1002/9781119013563</pub-id></mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>McDonald</surname> <given-names>R. P.</given-names></name></person-group> (<year>1999</year>). <source>Test Theory: A Unified Treatment</source>. <publisher-loc>London</publisher-loc>: <publisher-name>Psychology Press</publisher-name>.</mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Meade</surname> <given-names>A. W.</given-names></name> <name><surname>Craig</surname> <given-names>S. B.</given-names></name></person-group> (<year>2012</year>). <article-title>Identifying careless responses in survey data</article-title>. <source>Psychol. Methods</source> <volume>17</volume>, <fpage>437</fpage>&#x02013;<lpage>455</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0028085</pub-id><pub-id pub-id-type="pmid">22506584</pub-id></mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mierwald</surname> <given-names>M.</given-names></name> <name><surname>Lehmann</surname> <given-names>T.</given-names></name> <name><surname>Brauch</surname> <given-names>N.</given-names></name></person-group> (<year>2018</year>). <article-title>Zur Ver&#x000E4;nderung epistemologischer &#x000DC;berzeugungen im Sch&#x000FC;lerlabor: Authentizit&#x000E4;t von Lernmaterial als Chance der Entwicklung einer wissenschaftlich angemessenen &#x000DC;berzeugungshaltung im Fach Geschichte? [Changing epistemological beliefs in student labs: authentic learning materials as a chance to foster the development of academically adequate beliefs in the domain of history?]</article-title>. <source>Unterrichtswiss</source>. <volume>46</volume>, <fpage>279</fpage>&#x02013;<lpage>297</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s42010-018-0019-7</pub-id></mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Moschner</surname> <given-names>B.</given-names></name> <name><surname>Gruber</surname> <given-names>H.</given-names></name></person-group> (<year>2017</year>). <article-title>&#x0201C;Erfassung epistemischer &#x000DC;berzeugungen mit dem FEE [Assessing epistemic beliefs using the FEE],&#x0201D;</article-title> in <source>Wissen und Lernen</source>, eds. A. Bernholt, H. Gruber, and B. Moschner (Bedford Heights, OH: Waxmann), <fpage>17</fpage>&#x02013;<lpage>38</lpage>.</mixed-citation>
</ref>
<ref id="B40">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nachtigall</surname> <given-names>V.</given-names></name> <name><surname>Rummel</surname> <given-names>N.</given-names></name></person-group> (<year>2021</year>). <article-title>Investigating students&#x00027; perceived authenticity of learning activities in an out-of-school lab for social sciences: a replication study</article-title>. <source>Instr. Sci</source>. <volume>49</volume>, <fpage>779</fpage>&#x02013;<lpage>810</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11251-021-09556-3</pub-id></mixed-citation>
</ref>
<ref id="B41">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nachtigall</surname> <given-names>V.</given-names></name> <name><surname>Rummel</surname> <given-names>N.</given-names></name> <name><surname>Serova</surname> <given-names>K.</given-names></name></person-group> (<year>2018</year>). <article-title>Authentisch ist nicht gleich authentisch &#x02013; Wie Sch&#x000FC;lerinnen und Sch&#x000FC;ler die Authentizit&#x000E4;t von Lernaktivit&#x000E4;ten im Sch&#x000FC;lerlabor einsch&#x000E4;tzen [Authentic does not equal authentic&#x02014;how students evaluate the authenticity of learning activities in an out-of-school lab]</article-title>. <source>Unterrichtswiss</source>. <volume>46</volume>, <fpage>299</fpage>&#x02013;<lpage>319</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s42010-018-0020-1</pub-id></mixed-citation>
</ref>
<ref id="B42">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nachtigall</surname> <given-names>V.</given-names></name> <name><surname>Shaffer</surname> <given-names>D. W.</given-names></name> <name><surname>Rummel</surname> <given-names>N.</given-names></name></person-group> (<year>2022</year>). <article-title>Stirring a secret sauce: a literature review on the conditions and effects of authentic learning</article-title>. <source>Educ. Psychol. Rev</source>. <volume>34</volume>, <fpage>1479</fpage>&#x02013;<lpage>1516</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10648-022-09676-3</pub-id></mixed-citation>
</ref>
<ref id="B43">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nachtigall</surname> <given-names>V.</given-names></name> <name><surname>Shaffer</surname> <given-names>D. W.</given-names></name> <name><surname>Rummel</surname> <given-names>N.</given-names></name></person-group> (<year>2024</year>). <article-title>The authenticity dilemma: towards a theory on the conditions and effects of authentic learning</article-title>. <source>Eur. J. Psychol. Educ</source>. <volume>39</volume>, <fpage>3483</fpage>&#x02013;<lpage>3509</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10212-024-00892-9</pub-id></mixed-citation>
</ref>
<ref id="B44">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nicaise</surname> <given-names>M.</given-names></name> <name><surname>Gibney</surname> <given-names>T.</given-names></name> <name><surname>Crane</surname> <given-names>M.</given-names></name></person-group> (<year>2000</year>). <article-title>Toward an understanding of authentic learning: student perceptions of an authentic classroom</article-title>. <source>J. Sci. Educ. Technol</source>. <volume>9</volume>, <fpage>79</fpage>&#x02013;<lpage>94</lpage>. doi: <pub-id pub-id-type="doi">10.1023/A:1009477008671</pub-id></mixed-citation>
</ref>
<ref id="B45">
<mixed-citation publication-type="thesis"><person-group person-group-type="author"><name><surname>Pawek</surname> <given-names>C.</given-names></name></person-group> (<year>2009</year>). <source>Sch&#x000FC;lerlabore als interessef&#x000F6;rdernde au&#x000DF;erschulische Lernumgebungen f&#x000FC;r Sch&#x000FC;lerinnen und Sch&#x000FC;ler aus der Mittel- und Oberstufe</source> [<italic>Out-of-school labs as interest-promoting extracurricular learning environments for lower and upper secondary students</italic>] (Ph.D. thesis). Universit&#x000E4;t Kiel, Kiel, Germany.</mixed-citation>
</ref>
<ref id="B46">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Peacock</surname> <given-names>M.</given-names></name></person-group> (<year>1997</year>). <article-title>The effect of authentic materials on the motivation of EFL learners</article-title>. <source>ELT J</source>. <volume>51</volume>, <fpage>144</fpage>&#x02013;<lpage>156</lpage>. doi: <pub-id pub-id-type="doi">10.1093/elt/51.2.144</pub-id></mixed-citation>
</ref>
<ref id="B47">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rosseel</surname> <given-names>Y.</given-names></name></person-group> (<year>2012</year>). <article-title>lavaan: an R package for structural equation modeling</article-title>. <source>J. Stat. Softw</source>. <volume>48</volume>, <fpage>1</fpage>&#x02013;<lpage>36</lpage>. doi: <pub-id pub-id-type="doi">10.18637/jss.v048.i02</pub-id></mixed-citation>
</ref>
<ref id="B48">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Roth</surname> <given-names>W.-M.</given-names></name></person-group> (<year>1995</year>). <source>Authentic School Science: Knowing and Learning in Open-Inquiry Science Laboratories</source>. Dordrecht: Springer. doi: <pub-id pub-id-type="doi">10.1007/978-94-011-0495-1</pub-id></mixed-citation>
</ref>
<ref id="B49">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sandoval</surname> <given-names>W. A.</given-names></name></person-group> (<year>2005</year>). <article-title>Understanding students&#x00027; practical epistemologies and their influence on learning through inquiry</article-title>. <source>Sci. Educ</source>. <volume>89</volume>, <fpage>634</fpage>&#x02013;<lpage>656</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sce.20065</pub-id></mixed-citation>
</ref>
<ref id="B50">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Satorra</surname> <given-names>A.</given-names></name> <name><surname>Bentler</surname> <given-names>P. M.</given-names></name></person-group> (<year>2001</year>). <article-title>A scaled difference chi-square test statistic for moment structure analysis</article-title>. <source>Psychometrika</source> <volume>66</volume>, <fpage>507</fpage>&#x02013;<lpage>514</lpage>. doi: <pub-id pub-id-type="doi">10.1007/BF02296192</pub-id></mixed-citation>
</ref>
<ref id="B51">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Scharfenberg</surname> <given-names>F.-J.</given-names></name> <name><surname>Bogner</surname> <given-names>F. X.</given-names></name> <name><surname>Klautke</surname> <given-names>S.</given-names></name></person-group> (<year>2007</year>). <article-title>Learning in a gene technology laboratory with educational focus: results of a teaching unit with authentic experiments</article-title>. <source>Biochem. Mol. Biol. Educ</source>. <volume>35</volume>, <fpage>28</fpage>&#x02013;<lpage>39</lpage>. doi: <pub-id pub-id-type="doi">10.1002/bmb.1</pub-id><pub-id pub-id-type="pmid">21591053</pub-id></mixed-citation>
</ref>
<ref id="B52">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schermelleh-Engel</surname> <given-names>K.</given-names></name> <name><surname>Moosbrugger</surname> <given-names>H.</given-names></name> <name><surname>M&#x000FC;ller</surname> <given-names>H.</given-names></name></person-group> (<year>2003</year>). <article-title>Evaluating the fit of structural equation models: tests of significance and descriptive goodness-of-fit measures</article-title>. <source>Methods Psychol. Res. Online</source> <volume>8</volume>, <fpage>23</fpage>&#x02013;<lpage>74</lpage>.</mixed-citation>
</ref>
<ref id="B53">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schriebl</surname> <given-names>D.</given-names></name> <name><surname>M&#x000FC;ller</surname> <given-names>A.</given-names></name> <name><surname>Robin</surname> <given-names>N.</given-names></name></person-group> (<year>2023</year>). <article-title>Modelling authenticity in science education</article-title>. <source>Sci. Educ</source>. <volume>32</volume>, <fpage>1021</fpage>&#x02013;<lpage>1048</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11191-022-00355-x</pub-id></mixed-citation>
</ref>
<ref id="B54">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schriebl</surname> <given-names>D.</given-names></name> <name><surname>M&#x000FC;ller</surname> <given-names>A.</given-names></name> <name><surname>Robin</surname> <given-names>N.</given-names></name> <name><surname>Henrich</surname> <given-names>B.</given-names></name></person-group> (<year>2021</year>). <article-title>An instrument to measure students&#x00027; perception of the authenticity of an out-of-school learning place</article-title>. <source>Prog. Sci. Educ</source>. <volume>4</volume>, <fpage>66</fpage>&#x02013;<lpage>74</lpage>. doi: <pub-id pub-id-type="doi">10.25321/prise.2021.1072</pub-id></mixed-citation>
</ref>
<ref id="B55">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sch&#x000FC;ttler</surname> <given-names>T.</given-names></name> <name><surname>Watzka</surname> <given-names>B.</given-names></name> <name><surname>Girwidz</surname> <given-names>R.</given-names></name> <name><surname>Ertl</surname> <given-names>B.</given-names></name></person-group> (<year>2021</year>). <article-title>Die Wirkung der Authentizit&#x000E4;t von Lernort und Laborger&#x000E4;ten auf das situationale Interesse und die Relevanzwahrnehmung beim Besuch eines naturwissenschaftlichen Sch&#x000FC;lerlabors [Effects of an authentic location and laboratory equipment for the situational interest and the perception of content relevance when visiting an out-of-school science lab]</article-title>. <source>Z. Didakt. Naturwiss</source>. <volume>27</volume>, <fpage>109</fpage>&#x02013;<lpage>125</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s40573-021-00128-z</pub-id></mixed-citation>
</ref>
<ref id="B56">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schwartz</surname> <given-names>R. S.</given-names></name> <name><surname>Lederman</surname> <given-names>N. G.</given-names></name> <name><surname>Crawford</surname> <given-names>B. A.</given-names></name></person-group> (<year>2004</year>). <article-title>Developing views of nature of science in an authentic context: an explicit approach to bridging the gap between nature of science and scientific inquiry</article-title>. <source>Sci. Educ</source>. <volume>88</volume>, <fpage>610</fpage>&#x02013;<lpage>645</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sce.10128</pub-id></mixed-citation>
</ref>
<ref id="B57">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Smetana</surname> <given-names>L. K.</given-names></name> <name><surname>Bell</surname> <given-names>R. L.</given-names></name></person-group> (<year>2012</year>). <article-title>Computer simulations to support science instruction and learning: a critical review of the literature</article-title>. <source>Int. J. Sci. Educ</source>. <volume>34</volume>, <fpage>1337</fpage>&#x02013;<lpage>1370</lpage>. doi: <pub-id pub-id-type="doi">10.1080/09500693.2011.605182</pub-id></mixed-citation>
</ref>
<ref id="B58">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sommer</surname> <given-names>K.</given-names></name> <name><surname>Firstein</surname> <given-names>A.</given-names></name> <name><surname>Rothstein</surname> <given-names>B.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;Authentizit&#x000E4;t (der Wissenschaftsvermittlung) im Sch&#x000FC;lerlabor [Authenticity (of science education) in out-of-school labs],&#x0201D;</article-title> in <source>Handbuch Forschen im Sch&#x000FC;lerlabor</source>, eds. K. Sommer, J. Wirth, and M. Vanderbeke (M&#x000FC;nster: Waxmann), <fpage>21</fpage>&#x02013;<lpage>30</lpage>.</mixed-citation>
</ref>
<ref id="B59">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sommer</surname> <given-names>K.</given-names></name> <name><surname>Wirth</surname> <given-names>J.</given-names></name> <name><surname>Rummel</surname> <given-names>N.</given-names></name></person-group> (<year>2018</year>). <article-title>Authentizit&#x000E4;t der Wissenschaftsvermittlung im Sch&#x000FC;lerlabor&#x02014;Einf&#x000FC;hrung in den Thementeil [Authenticity of instruction about natural and social sciences in out-of-school labs&#x02014;introduction to the special issue]</article-title>. <source>Unterrichtswiss</source>. <volume>46</volume>, <fpage>253</fpage>&#x02013;<lpage>260</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s42010-018-0022-z</pub-id></mixed-citation>
</ref>
<ref id="B60">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stroupe</surname> <given-names>D.</given-names></name></person-group> (<year>2014</year>). <article-title>Examining classroom science practice communities: how teachers and students negotiate epistemic agency and learn science-as-practice</article-title>. <source>Sci. Educ</source>. <volume>98</volume>, <fpage>487</fpage>&#x02013;<lpage>516</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sce.21112</pub-id></mixed-citation>
</ref>
<ref id="B61">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sv&#x000E4;rd</surname> <given-names>J.</given-names></name> <name><surname>Sch&#x000F6;nborn</surname> <given-names>K. J.</given-names></name> <name><surname>Hallstr&#x000F6;m</surname> <given-names>J.</given-names></name></person-group> (<year>2024</year>). <article-title>Students&#x00027; perceptions of authenticity in an upper secondary technology education innovation project</article-title>. <source>Res. Sci. Technol. Educ</source>. <volume>42</volume>, <fpage>467</fpage>&#x02013;<lpage>487</lpage>. doi: <pub-id pub-id-type="doi">10.1080/02635143.2022.2116418</pub-id></mixed-citation>
</ref>
<ref id="B62">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>van Vorst</surname> <given-names>H.</given-names></name> <name><surname>Dorschu</surname> <given-names>A.</given-names></name> <name><surname>Fechner</surname> <given-names>S.</given-names></name> <name><surname>Kauertz</surname> <given-names>A.</given-names></name> <name><surname>Krabbe</surname> <given-names>H.</given-names></name> <name><surname>Sumfleth</surname> <given-names>E.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Charakterisierung und Strukturierung von Kontexten im naturwissenschaftlichen Unterricht&#x02014;Vorschlag einer theoretischen Modellierung [A theoretical framework for categorizing context-based tasks in science education]</article-title>. <source>Z. Didakt. Naturwiss</source>. <volume>21</volume>, <fpage>29</fpage>&#x02013;<lpage>39</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s40573-014-0021-5</pub-id></mixed-citation>
</ref>
<ref id="B63">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Voitle</surname> <given-names>F.</given-names></name> <name><surname>Heuckmann</surname> <given-names>B.</given-names></name> <name><surname>Kampa</surname> <given-names>N.</given-names></name> <name><surname>Kremer</surname> <given-names>K.</given-names></name></person-group> (<year>2022</year>). <article-title>Assessing students&#x00027; epistemic beliefs related to professional and school science</article-title>. <source>Int. J. Sci. Educ</source>. <volume>44</volume>, <fpage>1000</fpage>&#x02013;<lpage>1020</lpage>. doi: <pub-id pub-id-type="doi">10.1080/09500693.2022.2059821</pub-id></mixed-citation>
</ref>
<ref id="B64">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Watkins</surname> <given-names>J.</given-names></name> <name><surname>Coffey</surname> <given-names>J. E.</given-names></name> <name><surname>Redish</surname> <given-names>E. F.</given-names></name> <name><surname>Cooke</surname> <given-names>T. J.</given-names></name></person-group> (<year>2012</year>). <article-title>Disciplinary authenticity: enriching the reforms of introductory physics courses for life-science students</article-title>. <source>Phys. Rev. Phys. Educ. Res</source>. <volume>8</volume>:<fpage>010112</fpage>. doi: <pub-id pub-id-type="doi">10.1103/PhysRevSTPER.8.010112</pub-id></mixed-citation>
</ref>
<ref id="B65">
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zachrich</surname> <given-names>L.</given-names></name> <name><surname>Wagner</surname> <given-names>W.</given-names></name> <name><surname>Bertram</surname> <given-names>C.</given-names></name> <name><surname>Trautwein</surname> <given-names>U.</given-names></name></person-group> (<year>2024</year>). <article-title>Really? It depends! How authentic learning material affects involvement with personal stories of the past</article-title>. <source>Learn. Instr</source>. <volume>92</volume>:<fpage>101921</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.learninstruc.2024.101921</pub-id></mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2293057/overview">Joaquin Marc Veith</ext-link>, Leipzig University, Germany</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1794740/overview">Yasemin Tas</ext-link>, Atat&#x000FC;rk University, T&#x000FC;rkiye</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3294950/overview">Valentina Nachtigall</ext-link>, Ruhr University Bochum, Germany</p>
</fn>
</fn-group>
<fn-group>
<fn id="fn0003"><label>1</label><p>FEWAW is the German acronym for <italic>Fragebogen zur Erfassung der Wahrnehmung von Authentizit&#x000E4;t in der Wissenschaftsvermittlung</italic> (Questionnaire for Assessing the Perception of Authenticity in Science Communication).</p></fn>
</fn-group>
</back>
</article>