<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Educ.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Education</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Educ.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2504-284X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/feduc.2026.1741733</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Is flipped classroom really superior?&#x2014;Questioning the flip in K-12 teaching</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wiesner</surname>
<given-names>Patrick</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/836312"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Krauss</surname>
<given-names>Stefan</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/171606"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Stegm&#x00FC;ller</surname>
<given-names>Nathalie</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2324458"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Binder</surname>
<given-names>Karin</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/166832"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Mathematics Education, Faculty of Mathematics, University of Regensburg</institution>, <city>Regensburg</city>, <country country="de">Germany</country></aff>
<aff id="aff2"><label>2</label><institution>Mathematics Education, Faculty of Mathematics, University of Paderborn</institution>, <city>Paderborn</city>, <country country="de">Germany</country></aff>
<author-notes>
<corresp id="c001"><label>&#x002A;</label>Correspondence: Patrick Wiesner, <email xlink:href="mailto:patrick.wiesner@mathematik.uni-regensburg.de">patrick.wiesner@mathematik.uni-regensburg.de</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-19">
<day>19</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>11</volume>
<elocation-id>1741733</elocation-id>
<history>
<date date-type="received">
<day>07</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>29</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>05</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2026 Wiesner, Krauss, Stegm&#x00FC;ller and Binder.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Wiesner, Krauss, Stegm&#x00FC;ller and Binder</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-19">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>There is a contradiction between seven meta-analyses, all of which indicate a substantial benefit of the flipped classroom (FC) method for K-12 teaching and some larger study that found no such benefit when compared to &#x201C;traditional&#x201D; teaching. In the theoretical part of the paper, we shed light on this contradiction by consulting general literature on meta-analyses. Ranking the 50 included FC studies by the number of classes per experimental condition, we found a negative correlation between the &#x201C;size&#x201D; of a study and the effect in favor of FC. In the empirical part, we present an FC study with three conditions concerning mathematical teaching, based on <italic>n</italic>&#x202F;=&#x202F;950 students aged 11&#x2013;13, in which many relevant covariates (e.g., quality of instruction) were addressed. One FC condition was based on students&#x2019; knowledge acquisition through instructional videos at home (FCn: <italic>n</italic>&#x202F;=&#x202F;12 classes). Considering that self-regulation support might play a crucial role especially for young students working at home, another FC condition (FCS: <italic>n</italic>&#x202F;=&#x202F;12 classes) was implemented, in which students could learn additional math-free strategies concerning watching instructional videos. Both FC-conditions were experimentally compared with a control group of traditional teaching (TT: <italic>n</italic>&#x202F;=&#x202F;13 classes). No significant effect on learning gains was found between FCn and TT, indicating that &#x201C;flipping&#x201D; alone may not be more effective per se. However, a significant difference was found between FCS and FCn. Thus, supporting students&#x2019; self-regulation in addition may in indeed open the door to successful FC, even with very young students.</p>
</abstract>
<kwd-group>
<kwd>flipped classroom</kwd>
<kwd>inverted learning</kwd>
<kwd>K-12</kwd>
<kwd>instructional video</kwd>
<kwd>self-regulated learning</kwd>
<kwd>math education</kwd>
<kwd>flipped learning</kwd>
<kwd>FALKE research program</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This project is part of the &#x201C;Qualit&#x00E4;tsoffensive Lehrerbildung,&#x201D; a joint initiative of the Federal Government and the L&#x00E4;nder which aims to improve the quality of teacher training. The program is funded by the Federal Ministry of Education and Research. The authors are responsible for the content of this publication. (grant number: 1JA2010). Open Access publishing supported by the University of Regensburg.</funding-statement>
</funding-group>
<counts>
<fig-count count="4"/>
<table-count count="8"/>
<equation-count count="1"/>
<ref-count count="47"/>
<page-count count="13"/>
<word-count count="10665"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Digital Education</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Several meta-analyses document positive effects of the flipped classroom (FC) method in K-12 education (<xref ref-type="bibr" rid="ref8">Cheng et al., 2019</xref>; <xref ref-type="bibr" rid="ref15">G&#x00FC;ler et al., 2022</xref>; <xref ref-type="bibr" rid="ref21">L&#x00E5;g and S&#x00E6;le, 2019</xref>; <xref ref-type="bibr" rid="ref35">Strelan et al., 2020</xref>; <xref ref-type="bibr" rid="ref37">van Alten et al., 2019</xref>; <xref ref-type="bibr" rid="ref41">Wagner et al., 2020</xref>; <xref ref-type="bibr" rid="ref46">Zhu, 2021</xref>). According to <xref ref-type="table" rid="tab1">Table 1</xref>, the advantage of FC seems obvious from an empirical perspective. However, when attempting to demonstrate this effect in controlled &#x201C;large-scale&#x201D; designs while implementing multiple classes per experimental condition, the evidence astonishingly fails (<xref ref-type="bibr" rid="ref42">Wagner and Urhahne, 2021</xref>). In the present article, we review the existing meta-analyses regarding K-12 teaching (i.e., primary and secondary education) and discuss possible alternative reasons for the repeated confirmation of positive effects in favor of the FC method. Finally, we present the so far largest controlled FC study<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref> in K-12 teaching, in which we implement about 12 classes per experimental condition and control multiple possible covariates that might alternatively affect learning gains. Since self-regulation support for watching instructional videos at home seems to be crucial especially for young students (see below), an additional FC condition was implemented in which such strategies&#x2014;addressing &#x201C;before,&#x201D; &#x201C;while&#x201D; and &#x201C;after&#x201D; watching the video&#x2014;were explicitly provided.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Overview of meta-analyses comparing FC with traditional teaching considering learning gains in K-12.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Meta-analysis (year)<break/>Journal</th>
<th align="center" valign="top">K-12 level (# FC studies included)</th>
<th align="center" valign="top">Effect sizes in favor of FC (Cohen&#x2019;s <italic>d</italic> / Hedges <italic>g</italic>)<xref ref-type="table-fn" rid="tfn1"><sup>&#x002A;</sup></xref></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" rowspan="2"><xref ref-type="bibr" rid="ref11">Do&#x011F;an et al. (2021)</xref><xref ref-type="table-fn" rid="tfn2"><sup>&#x002A;&#x002A;</sup></xref><break/>Education &#x0026; Information Technologies</td>
<td align="center" valign="middle">Secondary level (11)</td>
<td align="center" valign="middle"><italic>d</italic>&#x202F;=&#x202F;0.58</td>
</tr>
<tr>
<td align="center" valign="middle">Primary level (4)</td>
<td align="center" valign="middle"><italic>d</italic>&#x202F;=&#x202F;1.89</td>
</tr>
<tr>
<td align="left" valign="middle"><xref ref-type="bibr" rid="ref46">Zhu (2021)</xref><break/>Educational Technology Research and Development</td>
<td align="center" valign="middle">Secondary &#x0026; primary level together (27)</td>
<td align="center" valign="middle"><italic>d</italic>&#x202F;=&#x202F;0.54</td>
</tr>
<tr>
<td align="left" valign="middle"><xref ref-type="bibr" rid="ref41">Wagner et al. (2020)</xref><break/>Zeitschrift f&#x00FC;r P&#x00E4;dagogische Psychologie</td>
<td align="center" valign="middle">Secondary level (25)</td>
<td align="center" valign="middle"><italic>d</italic>&#x202F;=&#x202F;0.42</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2"><xref ref-type="bibr" rid="ref35">Strelan et al. (2020)</xref><xref ref-type="table-fn" rid="tfn2"><sup>&#x002A;&#x002A;</sup></xref><break/>Educational Research Review</td>
<td align="center" valign="middle">Secondary level (21)</td>
<td align="center" valign="middle"><italic>g</italic>&#x202F;=&#x202F;0.64</td>
</tr>
<tr>
<td align="center" valign="middle">Primary level (3)</td>
<td align="center" valign="middle"><italic>g</italic>&#x202F;=&#x202F;0.47</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2"><xref ref-type="bibr" rid="ref21">L&#x00E5;g and S&#x00E6;le (2019)</xref><xref ref-type="table-fn" rid="tfn2"><sup>&#x002A;&#x002A;</sup></xref><break/>AERA Open</td>
<td align="center" valign="middle">Secondary level (16)</td>
<td align="center" valign="middle"><italic>g</italic>&#x202F;=&#x202F;0.45</td>
</tr>
<tr>
<td align="center" valign="middle">Primary level (12)</td>
<td align="center" valign="middle"><italic>g</italic>&#x202F;=&#x202F;0.44</td>
</tr>
<tr>
<td align="left" valign="middle"><xref ref-type="bibr" rid="ref37">van Alten et al. (2019)</xref><xref ref-type="table-fn" rid="tfn2"><sup>&#x002A;&#x002A;</sup></xref><break/>Educational Research Review</td>
<td align="center" valign="middle">Secondary level (11)</td>
<td align="center" valign="middle"><italic>g</italic>&#x202F;=&#x202F;0.36</td>
</tr>
<tr>
<td align="left" valign="middle"><xref ref-type="bibr" rid="ref8">Cheng et al. (2019)</xref><xref ref-type="table-fn" rid="tfn2"><sup>&#x002A;&#x002A;</sup></xref><break/>Education Tech Research</td>
<td align="center" valign="middle">Secondary level (12)</td>
<td align="center" valign="middle"><italic>g</italic>&#x202F;=&#x202F;0.21</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="tfn1">
<label>&#x002A;</label>
<p>The effect sizes <italic>d</italic> and <italic>g</italic> only vary by a slightly different calculation of the pooled standard deviation: &#x2502;<italic>g</italic> and <italic>d</italic>&#x2502;&#x202F;=&#x202F;0.2 small effect, &#x2502;<italic>g</italic> and <italic>d</italic>&#x2502;&#x202F;=&#x202F;0.5 medium effect, &#x2502;<italic>g</italic> and <italic>d</italic>&#x2502;&#x202F;=&#x202F;0.8 large effect.</p>
</fn>
<fn id="tfn2">
<label>&#x002A;&#x002A;</label>
<p>Meta-analysis also includes studies regarding tertiary level (which are not listed in this table).</p>
</fn>
</table-wrap-foot>
</table-wrap>
<sec id="sec2">
<label>1.1</label>
<title>Flipped classroom</title>
<p>The flipped classroom (FC; synonyms: inverted classroom, flipped learning, inverted learning) is a teaching method that has become increasingly popular in recent years with a growing focus on research that has all been conducted within the last 15&#x202F;years (<xref ref-type="bibr" rid="ref6">Cevikbas and Kaiser, 2020</xref>; <xref ref-type="bibr" rid="ref18">Hwang et al., 2019</xref>; <xref ref-type="bibr" rid="ref19">Kapur et al., 2022</xref>). <xref ref-type="bibr" rid="ref45">Zhang et al. (2024)</xref> for example provide an overview of current research trends on FC across all age groups and professions. Although there is no single definition of FC, almost all characterizations include the reversed order of traditional teaching as a &#x201C;minimum requirement.&#x201D; In contrast to traditional teaching&#x2014;i.e., the knowledge acquisition happens in school and most of the practice has to be done as homework&#x2014;the concept of FC means that new knowledge is acquired independently by students before the actual lesson to allow more time for reflection, elaboration, and practice in class (<xref ref-type="bibr" rid="ref4">Bishop and Verleger, 2013</xref>; <xref ref-type="bibr" rid="ref22">Lage et al., 2000</xref>). In terms of acquiring knowledge at home, students are often required to watch instructional videos and are sometimes given short additional quizzes to test their understanding of the content (e.g., <xref ref-type="bibr" rid="ref16">Hew et al., 2021</xref>; <xref ref-type="bibr" rid="ref41">Wagner et al., 2020</xref>). Some authors specify options for the subsequent plenary phase, for example group work, class surveys, cooperative learning, and student presentations or discussions (<xref ref-type="bibr" rid="ref2">Bergmann and Sams, 2012</xref>; <xref ref-type="bibr" rid="ref4">Bishop and Verleger, 2013</xref>; <xref ref-type="bibr" rid="ref26">Lo et al., 2017</xref>). Meanwhile, there are a lot of individual studies investigating the effect of FC in K-12 teaching (see <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref>). Taken together, these studies provide important insights into ideas, conditions, and consequences on teaching with the FC method.</p>
</sec>
<sec id="sec3">
<label>1.2</label>
<title>The effect of flipped classroom in K-12 education: meta-analytical evidence</title>
<p>Like any method, FC has potential opportunities as well as potential pitfalls (<xref ref-type="bibr" rid="ref7">Cevikbas and Kaiser, 2023</xref>). We summarize seven meta-analyses investigating the effect of FC regarding K-12 teaching that all were conducted within the last 7&#x202F;years (in <xref ref-type="table" rid="tab1">Table 1</xref>). We selected analyses that examined the effects in the K-12 sector separately and explicitly listed the included studies. All seven meta-analyses generally conclude that FC is more effective than traditional teaching in K-12 with effect sizes ranging from <italic>g</italic>&#x202F;=&#x202F;0.21 to <italic>d</italic>&#x202F;=&#x202F;1.89. The effect of these meta-analyses is in line with a recent review of meta-analyses from <xref ref-type="bibr" rid="ref24">Li et al. (2024)</xref> with an overall positive effect of <italic>g</italic>&#x202F;=&#x202F;0.53 in favor of FC in K-12 teaching. There are even two more reviews on meta-analyses (<xref ref-type="bibr" rid="ref16">Hew et al., 2021</xref>; <xref ref-type="bibr" rid="ref19">Kapur et al., 2022</xref>), yet, they deal predominantly with the tertiary level (for the restriction to K-12 teaching in the present article see 1.3).</p>
<p>A common finding of the meta-analyses is that most of the included studies compare FC based on instructional videos that have to be watched at home by students with traditional teaching without videos (e.g., see <xref ref-type="bibr" rid="ref46">Zhu, 2021</xref>). Furthermore, the positive effects of FC are often attributed to short quizzes (e.g., see <xref ref-type="bibr" rid="ref37">van Alten et al., 2019</xref>), at least when students receive feedback (<xref ref-type="bibr" rid="ref41">Wagner et al., 2020</xref>).</p>
<p>However, the evidence is mixed in terms of the subjects considered. While <xref ref-type="bibr" rid="ref41">Wagner et al. (2020)</xref> reported a larger effect in STEM subjects than in the humanities, <xref ref-type="bibr" rid="ref35">Strelan et al. (2020)</xref> found the opposite.</p>
<p>In <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref>, we provide an extensive overview of the about 50 individual studies comparing learning gains from FC to traditional teaching that were included in at least one of the seven meta-analyses in <xref ref-type="table" rid="tab1">Table 1</xref>. The first letters of the names (bold) in <xref ref-type="table" rid="tab1">Table 1</xref> are used in the left column in <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref> to indicate which study was included in which meta-analysis. Since most meta-analyses critically remark the generally small sizes of the FC studies conducted so far (e.g., <xref ref-type="bibr" rid="ref8">Cheng et al., 2019</xref>; <xref ref-type="bibr" rid="ref41">Wagner et al., 2020</xref>), we sorted the studies in <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref>, first, according to the average number of classes per experimental condition and, second, by the total number of participating students. As statistical multilevel modeling, which diminishes potential class effects, is only possible if more classes per condition are implemented, we chose the number of classes per condition as the core principle to judge the &#x201C;largeness&#x201D; of an FC study. Notably, in <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref> the bivariate Pearson correlation coefficient between the number of classes per condition and the effect sizes reported in <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref> yields <italic>r</italic>&#x202F;=&#x202F;&#x2212; 0.3 i.e. the larger a study, the smaller the observed effect in favor of FC.</p>
<p>More specifically, from <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref>, which contains 51 individual FC studies, it becomes clear that 40 studies implemented only one class per experimental condition. So far, there seems to be only one &#x2018;large&#x2019; FC study concerning K-12 teaching (<xref ref-type="bibr" rid="ref42">Wagner and Urhahne, 2021</xref>) with an average of 10 classes per condition, which was too new to be included in the meta-analyses of <xref ref-type="table" rid="tab1">Table 1</xref>. In this study, however, the most effective method was not FC, but watching the instructional video in class followed by student-centered instruction. Since the learning materials were basically identical in all conditions, the study by <xref ref-type="bibr" rid="ref42">Wagner and Urhahne (2021)</xref> has a high internal validity, but at the same time, there is a trade-off regarding external validity because instructional videos are typically not shown in class. Thus, there currently seems to be a major contradiction between the results of seven meta-analyses and an actual, large and internally valid FC study.</p>
<p>In experimental psychology, it is not uncommon for effects found in small studies to fail to be replicated in large and controlled experiments. Beyond the well-known problems demonstrated in the replication crisis (e.g., <xref ref-type="bibr" rid="ref28">Maxwell et al., 2015</xref>; <xref ref-type="bibr" rid="ref32">Shrout and Rodgers, 2018</xref>), <xref ref-type="bibr" rid="ref1">Barto&#x0161; et al. (2023)</xref>, <xref ref-type="bibr" rid="ref20">Kvarven et al. (2020)</xref>, and <xref ref-type="bibr" rid="ref33">Sotola (2022)</xref> examined meta-analyses in particular. The latter one investigated meta-analyses that were published in <italic>Psychology Bulletin</italic> and demonstrated that the risk of a meta-analysis confirming a positive effect when, in fact, there is a null effect is particularly high when the number of participants in the included studies is very small. He claimed in such cases that for every included study, there must be another study that was not published, meaning that these estimated unpublished 50 percent of all conducted studies might show no or a negative effect. While <xref ref-type="bibr" rid="ref20">Kvarven et al. (2020)</xref> assume that effect sizes in meta-analyses are overestimated almost by a factor of three, <xref ref-type="bibr" rid="ref1">Barto&#x0161; et al. (2023)</xref> stress that such effect sizes might be overestimated even more. The general conclusion of all three reviews is that meta-analyses, of course, are not unreliable per se, but should probably be interpreted with caution, and all agree that the reported effect sizes might be overestimated.</p>
<p>In the absence of contrary arguments or specialties that discriminate the meta-analyses of <xref ref-type="table" rid="tab1">Table 1</xref> from those reviewed by <xref ref-type="bibr" rid="ref1">Barto&#x0161; et al. (2023)</xref>, <xref ref-type="bibr" rid="ref20">Kvarven et al. (2020)</xref> and <xref ref-type="bibr" rid="ref33">Sotola (2022)</xref>, one might speculate that the theoretical analyses of the three papers may also&#x2014;at least partly&#x2014;underlie the seemingly overwhelming evidence in favor of FC instruction. This hypothesis is consistent with <xref ref-type="bibr" rid="ref19">Kapur et al.&#x2019;s (2022)</xref> review of meta-analyses exclusively on FC, which also suggests that effect sizes might be overestimated due to small sample sizes of the included studies and publication bias (see also <xref ref-type="bibr" rid="ref16">Hew et al., 2021</xref>). Yet, neither <xref ref-type="bibr" rid="ref19">Kapur et al. (2022)</xref> nor <xref ref-type="bibr" rid="ref16">Hew et al. (2021)</xref> focus on K-12 students (instead 90% of the studies considered by Kapur et al. were from the tertiary level). Of course, all authors of the meta-analyses in <xref ref-type="table" rid="tab1">Table 1</xref> are aware that their analyses depend on the individual studies included (e.g., <xref ref-type="bibr" rid="ref35">Strelan et al., 2020</xref>; <xref ref-type="bibr" rid="ref21">L&#x00E5;g and S&#x00E6;le, 2019</xref>), and discuss a possible publication bias (<xref ref-type="bibr" rid="ref46">Zhu, 2021</xref>), small study bias (<xref ref-type="bibr" rid="ref11">Do&#x011F;an et al., 2021</xref>), or the novelty effect, meaning that there is an initial boost in performance or enthusiasm that occurs when a new tool or method is introduced (<xref ref-type="bibr" rid="ref41">Wagner et al., 2020</xref>).</p>
</sec>
<sec id="sec4">
<label>1.3</label>
<title>The role of self-regulation for K-12 students</title>
<p>To provide the desired benefit of extended learning time for FC, students must prepare effectively for the lesson at home, since, otherwise, the success of the FC method is threatened (<xref ref-type="bibr" rid="ref8">Cheng et al., 2019</xref>; <xref ref-type="bibr" rid="ref14">Gillette et al., 2018</xref>; <xref ref-type="bibr" rid="ref37">van Alten et al., 2019</xref>). The issue of self-regulated learning (&#x201C;SRL&#x201D;) and the need to support self-regulation, especially for young students, is the reason why we focus on K-12 teaching in this paper. While studying at university requires strong self-regulation skills, students at school usually receive more help and explicit support (<xref ref-type="bibr" rid="ref40">Vosniadou, 2020</xref>). In the K-12 classroom, teachers implementing the FC method cannot automatically assume that learning at home, especially for very young students, will be competent and successful (or be done at all). Indeed, the review of meta-analyses by <xref ref-type="bibr" rid="ref19">Kapur et al. (2022)</xref> indirectly supports the claim that the relevance of SRL support decreases as students get older: At the tertiary level, the average effect size for FC (without specific SRL support and compared to traditional teaching) is the highest (<italic>g</italic>&#x202F;=&#x202F;0.93), while the younger the students, the lower the effect size (high schools: <italic>g</italic>&#x202F;=&#x202F;0.63, elementary schools: <italic>g</italic>&#x202F;=&#x202F;0.40).</p>
<p>However, in experimental FC studies, elaborated support regarding the appropriate use of instructional videos is found only rarely. <xref ref-type="table" rid="tab2">Table 2</xref> summarizes three studies that focus specifically on SRL in K-12 teaching by experimentally comparing two FC conditions with and without explicit SRL support (all three without implementing an additional control group regarding traditional teaching).</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Overview of studies comparing FC with and without SRL support in K-12 education.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Authors (year)<break/>Journal</th>
<th align="center" valign="top" rowspan="2"># Students, (# classes)</th>
<th align="left" valign="top" rowspan="2">Subject (grade)</th>
<th align="center" valign="top" colspan="2">Conditions: # students, (# classes)</th>
<th align="left" valign="top" rowspan="2">Results (relating to learning gains)</th>
</tr>
<tr>
<th align="center" valign="top">FC with SRL support</th>
<th align="center" valign="top">FC without SRL<break/>support</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle"><xref ref-type="bibr" rid="ref38">van Alten et al. (2020a)</xref><break/>Computers in Human Behavior</td>
<td align="center" valign="middle">154, (6)</td>
<td align="left" valign="middle">History (8th grade)</td>
<td align="center" valign="middle">74, <bold>(6)</bold></td>
<td align="center" valign="middle">80, <bold>(6)</bold></td>
<td align="left" valign="middle">No significant effect</td>
</tr>
<tr>
<td align="left" valign="middle"><xref ref-type="bibr" rid="ref39">van Alten et al. (2020b)</xref><break/>Computers &#x0026; Education</td>
<td align="center" valign="middle">115, (5)</td>
<td align="left" valign="middle">History (8th grade)</td>
<td align="center" valign="middle">50, <bold>(2</bold><xref ref-type="table-fn" rid="tfn3"><sup>&#x00B0;</sup></xref><bold>)</bold></td>
<td align="center" valign="middle">65, <bold>(3</bold><xref ref-type="table-fn" rid="tfn3">
<sup>
<bold>&#x00B0;</bold>
</sup>
</xref><bold>)</bold></td>
<td align="left" valign="middle">Significant positive effect in favor of FC with SRL</td>
</tr>
<tr>
<td align="left" valign="middle"><xref ref-type="bibr" rid="ref23">Lai and Hwang (2016)</xref><break/>Computers &#x0026; Education</td>
<td align="center" valign="middle">44, (2)</td>
<td align="left" valign="middle">Mathematics (4th grade)</td>
<td align="center" valign="middle">20, <bold>(1)</bold></td>
<td align="center" valign="middle">24, <bold>(1)</bold></td>
<td align="left" valign="middle">Significant positive effect in favor of FC with SRL</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="tfn3">
<label>&#x00B0;</label>
<p>Number of classes estimated by ourselves. Numbers in bold indicate the number of classes per condition.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The SRL support in the studies in <xref ref-type="table" rid="tab2">Table 2</xref> consists, for example, of short prompts that are implemented in the videos. However, general research on SRL over the last few decades has shown that it is not easy to guide students to actually use SRL strategies by simply transferring knowledge, but rather practical exercises are needed in addition (<xref ref-type="bibr" rid="ref10">Dignath and B&#x00FC;ttner, 2008</xref>; <xref ref-type="bibr" rid="ref44">Zeidner and Stoeger, 2019</xref>). In principle, it would be possible to address SRL even more dedicatedly&#x2014;based on general research on SRL (e.g., see <xref ref-type="bibr" rid="ref31">Pintrich, 1999</xref>)&#x2014;and to develop strategies explicitly designed for watching instructional videos, for instance, by following the ICAP framework (<xref ref-type="bibr" rid="ref9">Chi and Wylie, 2014</xref>), which especially deals with digital media.</p>
</sec>
<sec id="sec5">
<label>1.4</label>
<title>Rationale for the present study</title>
<p>In sum, despite many existing studies on the FC method in K-12 (<xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref>), it is still not certain whether this method is generally more effective than traditional teaching. <xref ref-type="bibr" rid="ref41">Wagner et al. (2020</xref>, p. 14) state that &#x201C;in particular, more randomized controlled trials with larger sample sizes and objective quantitative measures are needed.&#x201D; With respect to experimental control, for instance, <xref ref-type="bibr" rid="ref21">L&#x00E5;g and S&#x00E6;le (2019)</xref> and <xref ref-type="bibr" rid="ref8">Cheng et al. (2019)</xref> mention that most of the existing FC studies do not apply precise outcome measures and are therefore &#x201C;noisy&#x201D; (<xref ref-type="bibr" rid="ref35">Strelan et al., 2020</xref>). For example, often researchers themselves were the teachers in the studies, which violates the double-blind principle (<xref ref-type="bibr" rid="ref21">L&#x00E5;g and S&#x00E6;le, 2019</xref>), or there was no pretest to control for differences (<xref ref-type="bibr" rid="ref8">Cheng et al., 2019</xref>).</p>
<p>In the present paper, we report a controlled FC study regarding mathematics teaching in grades 6 and 7. With the implementation of <italic>n</italic>&#x202F;=&#x202F;12 classes per condition (a total of <italic>N</italic>&#x202F;=&#x202F;950 students were examined), this is the largest study in this area so far. Specifically, (a) a control group of &#x201C;traditional teaching&#x201D; was investigated and, therefore, we contribute to <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref>. In addition, we (b) implemented two FC-conditions, one with and one without explicit SRL-support for watching the instructional videos at home. In doing so, we contribute to <xref ref-type="table" rid="tab2">Table 2</xref>. Furthermore, we tried to manage all the requirements mentioned in <xref ref-type="bibr" rid="ref21">L&#x00E5;g and S&#x00E6;le (2019)</xref> such as clearly reporting the study design with a detailed description of the intervention, double-blind assessments, and psychometrically sound outcome measures.</p>
</sec>
</sec>
<sec id="sec6">
<label>2</label>
<title>Research questions</title>
<p>The main objectives of the present study are to investigate the effectiveness of an FC setting based on instructional videos in a robust, ecologically valid, and well-documented design when teaching mathematics to 11&#x2013;13&#x202F;year old students. Note that the following research questions are pedagogical in nature; the subject of mathematics serves rather as an exemplary discipline.</p>
<p>Research question 1 (RQ1): Do the mathematical learning gains of (young) students taught in an FC setting based on instructional videos differ from those taught in a traditional setting?</p>
<p>Research question 2 (RQ2): What is the effect of explicit support of SRL for watching instructional videos at home in an FC setting?</p>
<p>Since <xref ref-type="bibr" rid="ref42">Wagner and Urhahne (2021)</xref> could not replicate the positive effects in favor of FC with a large sample, we do not have a clear hypothesis on RQ1. Regarding RQ2, we speculate that SRL support might be the crucial factor for the effectiveness of FC, especially for students approximately of age 12&#x202F;years.</p>
</sec>
<sec sec-type="methods" id="sec7">
<label>3</label>
<title>Method</title>
<sec id="sec8">
<label>3.1</label>
<title>Study design</title>
<p>The intervention study with a pre&#x2012;post design was conducted in 6th and 7th grade mathematics classes in Bavarian schools (<xref ref-type="fig" rid="fig1">Figure 1</xref>). The participating classes were randomly distributed into three groups. The students were taught by their respective math teachers who received standardized training and materials prior to the intervention (see 3.3.4). Within each group, the teachers were following the identical manual (see 3.2). This uniform design of the lessons is intended to eliminate differences due to varying materials and to create comparability within, but also between experimental conditions. Basically, only the order of the used materials changed between the groups; therefore, all students received the same tasks and explanations except for the instructional videos (see 3.3.1) that were only obligatory in the FC conditions (<xref ref-type="fig" rid="fig1">Figure 1</xref>). Students&#x2019; performance was measured before and after the intervention using a pretest and a posttest (see 3.3.5). The lessons are described in more detail in 3.2.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Overview of the study design.</p>
</caption>
<graphic xlink:href="feduc-11-1741733-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Chart depicting three experimental conditions for teaching methods: Traditional Teaching (TT), Flipped Classroom with no SRL support (FCn), and Flipped Classroom with SRL support (FCS). TT involves 339 students across 13 classes, with four lessons and optional videos post-lesson. FCn has 316 students in 12 classes, while FCS includes 295 students in 12 classes, both with four lessons and mandatory pre-lesson videos. SRL support is explicitly provided in FCS. The timeline includes pretest (T1), explicit SRL, lessons (M1 to M4), and posttest (T2).</alt-text>
</graphic>
</fig>
<p>To answer RQ1, we compare classes in the traditional teaching (TT) condition with classes in the (typical) FC setting, in which students are provided with instructional videos but receive no explicit SRL support for watching them at home (FCn). A second FC condition (FCS) was implemented to answer RQ2: this group received an additional lesson on strategies (not mathematics-specific) about how to use instructional videos (see column &#x201C;SRL&#x201D; in <xref ref-type="fig" rid="fig1">Figure 1</xref>). It is important to note that no mathematical content was conveyed during this lesson to guarantee that no group had an advantage in this regard (3.2.2).</p>
</sec>
<sec id="sec9">
<label>3.2</label>
<title>Intervention</title>
<sec id="sec10">
<label>3.2.1</label>
<title>Four-lesson sequence in mathematics: M1&#x2013;M4</title>
<sec id="sec11">
<label>3.2.1.1</label>
<title>Structure of each lesson</title>
<p>Since the lessons of both FC groups were identical except for the additional SRL lesson (<xref ref-type="fig" rid="fig1">Figure 1</xref>), we will report them together in the following (<xref ref-type="table" rid="tab3">Table 3</xref>, right). Basically, also the TT group and the two FC conditions shared the same mathematical components (for an overview of the content of M1 &#x2013; M4 see <xref ref-type="fig" rid="fig2">Figure 2</xref>).</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Typical structure of a lesson in TT and in both FC settings.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Location</th>
<th align="left" valign="top">Traditional Teaching</th>
<th align="left" valign="top">Time</th>
<th align="left" valign="top">Location</th>
<th align="left" valign="top">Flipped Classroom</th>
<th align="left" valign="top">Time</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top" rowspan="4">School</td>
<td align="left" valign="middle">
<list list-type="simple">
<list-item>
<p>- Revision of homework</p>
</list-item>
<list-item>
<p>- Explanation of new content by teacher (following the structure of the instructional video)</p>
</list-item>
</list>
</td>
<td align="left" valign="top">&#x2248; 5&#x202F;min<break/>&#x2248; 10&#x202F;min</td>
<td align="left" valign="top">Home</td>
<td align="left" valign="middle">
<list list-type="simple">
<list-item>
<p>- Instructional video</p>
</list-item>
<list-item>
<p>- Quiz (the same as in TT)</p>
</list-item>
</list>
</td>
<td align="left" valign="middle">&#x2248; 15&#x202F;min</td>
</tr>
<tr>
<td align="left" valign="middle">
<list list-type="simple">
<list-item>
<p>- Consolidation (worksheet)</p>
</list-item>
</list>
</td>
<td align="left" valign="middle">&#x2248; 5&#x202F;min</td>
<td align="left" valign="top" rowspan="4">School</td>
<td align="left" valign="middle" rowspan="2">
<list list-type="simple">
<list-item>
<p>- Revision of the quiz &#x0026; opportunity for questions</p>
</list-item>
</list>
</td>
<td align="left" valign="middle" rowspan="2">&#x2248; 5&#x202F;min</td>
</tr>
<tr>
<td align="left" valign="middle">
<list list-type="simple">
<list-item>
<p>- Quiz (same as in FC)</p>
</list-item>
</list>
</td>
<td align="left" valign="middle">&#x2248; 5&#x202F;min</td>
</tr>
<tr>
<td align="left" valign="middle">
<list list-type="simple">
<list-item>
<p>- Exercises (part A)</p>
</list-item>
</list>
</td>
<td align="left" valign="middle">&#x2248; 20&#x202F;min</td>
<td align="left" valign="middle">
<list list-type="simple">
<list-item>
<p>- Consolidation (worksheet)</p>
</list-item>
</list>
</td>
<td align="left" valign="middle">&#x2248; 5&#x202F;min</td>
</tr>
<tr>
<td align="left" valign="top">Home</td>
<td align="left" valign="middle">
<list list-type="simple">
<list-item>
<p>- Homework exercises (part B)</p>
</list-item>
<list-item>
<p>Opportunity to watch the instructional video</p>
</list-item>
</list>
</td>
<td align="left" valign="middle">&#x2248; 15&#x202F;min</td>
<td align="left" valign="middle">
<list list-type="simple">
<list-item>
<p>- Exercises (part A and B)</p>
</list-item>
</list>
</td>
<td align="left" valign="middle">&#x2248; 35&#x202F;min</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Overview of the content of the four lessons M1 to M4.</p>
</caption>
<graphic xlink:href="feduc-11-1741733-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Comparison table showing four methods of convertingprobabilities using &#x201C;1 out of 4&#x201D; as an example. M1 converts natural frequencyto common fraction with diagram and text explanation. M2 shows conversionbetween percentage, decimal, and common fractions. M3 relates naturalfrequency to notation for every nth, illustrating with diagrams. M4 comparesnatural frequency to odds, using diagrams and text.</alt-text>
</graphic>
</fig>
<p>In the traditional setting (left in <xref ref-type="table" rid="tab3">Table 3</xref>), after the revision of homework&#x2014;not in the first lesson&#x2014;teachers were of course instructed to follow the explanations that were also given in the videos from the FC conditions. The new content then had to be consolidated with worksheets, and teachers provided a short quiz to check their students&#x2019; understanding. The remaining time was spent doing exercises (part A). Finally, students were assigned homework (exercises, part B) to follow up on the lesson. Students were informed that there were also instructional videos that could be voluntarily <italic>n</italic> = 12 classes watched after each lesson to review the topic.</p>
<p>In both FC settings, as a preparation for each lesson, the students received an instructional video, followed by a quiz (the same as in TT) with automatic feedback on a Moodle-based learning platform. At the beginning of the class, the quiz questions were reviewed, giving the teacher the opportunity to specifically address poorly-answered questions. Students were also encouraged to ask questions related to the video. The content of the video was then consolidated using the same worksheets as the TT group. Finally, the teacher reminded the students of their upcoming homework, namely, to watch the next instructional video and to answer the quiz questions.</p>
</sec>
<sec id="sec12">
<label>3.2.1.2</label>
<title>Content of the four mathematics lessons</title>
<p>The sequence of the four lessons dealt with <italic>numerical formats of relative frequencies</italic> and was identical with respect to the content covered for all groups (<xref ref-type="fig" rid="fig2">Figure 2</xref>). Students usually learn at school that relative frequencies can be written as <italic>common fractions</italic> (e.g., 1/4), <italic>decimal fractions</italic> (e.g., 0.25), or <italic>percentages</italic> (e.g., 25%). However, in media and everyday language one often finds alternative formats such as <italic>natural frequencies</italic> (e.g., &#x201C;1 out of 4&#x201D;), the notation <italic>every n<sup>th</sup></italic> (e.g., &#x201C;every fourth&#x201D;), or <italic>odds</italic> (e.g., &#x201C;1 to 3&#x201D;). Since common and decimal fractions and percentages are standard in teaching mathematics, we describe below the three other formats that were implemented in our study.</p>
<p><italic>Natural frequencies</italic> consist of two absolute frequencies a and b (i.e., &#x201C;a out of b&#x201D; with a, b &#x2208; <italic>N</italic>, a&#x202F;&#x2264;&#x202F;b and b&#x202F;&#x2260;&#x202F;0). In applied research, they are particularly famous because of their beneficial effect for understanding conditional probabilities (in so-called Bayesian situations; <xref ref-type="bibr" rid="ref13">Gigerenzer and Hoffrage, 1995</xref>; <xref ref-type="bibr" rid="ref30">McDowell and Jacobs, 2017</xref>). In the notation <italic>every n<sup>th</sup></italic>, e.g., 1/4 becomes &#x201C;every fourth,&#x201D; and in general 1/n becomes &#x201C;every n<sup>th</sup>.&#x201D; <italic>Odds</italic> describe the &#x2018;confrontation&#x2019; of the number of cases &#x201C;a&#x201D; with a particular characteristic to the number of cases &#x201C;b&#x201D; without that characteristic. Thus, in terms of odds, the probability of 50% can be expressed as &#x201C;1: 1&#x201D; (read: &#x201C;1 to 1&#x201D;) and the probability of 25% can be expressed as &#x201C;1: 3&#x201D; (read: &#x201C;1 to 3&#x201D;). Note that the odds of 1 to 3, therefore, correspond to the probability of 1/4.</p>
<p>Since empirical studies have documented students&#x2019; problems especially with the mutual conversions of such formats (<xref ref-type="bibr" rid="ref43">Wiesner et al., 2023</xref>), the first lesson began with an introduction to <italic>natural frequencies</italic> (M1) and their equivalence to <italic>common fractions</italic>. This was followed by a repetition of the known conversions between <italic>common fractions</italic>, <italic>decimal fractions,</italic> and <italic>percentages</italic> (M2). Finally, the notations <italic>every n<sup>th</sup></italic> (M3) and <italic>odds</italic> (M4) were introduced, each time related to <italic>natural frequencies</italic>, which is the most intuitive format (<xref ref-type="bibr" rid="ref3">Binder et al., 2015</xref>; <xref ref-type="bibr" rid="ref13">Gigerenzer and Hoffrage, 1995</xref>).</p>
</sec>
</sec>
<sec id="sec13">
<label>3.2.2</label>
<title>Additional lesson for SRL (only given to the FCS group)</title>
<p>After the pretest (see <xref ref-type="fig" rid="fig1">Figure 1</xref>) and before the mathematics sequence, an additional lesson (&#x201C;SRL&#x201D;) was taught exclusively in the FCS condition. The goal of this lesson was to help students work successfully with the instructional video at home by using specific strategies. This lesson was designed &#x201C;math-free&#x201D; to ensure that the students did not have an advantage in the following mathematics sequence. Following the SRL model by <xref ref-type="bibr" rid="ref31">Pintrich (1999)</xref>, four cognitive strategies were developed, specifically focusing on instructional videos:</p>
<list list-type="bullet">
<list-item>
<p><italic>repetition strategy</italic> (ensuring awareness before watching): watching the video several times, the first viewing serves as an overview; from the second viewing onwards the following strategies are added</p>
</list-item>
<list-item>
<p><italic>before and after strategy</italic> (before <italic>and</italic> after watching): noting down one&#x2019;s own knowledge before and after watching the video</p>
</list-item>
<list-item>
<p><italic>note taking strategy</italic> (while watching): stopping the video at important points (or statements that are not understood) to take notes in bullet points (or just to note a single question mark and the timestamp of the issue)</p>
</list-item>
<list-item>
<p><italic>ordering strategy</italic> (after watching): sorting notes from the note-taking trategy to structure the content of the video, adding more notes, or removing redundant ones</p>
</list-item>
</list>
<p>All strategies are in line with the ICAP framework on digital learning (Interactive, Constructive, Active, and Passive), which describes in detail how students&#x2019; learning performance increases from passive to interactive as they become more engaged with digital learning tools such as instructional videos (<xref ref-type="bibr" rid="ref9">Chi and Wylie, 2014</xref>). The strategy lesson itself was structured as follows: First, students were presented the &#x201C;monkey business illusion&#x201D; video by <xref ref-type="bibr" rid="ref9001">Simons (2010)</xref> in order to illustrate that absorbing all the information by watching a video only once can be difficult and to motivate the need for strategies, especially when watching instructional videos. For the development of the strategies in class, the teachers of the FCS group followed the respective manual.</p>
<p>Afterwards, the strategies were consolidated with a so-called &#x201C;Strategy Prism&#x201D; (see 3.3.3), which is supposed to help the students remember the strategies and support metacognition. Finally, and most importantly, according to pertinent SRL research (<xref ref-type="bibr" rid="ref10">Dignath and B&#x00FC;ttner, 2008</xref>; <xref ref-type="bibr" rid="ref34">Stoeger et al., 2015</xref>), the strategies were put into practice during a class exercise on a non-subject-specific video about democracy with the teachers&#x2019; guidance. In the FCS group, before each of the four instructional videos, students were reminded about the strategies by a one-minute video in which the Strategy Prism was recalled.</p>
</sec>
</sec>
<sec id="sec14">
<label>3.3</label>
<title>Materials and administration</title>
<p>All teachers received a standardized teacher training in which the content and the standardized implementation of the lessons were explained by the test administrator (the first author). They received background information on the administration of the study and teaching material (e.g., manuals for each lesson, worksheets, quizzes, solutions, etc.). The instructional videos and the quizzes were provided online.</p>
<sec id="sec15">
<label>3.3.1</label>
<title>Instructional videos</title>
<p>The instructional videos were created using the lightboard technique (<xref ref-type="bibr" rid="ref27">Lubrick et al., 2019</xref>), because this technique allows one to implement design recommendations from various authors, such as the Gaze Guidance Principle or the Dynamic Drawing Principle (<xref ref-type="bibr" rid="ref5">Brame, 2016</xref>; <xref ref-type="bibr" rid="ref29">Mayer et al., 2020</xref>). For each video, the same structure was used: first, the new type of numerical format to be learned was introduced by an example. Then, the link to an already known notation was shown by using and connecting their &#x2018;basic ideas&#x2019; (<italic>Grundvorstellungen</italic>; see pictorials in <xref ref-type="fig" rid="fig2">Figure 2</xref>). Finally, the new format was placed into an overall graphic overview, in which all numerical formats were integrated and that was completed step by step in the four-lesson sequence.</p>
<p>The length of an instructional video ranged from 6 to 9 min. The videos were, in principle, online available throughout the course to all students in the three groups, yet obligatory as preparation only in the FC conditions. Furthermore, to control whether students had actually watched the videos before the lesson (manipulation check), the teachers and researchers were able to verify this via tracking data. This showed that the classes in the FC conditions actually did the flip and that the students in these two conditions used the videos significantly more than the students in the TT conditions.</p>
</sec>
<sec id="sec16">
<label>3.3.2</label>
<title>Quizzes</title>
<p>Directly after watching the videos at home, the students of the FC groups were asked to complete a short quiz of four tasks, which was also done in class in TT. The questions were either closed (e.g., Which answers are correct? &#x201C;1 out of 2&#x201D; is &#x201C;1/2,&#x201D; &#x201C;50%,&#x201D; &#x201C;0.2,&#x201D; or &#x201C;20%&#x201D;) or semi-open (e.g., Reduce the natural frequency as much as possible: &#x201C;12 out of 24&#x201D; is &#x201C;___ out of ___&#x201D;). For the two FC groups, the quizzes were also available online. As with the instructional videos, teachers and researchers could check to see if students had completed the quizzes.</p>
</sec>
<sec id="sec17">
<label>3.3.3</label>
<title>The strategy prism (only given to FCS group)</title>
<p>The Strategy Prism, which was distributed to by teachers in the FCS condition, serves as a reminder that summarizes all four strategies in a nutshell to support metacognitive skills. It was designed as a flyer that can be folded into a prism, thereby creating three surface areas. The three faces represent the three time periods &#x201C;before watching,&#x201D; &#x201C;while watching,&#x201D; and &#x201C;after watching&#x201D; and displayed relevant aspects briefly in bullet points. The prism can be folded for easy transportation and quickly set up when needed. Therefore, whenever students want to watch a video, they can easily build the prism and turn the relevant face towards them according to the phase that they are in.</p>
</sec>
<sec id="sec18">
<label>3.3.4</label>
<title>Standardized guidelines for teachers</title>
<p>The mathematical content of the training was identical for teachers in the three conditions. Teachers in the FC conditions received additional information on how to implement the FC method, and teachers in the FCS group also received a plan for the additional strategy lesson.</p>
<p><xref ref-type="table" rid="tab4">Table 4</xref> summarizes an evaluation of the guidelines and teaching materials by the participating teachers after completion of the study. Especially the result of the last item demonstrates a high level of experimental control.</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Teachers&#x2019; evaluation of the content, training, and materials of the mathematics sequence.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Item</th>
<th align="center" valign="top">Mean (SD)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">The content of the mathematics lessons was relevant for my students.</td>
<td align="char" valign="middle" char="(">3.75 (0.55)</td>
</tr>
<tr>
<td align="left" valign="middle">The explications by the test administrator were clear and helpful.</td>
<td align="char" valign="middle" char="(">3.79 (0.54)</td>
</tr>
<tr>
<td align="left" valign="middle">The teaching materials were clearly structured.</td>
<td align="char" valign="middle" char="(">3.75 (0.44)</td>
</tr>
<tr>
<td align="left" valign="middle">During the study, I knew exactly what to do at any time.</td>
<td align="char" valign="middle" char="(">3.95 (0.22)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>N</italic>&#x202F;=&#x202F;34; Likert scale: 1&#x202F;=&#x202F;no agreement; 2&#x202F;=&#x202F;rather no agreement; 3&#x202F;=&#x202F;rather agreement; 4&#x202F;=&#x202F;total agreement.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec19">
<label>3.3.5</label>
<title>Pre- and posttest for measuring the learning gains</title>
<p>The pre- and posttest each consisted of 17 items; both tests shared the same structure, meaning that the items were formulated identically with only the numerical values differing between pre- and posttest. The first four (closed) items were similar to the following example: &#x201C;Every fifth means 20%&#x201D; a) &#x201C;true,&#x201D; b) &#x201C;false.&#x201D; The next eight (semi-opened) items required active conversions between two formats (e.g., &#x201C;1/6&#x201D; is &#x201C;__ out of 18&#x201D;). The following three items required students to decide whether a given inequality is true or false. In the remaining two items, students had to identify the largest and the smallest out of four provided ones in different formats. Each item of the pre- and posttest yielded one point and the scales of both tests were formed by adding the corresponding 17 scores.</p>
<p>The implemented videos, quizzes, all teaching materials for the four math lessons as well as the pre- and posttest can be found via the this <ext-link xlink:href="https://osf.io/v9fwj/?view_only=94ecca3f13214e37b87e5390c36e71d6" ext-link-type="uri">link</ext-link>.</p>
</sec>
<sec id="sec20">
<label>3.3.6</label>
<title>Control variables</title>
<p>To be able to statistically control the influence of potentially relevant covariates, the following control variables were additionally collected in the pre- and posttest lessons. For students: <italic>gender</italic>, <italic>native language</italic>, <italic>own computer or tablet</italic>, <italic>instructional quality</italic> (<italic>global)</italic>, <italic>instructional quality (of the four mathematics lessons), previous use of digital media in spare time/for school, reading habits</italic>, <italic>previous use of instructional videos at home</italic>, <italic>strategies for using instructional videos before intervention study</italic> and <italic>strategies for using instructional videos during intervention study</italic>; for teachers: <italic>gender</italic>, <italic>work experience (</italic>i.e.<italic>, years of being a teacher)</italic>, <italic>instructional quality</italic> (<italic>global), instructional quality (concerning the four mathematics lessons</italic>), <italic>positive attitude towards teaching (in general), attitude towards digital media</italic>, <italic>attitude towards instructional videos</italic>, and <italic>previous use of instructional videos</italic>. In <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 2</xref>, an example item is presented and the corresponding scales are summarized with indication of internal consistency for each scale.</p>
</sec>
</sec>
<sec id="sec21">
<label>3.4</label>
<title>Participants</title>
<p>Data were gathered from <italic>N</italic>&#x202F;=&#x202F;950 students of grade 6 and 7 of all school types across various locations in the state of Bavaria (Germany) in the school year 2022/23. In Germany basically there are an academic track (&#x201C;Gymnasium&#x201D;), a medium track (&#x201C;Realschule&#x201D;) and a vocational track (&#x201C;Mittelschule&#x201D;). The classes were chosen so that all students had the same prior knowledge: All classes knew fractions (common and decimal) and percentages, but none of them had explicit experience with the other three formats before. The students were taught in <italic>n</italic>&#x202F;=&#x202F;37 classes; these classes were distributed among <italic>n</italic>&#x202F;=&#x202F;20 schools. Three teachers taught two different classes (two of the TT group and one of the FCn group); thus the students were taught by <italic>n</italic>&#x202F;=&#x202F;34 teachers. <xref ref-type="table" rid="tab5">Table 5</xref> shows the distribution of students, classes, and teachers separated by condition. An overview of class size and gender distribution is provided in <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 2</xref>, <xref rid="SM1" ref-type="supplementary-material">Table B.4</xref>.</p>
<table-wrap position="float" id="tab5">
<label>Table 5</label>
<caption>
<p>Number of participating students (schools) and classes/teachers separated by experimental condition.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th>Condition</th>
<th align="center" valign="top">Students (schools)</th>
<th align="center" valign="top">Classes/teachers</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">TT</td>
<td align="char" valign="top" char="(">339 (6)</td>
<td align="char" valign="top" char="/">13/11</td>
</tr>
<tr>
<td align="left" valign="top">FCn</td>
<td align="char" valign="top" char="(">316 (5)</td>
<td align="char" valign="top" char="/">12/11</td>
</tr>
<tr>
<td align="left" valign="top">FCS</td>
<td align="char" valign="top" char="(">295 (9)</td>
<td align="char" valign="top" char="/">12/12</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Of all teachers who volunteered to participate in the study, 16 were female and 18 were male, with an average work experience of 14.2&#x202F;years. In all three groups, the average work experience, gender distribution of teachers and school type were comparable. Prior to data collection, the Bavarian Ministry of Education, school principals, teachers, parents, and the students themselves consented to the committed participation in the study.</p>
</sec>
<sec id="sec22">
<label>3.5</label>
<title>Statistical analysis</title>
<sec id="sec23">
<label>3.5.1</label>
<title>Coding of pre- and posttest</title>
<p>Concerning the closed items, the correct choice was scored with one point. In semi-open items (with a gap), all possible correct answers were scored as correct. For example, regarding the item 3b (pretest) concerning the conversion of 30% into a common fraction, several answers (e.g., 3/10 or also 30/100) received one point. For implementation in the statistical regression model (3.5.2), manifest scales were formed for the pre- and the posttest, respectively. In sum, a maximum score of 17 could be achieved on both the pretest and the posttest.</p>
</sec>
<sec id="sec24">
<label>3.5.2</label>
<title>Statistical model</title>
<p>From a statistical point of view, the two research questions RQ1 and RQ2 can be modeled simultaneously by setting the FCn condition as reference group. Due to the longitudinal and nested structure of the data, a linear mixed model (LMM) was used to predict students&#x2019; performance in the posttest while controlling for students&#x2019; performance in the pretest (<xref ref-type="bibr" rid="ref17">Hilbert et al., 2019</xref>). Since the FCn group served as reference group, the factors &#x201C;TT&#x201D; (0: no Traditional Teaching; 1: Traditional Teaching) and &#x201C;FCS&#x201D; (0: no SRL support; 1: SRL support) were included via dummy coding as well as the measurement point &#x201C;time&#x201D; (0: pretest, 1: posttest). In addition, since the effectiveness of the training from pretest to posttest was expected to vary between the different training groups, two interaction terms TT&#x202F;&#x00D7;&#x202F;time and FCS&#x202F;&#x00D7;&#x202F;time were modeled. The model equation was (<xref ref-type="table" rid="tab6">Table 6</xref> for the meaning of the various <inline-formula>
<mml:math id="M1">
<mml:mi>&#x03B2;</mml:mi>
</mml:math>
</inline-formula> coefficients).</p>
<disp-formula id="E1">
<mml:math id="M2">
<mml:mtable columnalign="left" displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:mi>y</mml:mi>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>int</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:msub>
<mml:mo>&#x22C5;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">TT</mml:mi>
</mml:msub>
<mml:mo>&#x22C5;</mml:mo>
<mml:mi mathvariant="italic">TT</mml:mi>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">FCS</mml:mi>
</mml:msub>
<mml:mo>&#x22C5;</mml:mo>
<mml:mi mathvariant="italic">FCS</mml:mi>
<mml:mo>+</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">TT</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>&#x22C5;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="italic">TT</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">FC</mml:mi>
<mml:mi mathvariant="normal">S</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>&#x22C5;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="italic">FCS</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:msub>
<mml:mi>i</mml:mi>
<mml:mtext mathvariant="italic">school</mml:mtext>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:msub>
<mml:mi>i</mml:mi>
<mml:mtext mathvariant="italic">class</mml:mtext>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:math>
</disp-formula>
<table-wrap position="float" id="tab6">
<label>Table 6</label>
<caption>
<p>Interpretation of the <inline-formula>
<mml:math id="M3">
<mml:mi>&#x03B2;</mml:mi>
</mml:math>
</inline-formula> coefficients in the LMM.</p>
</caption>
<table frame="hsides" rules="groups">
<tbody>
<tr>
<td align="left" valign="top">&#x03B2; coefficient</td>
<td align="left" valign="top">Interpretation</td>
</tr>
<tr>
<td align="left" valign="top">
<inline-formula>
<mml:math id="M4">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>int</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top">Intercept: <inline-formula>
<mml:math id="M5">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>int</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is the pre-value of the FCn group.<break/>Equation: <inline-formula>
<mml:math id="M6">
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">FCn</mml:mi>
<mml:mo>/</mml:mo>
<mml:mi mathvariant="italic">pre</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>int</mml:mi>
</mml:msub>
</mml:math>
</inline-formula></td>
</tr>
<tr>
<td align="left" valign="top">
<inline-formula>
<mml:math id="M7">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">TT</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top">Main effect &#x201C;TT&#x201D; (Traditional Teaching): <inline-formula>
<mml:math id="M8">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">TT</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> indicates the difference attributable solely to the traditional teaching factor (= difference between FCn and TT) at the pretest score.<break/>Equation: <inline-formula>
<mml:math id="M9">
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">TT</mml:mi>
<mml:mo>/</mml:mo>
<mml:mi mathvariant="italic">pre</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>int</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">TT</mml:mi>
</mml:msub>
</mml:math>
</inline-formula></td>
</tr>
<tr>
<td align="left" valign="top">
<inline-formula>
<mml:math id="M10">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">FCS</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top">Main effect &#x201C;FCS&#x201D; (SRL support): <inline-formula>
<mml:math id="M11">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">FCS</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> indicates the difference attributable solely to the &#x2018;strategies factor&#x2019; (= difference between FCn and FCS) at the pretest score.<break/>Equation: <inline-formula>
<mml:math id="M12">
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">FCS</mml:mi>
<mml:mo>/</mml:mo>
<mml:mi mathvariant="italic">pre</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>int</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">FCS</mml:mi>
</mml:msub>
</mml:math>
</inline-formula></td>
</tr>
<tr>
<td align="left" valign="top">
<inline-formula>
<mml:math id="M13">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top">Main effect time: <inline-formula>
<mml:math id="M14">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula> indicates difference attributable solely to the factor of time (= difference between post and pre) for the FCn group.<break/>Equation: <inline-formula>
<mml:math id="M15">
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">FCn</mml:mi>
<mml:mo>/</mml:mo>
<mml:mtext mathvariant="italic">post</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>int</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula></td>
</tr>
<tr>
<td align="left" valign="top">
<inline-formula>
<mml:math id="M16">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">TT</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top">Interaction effect TT <inline-formula>
<mml:math id="M17">
<mml:mo>&#x00D7;</mml:mo>
</mml:math>
</inline-formula> time (Traditional Teaching <inline-formula>
<mml:math id="M18">
<mml:mo>&#x00D7;</mml:mo>
</mml:math>
</inline-formula> time): <inline-formula>
<mml:math id="M19">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">TT</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> indicates the difference between FCn and TT concerning learning gains.<break/>Equation: <inline-formula>
<mml:math id="M20">
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">TT</mml:mi>
<mml:mo>/</mml:mo>
<mml:mtext mathvariant="italic">post</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>int</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">TT</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">TT</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula></td>
</tr>
<tr>
<td align="left" valign="top">
<inline-formula>
<mml:math id="M21">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">FCS</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top">Interaction effect FCS <inline-formula>
<mml:math id="M22">
<mml:mo>&#x00D7;</mml:mo>
</mml:math>
</inline-formula> time (SRL support <inline-formula>
<mml:math id="M23">
<mml:mo>&#x00D7;</mml:mo>
</mml:math>
</inline-formula> time): <inline-formula>
<mml:math id="M24">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">FCS</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> indicates the difference between FCn and FCS concerning learning gains.<break/>Equation: <inline-formula>
<mml:math id="M25">
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mo>/</mml:mo>
<mml:mtext mathvariant="italic">post</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>int</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">FCS</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">FCS</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula></td>
</tr>
</tbody>
</table>
</table-wrap>
<p>To account for the multilevel structure in the school context, the nesting of &#x201C;school&#x201D; and &#x201C;class&#x201D; was added using random effects in the LMM, which allows the individual parameters to be adjusted in order to obtain a more realistic estimate.</p>
<p>The applied LMM has the following three interpretative advantages compared to a mixed ANOVA (<xref ref-type="bibr" rid="ref17">Hilbert et al., 2019</xref>): a) If there were significant differences in the pretest score, the model would not only indicate whether they exist, but also where they are. In addition, significant differences between the interactions could be directly located. Both aspects eliminate the need for post-hoc analyses, which would result in a loss of statistical power; b) an LMM can handle missing values; thereby statistical power is increased; c) the LMM has less stringent model requirements (homoscedasticity; i.e., it is not required that the variances of the error terms are equal).</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="sec25">
<label>4</label>
<title>Results</title>
<sec id="sec26">
<label>4.1</label>
<title>Descriptive results of pre- and posttest</title>
<p><xref ref-type="table" rid="tab7">Table 7</xref> provides an overview of the descriptive results from the pre- and posttest. Both scales yielded satisfactory internal consistency aggregated across all groups as indicated by Cronbach&#x2019;s <italic>&#x03B1;</italic> (<italic>&#x03B1;</italic><sub>pretest</sub>&#x202F;=&#x202F;0.79; <italic>&#x03B1;</italic><sub>posttest</sub>&#x202F;=&#x202F;0.84). Across all three groups the average score in the pretest was 8.51 (<italic>SD</italic> = 2.96) and in the posttest 11.38 (<italic>SD</italic> = 3.30) with a Cohen&#x2019;s <italic>d</italic> of 0.95 (The male participants achieved an average score of 8.67 (SD = 3.06) in the pretest and 11.75 (<italic>SD</italic> = 3.25) in the posttest, corresponding to a Cohen&#x2019;s d of 0.98. For the female participants, the score was 8.34 (<italic>SD</italic> = 2.83) in the pretest and 10.94 (<italic>SD</italic> = 3.22) in the posttest, with a Cohen&#x2019;s <italic>d</italic> of 0.86.).</p>
<table-wrap position="float" id="tab7">
<label>Table 7</label>
<caption>
<p>Scales of pretest and posttest: Descriptive results.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th rowspan="2">Condition</th>
<th align="center" valign="top">Pretest</th>
<th align="center" valign="top">Posttest</th>
<th align="center" valign="top">Effect size</th>
</tr>
<tr>
<th align="center" valign="middle">M (<italic>SD</italic>)</th>
<th align="center" valign="middle">M (<italic>SD</italic>)</th>
<th align="center" valign="top">Cohens <italic>d</italic></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Traditional Teaching (TT)</td>
<td align="center" valign="middle">8.14 <italic>(2.69)</italic></td>
<td align="center" valign="middle">11.05 <italic>(3.34)</italic></td>
<td align="center" valign="top">1.06</td>
</tr>
<tr>
<td align="left" valign="middle">FC with no SRL support (FCn)</td>
<td align="center" valign="middle">9.12 <italic>(3.02)</italic></td>
<td align="center" valign="middle">11.59 <italic>(3.47)</italic></td>
<td align="center" valign="top">0.80</td>
</tr>
<tr>
<td align="left" valign="middle">FC with SRL support (FCS)</td>
<td align="center" valign="middle">8.25 <italic>(3.09)</italic></td>
<td align="center" valign="middle">11.54 <italic>(3.03)</italic></td>
<td align="center" valign="top">1.04</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>According to Cohen: &#x2502;<italic>d</italic>&#x2502;&#x202F;=&#x202F;0.2 small effect, &#x2502;<italic>d</italic>&#x2502;&#x202F;=&#x202F;0.5 medium effect, &#x2502;<italic>d</italic>&#x2502;&#x202F;=&#x202F;0.8 large effect.</p>
</table-wrap-foot>
</table-wrap>
<p><xref ref-type="fig" rid="fig3">Figure 3</xref> displays the resulting line diagram regarding students&#x2019; pre- and post-performances separated by the three experimental conditions.</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Students&#x2019; performances regarding time (pre vs. post) and experimental conditions (TT vs. FCn vs. FCS), with bars indicating the standard error (SE). For easier identification of the interaction effects, the vertical axis was truncated at score&#x202F;=&#x202F;6.</p>
</caption>
<graphic xlink:href="feduc-11-1741733-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Line graph comparing pretest and posttest scores for three experimental conditions: FCn, FCS, and TT. FCn shows scores increasing from 9.12 to 11.59 for 316 students. FCS rises from 8.25 to 11.54 for 295 students. TT increases from 8.14 to 11.05 for 339 students. Data is represented with solid, dashed, and dotted lines, respectively.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec27">
<label>4.2</label>
<title>Results of the linear mixed model</title>
<p>According to the research questions, in the LMM, the FCn condition was chosen as reference group (<xref ref-type="table" rid="tab8">Table 8</xref>). There was no significant difference in the pretest scores between the TT group and the reference group FCn (<inline-formula>
<mml:math id="M26">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi mathvariant="italic">TT</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.61</mml:mn>
<mml:mo>,</mml:mo>
</mml:math>
</inline-formula> <italic>p</italic>&#x202F;=&#x202F;0.10). Similarly, the pretest scores of the FCS group did not significantly differ from those of FCn group (<inline-formula>
<mml:math id="M27">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>S</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.39</mml:mn>
<mml:mo>,</mml:mo>
</mml:math>
</inline-formula> <italic>p</italic>&#x202F;=&#x202F;0.07). Consequently, the remaining difference cannot be significant (obviously, the pretest scores of TT and FCS are closest to each other, <xref ref-type="fig" rid="fig3">Figure 3</xref>). The general comparability of the three groups with respect to the pretest contributes to the internal validity of conclusions from the model, since possible interaction effects are less likely biased by varying a priori competencies of the students.</p>
<table-wrap position="float" id="tab8">
<label>Table 8</label>
<caption>
<p>Parameters of estimate, standard error, <italic>t</italic>-value and <italic>p</italic>-value (rounded to two decimals) of the LMM.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Marginal <italic>R</italic><sup>2</sup>&#x202F;=&#x202F;0.19</th>
<th align="center" valign="middle">Estimate</th>
<th align="center" valign="middle">
<italic>SE</italic>
</th>
<th align="center" valign="middle">
<italic>t</italic>
</th>
<th align="center" valign="middle">
<italic>p</italic>
</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">(Intercept)</td>
<td align="center" valign="bottom"><bold>9.33</bold></td>
<td align="center" valign="bottom">0.66</td>
<td align="center" valign="bottom">14.21</td>
<td align="center" valign="bottom"><bold>&#x003C;0.001&#x002A;&#x002A;&#x002A;</bold></td>
</tr>
<tr>
<td align="left" valign="top">Time</td>
<td align="center" valign="bottom"><bold>2.48</bold></td>
<td align="center" valign="bottom">0.18</td>
<td align="center" valign="bottom">14.10</td>
<td align="center" valign="bottom"><bold>&#x003C;0.001&#x002A;&#x002A;&#x002A;</bold></td>
</tr>
<tr>
<td align="left" valign="top">TT</td>
<td align="center" valign="bottom">&#x2212;1.61</td>
<td align="center" valign="bottom">0.93</td>
<td align="center" valign="bottom">&#x2212;1.72</td>
<td align="center" valign="bottom">0.10</td>
</tr>
<tr>
<td align="left" valign="top">FCS</td>
<td align="center" valign="bottom">&#x2212;1.39</td>
<td align="center" valign="bottom">0.75</td>
<td align="center" valign="bottom">&#x2212;1.85</td>
<td align="center" valign="bottom">0.07</td>
</tr>
<tr>
<td align="left" valign="top">TT &#x00D7; time</td>
<td align="center" valign="bottom">0.45</td>
<td align="center" valign="bottom">0.25</td>
<td align="center" valign="bottom">1.83</td>
<td align="center" valign="bottom">0.07</td>
</tr>
<tr>
<td align="left" valign="top">FCS &#x00D7; time</td>
<td align="center" valign="bottom"><bold>0.76</bold></td>
<td align="center" valign="bottom">0.26</td>
<td align="center" valign="bottom">2.98</td>
<td align="center" valign="bottom"><bold>0.003&#x002A;&#x002A;</bold></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Estimate, Estimated Coefficients; <italic>SE</italic>, Standard Error; <italic>t</italic>, <italic>t</italic>-values; <italic>p</italic>, <italic>p</italic>-value; <italic>R</italic><sup>2</sup>, coefficient of determination; ICC, intraclass correlation. Values in bold are significant.</p>
</table-wrap-foot>
</table-wrap>
<p>Note that the intercept of 9.33 (i.e., the pretest score of the reference group FCn) in <xref ref-type="table" rid="tab8">Table 8</xref> slightly varies from <xref ref-type="fig" rid="fig3">Figure 3</xref> (9.12), which indicates the correction due to the implemented multi-level modeling. The significance only indicates its difference from 0. Moving on to the posttest results, there was a significant improvement of the reference group (FCn) due to the teaching sequence (<inline-formula>
<mml:math id="M29">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>2.48</mml:mn>
<mml:mo>,</mml:mo>
</mml:math>
</inline-formula><italic>p</italic>&#x202F;&#x003C;&#x202F;0.001). In terms of inferential statistics, RQ1 and RQ2 can be answered by comparing the slopes in <xref ref-type="fig" rid="fig3">Figure 3</xref>. The difference in the slopes is analyzed by the interactions. Regarding RQ1, the interaction effect between time and TT did not yield significant differences in the improvement (<inline-formula>
<mml:math id="M30">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">TT</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mspace width="0.25em"/>
</mml:math>
</inline-formula>= 0.45, <italic>p</italic>&#x202F;=&#x202F;0.07). Regarding RQ2, the interaction effect between time and FCS was significant (<inline-formula>
<mml:math id="M31">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">FCS</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>0.76</mml:mn>
</mml:math>
</inline-formula>, <italic>p</italic>&#x202F;=&#x202F;0.003), indicating different learning gains between the participants of the FCn condition and the FCS condition. Therefore, supporting students by explicitly providing them with strategies for watching instructional videos indeed seems to have a crucial effect. Since the model displayed in <xref ref-type="table" rid="tab8">Table 8</xref> uses FCn as reference group, it allows no inferential statement on the difference between TT and FCS. However, when, e.g., alternatively selecting TT as the reference group, no significant difference between the TT and the FCS condition occurs (<inline-formula>
<mml:math id="M32">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">FCS</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:mtext mathvariant="italic">time</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mspace width="0.25em"/>
</mml:math>
</inline-formula>= 0.30, <italic>p</italic>&#x202F;=&#x202F;0.22).</p>
<p>The Intraclass Correlation Coefficient (69%) was computed to assess the reliability of the model and the proportion of variance explained by the random effects. Furthermore, the marginal R<sup>2</sup> indicated that the fixed factors accounted for approximately 19% of the variance, while the conditional R<sup>2</sup> suggested that fixed and random factors together explained approximately 64% variance.</p>
<p>Including all control variables (see 3.3.6 and <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 2</xref>, respectively) individually as possible predictors in the LMM, only the interaction of time with the student scale <italic>strategies for using instructional videos</italic> (after intervention) was significant (aggregated across all groups), providing further evidence from another (self-reported) perspective for the importance of teaching such strategies.</p>
<p>Regarding RQ1, the learning gains between FCn and TT did not differ significantly (without implementation of control variables), yet with a <italic>p</italic>-value close to significance (<italic>p</italic>&#x202F;=&#x202F;0.07). Here, six student variables turned this interaction into being significant when individually implemented in the LMM (but no teacher variable). However, one must note that the <italic>p</italic>-value varied only moderately even in these cases, meaning that individually implementing student variables leads to corresponding <italic>p</italic>-values ranging from 0.02 to 0.13. Thus, the (nearly or indeed) significant difference between both groups was also relatively stable with respect to the control variables implemented (see <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 2</xref>).</p>
<p>Concerning RQ2, only one of the teacher variables, namely the teachers&#x2019; self-perceived instructional quality during the intervention, changes the significance of the differential improvements between FCS and FCn into non-significance (RQ2). Furthermore, none of these variables affected the non-significance of the differential improvements of the TT and the FCS group in the alternative model (see above). Taken together, this indicates a robust difference between the two FC conditions, on the one hand, and, on the other hand, a stable comparability between a professionally prepared TT and an FC teaching in which students are not left alone with instructional videos. Note that the superiority of FCS (significant with respect to FCn and only at a descriptive level compared to TT) is remarkable especially, when considering group differences in the control variables. Concerning the four variables in which an ANOVA revealed a significant difference (2 x <italic>instructional quality, previous use of digital media/videos</italic>; see <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 2</xref>), the prerequisites in the FCS conditions were even <italic>worse</italic>.</p>
</sec>
<sec id="sec28">
<label>4.3</label>
<title>Results at class level</title>
<p><xref ref-type="fig" rid="fig4">Figure 4</xref> provides a comprehensive visual summary of class-level interactions, illustrating the overall diversity observed in the study by highlighting the substantial variations between classes.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Learning gains of the 37 single classes.</p>
</caption>
<graphic xlink:href="feduc-11-1741733-g004.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Line graph showing overall test scores from pretest to posttest for three experimental conditions: FCn (solid blue line with 12 classes), FCS (dashed green line with 12 classes), and TT (dotted black line with 13 classes). The scores range from 1 to 17, with notable lines labeled as number 36 and number 7.</alt-text>
</graphic>
</fig>
<p>Note that a large range of both pretest and posttest scores was observed across the sample in general but also within each group (<xref ref-type="fig" rid="fig4">Figure 4</xref>). One intriguing class-related result is, for example, that class no. 36 in the FS n group that achieved the highest posttest score of 14.9 also reached the second highest pretest score of 10.6. Interestingly, this class also exhibited the second-largest improvement. Class no. 7, which was part of the FCS condition, had an average pretest score of 4.5 and demonstrated the greatest improvement with a gain of 4.8 points. Notably, in all conditions, there were single classes with small and with large improvements. In sum, <xref ref-type="fig" rid="fig4">Figure 4</xref> illustrates that a) neither floor nor ceiling effects were present in the study, and b) no single class reduced their competence level, which indicates the effectiveness of the sequence in general. However, it also becomes clear that c) when randomly choosing just one or two classes per condition, based on our data, almost any interaction effect had been possible.</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec29">
<label>5</label>
<title>Discussion</title>
<p>The starting point of the present paper was an observed contradiction between a &#x2018;large&#x2019; FC study (<xref ref-type="bibr" rid="ref42">Wagner and Urhahne, 2021</xref>) and seven meta-analyses concerning K-12 teaching that had not yet included this recent study. While <xref ref-type="bibr" rid="ref42">Wagner and Urhahne (2021)</xref> found no benefit of FC teaching in a highly controlled setting with several classes per experimental condition, all seven meta-analyses, in contrast, claim a beneficial effect of the FC method. Consulting general literature on meta-analyses, including critiques, revealed that it is no exception in empirical psychological and pedagogical research that many relatively small studies find effects that cannot be replicated by large experiments. <xref ref-type="bibr" rid="ref33">Sotola (2022)</xref>, for example, cautions that effect sizes in meta-analyses might be overestimated, especially in in-depth studies with small samples.</p>
<p>We attempted to consider these thoughts regarding FC studies in the K-12 classroom. Sorting the K-12 FC studies from the seven meta-analyses by the criterion &#x201C;number of classes per experimental condition&#x201D; (<xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref>) made apparent that most of the individual FC studies implemented only one or two classes per condition. This fact is not only in line with many theoretical deliberations of <xref ref-type="bibr" rid="ref33">Sotola (2022)</xref>, <xref ref-type="bibr" rid="ref20">Kvarven et al. (2020)</xref>, and <xref ref-type="bibr" rid="ref1">Barto&#x0161; et al. (2023)</xref>; it also underlines the call of the authors of the FC meta-analyses for large and controlled empirical studies investigating the FC method, particularly for school students (<xref ref-type="bibr" rid="ref21">L&#x00E5;g and S&#x00E6;le, 2019</xref>; <xref ref-type="bibr" rid="ref37">van Alten et al., 2019</xref>; <xref ref-type="bibr" rid="ref42">Wagner and Urhahne, 2021</xref>).</p>
<p>In the present paper, we specifically focus on K-12 teaching, in which self-regulation support for students might be more necessary than for university students, since the latter ones should have a higher responsibility for their learning progress than school students (<xref ref-type="bibr" rid="ref38">van Alten et al., 2020a</xref>). In the empirical part, we implemented two experimental conditions (FCn vs. TT) to meet open demands and address the above contradiction (RQ1) through a further large and highly controlled study (and thus adding to <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref>). In addition, a second FC condition was created (FCS) in which the students received an additional math-free SRL lesson to explicitly support working with instructional videos at home to answer RQ2 (contributing to <xref ref-type="table" rid="tab2">Table 2</xref>).</p>
<p>Regarding RQ1, by applying a multi-level LMM, no significant difference was found between the learning gains of the students in the FCn and TT conditions. Yet, when implementing certain student control variables, the students of the TT group had a significantly higher learning increase. Regarding RQ2, the learning gains differed significantly in favor of the FCS group over the FCn group. All interaction effects were relatively stable when pertinent control scales entered the LMM as individual covariates.</p>
<p>Our study suggests that by providing school students with support for their SRL&#x2014;i.e., by teaching specific strategies for working with instructional videos&#x2014;FC might, indeed, become an effective method to enhance learning outcomes. One possible explanation for the significantly better outcomes observed in the FCS group can be provided by the ICAP framework (<xref ref-type="bibr" rid="ref9">Chi and Wylie, 2014</xref>). When students passively watch the video without being aware that they need to <italic>actively</italic> engage in the content, their knowledge acquisition remains passive. However, when students are made aware that simply watching videos may lead to missed opportunities for learning and that certain strategies can enhance their learning experience, their interaction with the learning content surpasses mere passivity. In fact, <xref ref-type="bibr" rid="ref9">Chi and Wylie (2014)</xref> suggest that, for instance, organizing and sorting notes can be viewed as an interactive process. Therefore, it might be crucial to allocate sufficient time to prepare students comprehensively to ensure a successful implementation of FC.</p>
<p>The present study highlights the importance of including several classes in educational interventions and using statistical multilevel modeling in general. Particularly, <xref ref-type="fig" rid="fig4">Figure 4</xref> emphasizes the need of addressing class effects to avoid misleading conclusions. Therefore, a comprehensive approach incorporating diverse classes within each condition is crucial for as internally valid assessments of intervention effects as possible.</p>
</sec>
<sec id="sec30">
<label>6</label>
<title>Limitations and future research</title>
<p>One limitation of our study is the short intervention duration of 2&#x202F;weeks. This short time frame perhaps did not allow the students to fully adapt to the FC method, and novelty effects cannot be entirely ruled out, even if many students may have already encountered this approach during the COVID-19 pandemic. In future research, it would be possible, for instance, to first &#x201C;train&#x201D; the FC method prior to actual data collection, allowing students to become more accustomed to the approach.</p>
<p>In addition, it is important to recognize that the results may not be generalizable to the entire K-12 education system because of the different characteristics of students in different grades or concerning different subjects. Conducting large-scale studies with multiple classes per condition would be desirable with other grades and subjects in order to obtain a clearer picture of the effectiveness of the FC approach in primary and secondary teaching. Currently, in the FALKE-d project, which includes this study, analyses are being conducted based on parallel designs and comparable sample sizes in five other school disciplines (chemistry, physics, music, german and politcs in elementary school). Furthermore and for the same reasons, it is not possible to infer conclusions on the tertiary level from the present study. Expanding ideas from our theoretical part to university teaching would be intriguing, for example, to see whether comparable contradictions exist there as well.</p>
<p>Furthermore, with the breakthrough of AI, knowledge transfer could be more individualized for students (e.g., via chatbots rather than via videos). Investigating the impact of switching to such forms of instruction is still in its infancy (<xref ref-type="bibr" rid="ref25">Lo and Hew, 2023</xref>). To the best of our knowledge, empirical findings are currently available only for the higher education sector (e.g., <xref ref-type="bibr" rid="ref36">Tang et al., 2025</xref>).</p>
</sec>
<sec sec-type="conclusions" id="sec31">
<label>7</label>
<title>Conclusion</title>
<p>Since the completion of our study, now, two large FC studies in K-12 education contradict the findings of seven meta-analyses. The years of publication of the meta-analyses (and of the individual FC studies) show that research on FC is still in the early stages. We are in line with <xref ref-type="bibr" rid="ref37">van Alten et al. (2019</xref>, p. 15) that &#x201C;Careful attention should be paid, however, to the design of the flipped classroom as simply flipping before and during classroom activities might be not enough.&#x201D; Our data suggest that in addition to &#x201C;flipping&#x201D; the classroom in K-12 teaching practice, students must be supported to watch instructional videos at home or this format will not be beneficial to them.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec32">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref rid="SM1" ref-type="supplementary-material">Supplementary material</xref>; further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="ethics-statement" id="sec33">
<title>Ethics statement</title>
<p>Ethical approval of an ethical council was not required for the study involving human samples in accordance with the local legislation and institutional requirements because approval has been obtained from the state government. Written informed consent for participation in this study was providedby the participants&#x2019; legal guardians/next of kin.</p>
</sec>
<sec sec-type="author-contributions" id="sec34">
<title>Author contributions</title>
<p>PW: Software, Conceptualization, Writing &#x2013; review &#x0026; editing, Investigation, Resources, Writing &#x2013; original draft, Supervision, Data curation, Project administration, Validation, Methodology, Formal analysis, Visualization. SK: Methodology, Conceptualization, Validation, Investigation, Supervision, Resources, Writing &#x2013; review &#x0026; editing, Funding acquisition, Project administration, Writing &#x2013; original draft. NS: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft, Data curation, Investigation. KB: Validation, Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft, Formal analysis, Software.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>The authors would like to thank all the members of the FALKE-d project, of which this study was a part. The authors would also like to thank the participating teachers and students.</p>
</ack>
<sec sec-type="COI-statement" id="sec35">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec36">
<title>Generative AI statement</title>
<p>The author(s) declared that Generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec37">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec38">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/feduc.2026.1741733/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/feduc.2026.1741733/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.pdf" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_2.pdf" id="SM2" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Barto&#x0161;</surname><given-names>F.</given-names></name> <name><surname>Maier</surname><given-names>M.</given-names></name> <name><surname>Shanks</surname><given-names>D. R.</given-names></name> <name><surname>Stanley</surname><given-names>T. D.</given-names></name> <name><surname>Sladekova</surname><given-names>M.</given-names></name> <name><surname>Wagenmakers</surname><given-names>E.-J.</given-names></name></person-group> (<year>2023</year>). <article-title>Meta-analyses in psychology often overestimate evidence for and size of effects</article-title>. <source>R. Soc. Open Sci.</source> <volume>10</volume>:<fpage>230224</fpage>. doi: <pub-id pub-id-type="doi">10.1098/rsos.230224</pub-id>, <pub-id pub-id-type="pmid">37416830</pub-id></mixed-citation></ref>
<ref id="ref2"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Bergmann</surname><given-names>J.</given-names></name> <name><surname>Sams</surname><given-names>A.</given-names></name></person-group> (<year>2012</year>). <source>Flip your classroom: Reach every student in every class every day</source>. <publisher-loc>Eugene, Oregon</publisher-loc>: <publisher-name>International Society for Technology in Education</publisher-name>.</mixed-citation></ref>
<ref id="ref3"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Binder</surname><given-names>K.</given-names></name> <name><surname>Krauss</surname><given-names>S.</given-names></name> <name><surname>Bruckmaier</surname><given-names>G.</given-names></name></person-group> (<year>2015</year>). <article-title>Effects of visualizing statistical information - an empirical study on tree diagrams and 2 &#x00D7; 2 tables</article-title>. <source>Front. Psychol.</source> <volume>6</volume>:<fpage>1186</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyg.2015.01186</pub-id>, <pub-id pub-id-type="pmid">26379569</pub-id></mixed-citation></ref>
<ref id="ref4"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Bishop</surname><given-names>J.</given-names></name> <name><surname>Verleger</surname><given-names>M.</given-names></name></person-group> (<year>2013</year>). The flipped classroom: a survey of the research, in 2013 ASEE Annual Conference &#x0026; 6/23/2013, 23.1200.1&#x2013;23.1200.18.</mixed-citation></ref>
<ref id="ref5"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Brame</surname><given-names>C. J.</given-names></name></person-group> (<year>2016</year>). <article-title>Effective educational videos: principles and guidelines for maximizing student learning from video content</article-title>. <source>CBE Life Sci. Educ.</source> <volume>15</volume>:<fpage>125</fpage>. doi: <pub-id pub-id-type="doi">10.1187/cbe.16-03-0125</pub-id>, <pub-id pub-id-type="pmid">27789532</pub-id></mixed-citation></ref>
<ref id="ref6"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cevikbas</surname><given-names>M.</given-names></name> <name><surname>Kaiser</surname><given-names>G.</given-names></name></person-group> (<year>2020</year>). <article-title>Flipped classroom as a reform-oriented approach to teaching mathematics</article-title>. <source>ZDM</source> <volume>52</volume>, <fpage>1291</fpage>&#x2013;<lpage>1305</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11858-020-01191-5</pub-id>, <pub-id pub-id-type="pmid">33042289</pub-id></mixed-citation></ref>
<ref id="ref7"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cevikbas</surname><given-names>M.</given-names></name> <name><surname>Kaiser</surname><given-names>G.</given-names></name></person-group> (<year>2023</year>). <article-title>Can flipped classroom pedagogy offer promising perspectives for mathematics education on pandemic-related issues? A systematic literature review</article-title>. <source>ZDM</source> <volume>55</volume>, <fpage>177</fpage>&#x2013;<lpage>191</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11858-022-01388-w</pub-id>, <pub-id pub-id-type="pmid">35789885</pub-id></mixed-citation></ref>
<ref id="ref8"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cheng</surname><given-names>L.</given-names></name> <name><surname>Ritzhaupt</surname><given-names>A. D.</given-names></name> <name><surname>Antonenko</surname><given-names>P.</given-names></name></person-group> (<year>2019</year>). <article-title>Effects of the flipped classroom instructional strategy on students&#x2019; learning outcomes: a meta-analysis</article-title>. <source>Educ. Technol. Res. Dev.</source> <volume>67</volume>, <fpage>793</fpage>&#x2013;<lpage>824</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11423-018-9633-7</pub-id></mixed-citation></ref>
<ref id="ref9"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chi</surname><given-names>M. T. H.</given-names></name> <name><surname>Wylie</surname><given-names>R.</given-names></name></person-group> (<year>2014</year>). <article-title>The ICAP framework: linking cognitive engagement to active learning outcomes</article-title>. <source>Educ. Psychol.</source> <volume>49</volume>, <fpage>219</fpage>&#x2013;<lpage>243</lpage>. doi: <pub-id pub-id-type="doi">10.1080/00461520.2014.965823</pub-id></mixed-citation></ref>
<ref id="ref10"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dignath</surname><given-names>C.</given-names></name> <name><surname>B&#x00FC;ttner</surname><given-names>G.</given-names></name></person-group> (<year>2008</year>). <article-title>Components of fostering self-regulated learning among students. A meta-analysis on intervention studies at primary and secondary school level</article-title>. <source>Metacogn. Learn.</source> <volume>3</volume>, <fpage>231</fpage>&#x2013;<lpage>264</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11409-008-9029-x</pub-id></mixed-citation></ref>
<ref id="ref11"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Do&#x011F;an</surname><given-names>Y.</given-names></name> <name><surname>Batd&#x0131;</surname><given-names>V.</given-names></name> <name><surname>Ya&#x015F;ar</surname><given-names>M. D.</given-names></name></person-group> (<year>2021</year>). <article-title>Effectiveness of flipped classroom practices in teaching of science: a mixed research synthesis</article-title>. <source>Res. Sci. Technol. Educ.</source> <volume>41</volume>, <fpage>393</fpage>&#x2013;<lpage>421</lpage>. doi: <pub-id pub-id-type="doi">10.1080/02635143.2021.1909553</pub-id></mixed-citation></ref>
<ref id="ref12"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Frei</surname><given-names>M.</given-names></name> <name><surname>Asen-Molz</surname><given-names>K.</given-names></name> <name><surname>Hilbert</surname><given-names>S.</given-names></name> <name><surname>Schilcher</surname><given-names>A.</given-names></name> <name><surname>Krauss</surname><given-names>S.</given-names></name></person-group> (<year>2020</year>). <source>Die Wirksamkeit von Erkl&#x00E4;rvideos im Rahmen der Methode Flipped Classroom</source>. <publisher-loc>Bildung, Schule</publisher-loc>, <publisher-name>Digitalisierung</publisher-name>. <volume>34</volume>, <fpage>284</fpage>&#x2013;<lpage>290</lpage>.</mixed-citation></ref>
<ref id="ref13"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gigerenzer</surname><given-names>G.</given-names></name> <name><surname>Hoffrage</surname><given-names>U.</given-names></name></person-group> (<year>1995</year>). <article-title>How to improve Bayesian reasoning without instruction: frequency formats</article-title>. <source>Psychol. Rev.</source> <volume>102</volume>, <fpage>684</fpage>&#x2013;<lpage>704</lpage>. doi: <pub-id pub-id-type="doi">10.1037/0033-295x.102.4.684</pub-id></mixed-citation></ref>
<ref id="ref14"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gillette</surname><given-names>C.</given-names></name> <name><surname>Rudolph</surname><given-names>M.</given-names></name> <name><surname>Kimble</surname><given-names>C.</given-names></name> <name><surname>Rockich-Winston</surname><given-names>N.</given-names></name> <name><surname>Smith</surname><given-names>L.</given-names></name> <name><surname>Broedel-Zaugg</surname><given-names>K.</given-names></name></person-group> (<year>2018</year>). <article-title>A Meta-analysis of outcomes comparing flipped classroom and lecture</article-title>. <source>Am. J. Pharm. Educ.</source> <volume>82</volume>:<fpage>6898</fpage>. doi: <pub-id pub-id-type="doi">10.5688/ajpe6898</pub-id>, <pub-id pub-id-type="pmid">30013248</pub-id></mixed-citation></ref>
<ref id="ref15"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>G&#x00FC;ler</surname><given-names>M.</given-names></name> <name><surname>Koko&#x00E7;</surname><given-names>M.</given-names></name> <name><surname>&#x00D6;nder B&#x00FC;t&#x00FC;ner</surname><given-names>S.</given-names></name></person-group> (<year>2022</year>). <article-title>Does a flipped classroom model work in mathematics education? A meta-analysis</article-title>. <source>Educ. Inf. Technol.</source> <volume>28</volume>, <fpage>57</fpage>&#x2013;<lpage>79</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10639-022-11143-z</pub-id></mixed-citation></ref>
<ref id="ref16"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hew</surname><given-names>K. F.</given-names></name> <name><surname>Bai</surname><given-names>S.</given-names></name> <name><surname>Dawson</surname><given-names>P.</given-names></name> <name><surname>Lo</surname><given-names>C. K.</given-names></name></person-group> (<year>2021</year>). <article-title>Meta-analyses of flipped classroom studies: a review of methodology</article-title>. <source>Educ. Res. Rev.</source> <volume>33</volume>:<fpage>100393</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.edurev.2021.100393</pub-id></mixed-citation></ref>
<ref id="ref17"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hilbert</surname><given-names>S.</given-names></name> <name><surname>Stadler</surname><given-names>M.</given-names></name> <name><surname>Lindl</surname><given-names>A.</given-names></name> <name><surname>Naumann</surname><given-names>F.</given-names></name> <name><surname>B&#x00FC;hner</surname><given-names>M.</given-names></name></person-group> (<year>2019</year>). <article-title>Analyzing longitudinal intervention studies with linear mixed models</article-title>. <source>Test. Psychomet. Methodol. Appl. Psychol.</source> <volume>26</volume>, <fpage>101</fpage>&#x2013;<lpage>119</lpage>. doi: <pub-id pub-id-type="doi">10.4473/TPM26.1.6</pub-id></mixed-citation></ref>
<ref id="ref18"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hwang</surname><given-names>G.-J.</given-names></name> <name><surname>Yin</surname><given-names>C.</given-names></name> <name><surname>Chu</surname><given-names>H.-C.</given-names></name></person-group> (<year>2019</year>). <article-title>The era of flipped learning: promoting active learning and higher order thinking with innovative flipped learning strategies and supporting systems</article-title>. <source>Interact. Learn. Environ.</source> <volume>27</volume>, <fpage>991</fpage>&#x2013;<lpage>994</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10494820.2019.1667150</pub-id></mixed-citation></ref>
<ref id="ref19"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kapur</surname><given-names>M.</given-names></name> <name><surname>Hattie</surname><given-names>J.</given-names></name> <name><surname>Grossman</surname><given-names>I.</given-names></name> <name><surname>Sinha</surname><given-names>T.</given-names></name></person-group> (<year>2022</year>). <article-title>Fail, flip, fix, and feed &#x2013; rethinking flipped learning: a review of meta-analyses and a subsequent meta-analysis</article-title>. <source>Front. Educ.</source> <volume>7</volume>:<fpage>956416</fpage>. doi: <pub-id pub-id-type="doi">10.3389/feduc.2022.956416</pub-id></mixed-citation></ref>
<ref id="ref20"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kvarven</surname><given-names>A.</given-names></name> <name><surname>Str&#x00F8;mland</surname><given-names>E.</given-names></name> <name><surname>Johannesson</surname><given-names>M.</given-names></name></person-group> (<year>2020</year>). <article-title>Comparing meta-analyses and preregistered multiple-laboratory replication projects</article-title>. <source>Nat. Hum. Behav.</source> <volume>4</volume>, <fpage>423</fpage>&#x2013;<lpage>434</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41562-019-0787-z</pub-id>, <pub-id pub-id-type="pmid">31873200</pub-id></mixed-citation></ref>
<ref id="ref21"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>L&#x00E5;g</surname><given-names>T.</given-names></name> <name><surname>S&#x00E6;le</surname><given-names>R. G.</given-names></name></person-group> (<year>2019</year>). <article-title>Does the flipped classroom improve student learning and satisfaction? A systematic review and meta-analysis</article-title>. <source>AERA Open</source> <volume>5</volume>:<fpage>233285841987048</fpage>. doi: <pub-id pub-id-type="doi">10.1177/2332858419870489</pub-id></mixed-citation></ref>
<ref id="ref22"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lage</surname><given-names>M. J.</given-names></name> <name><surname>Platt</surname><given-names>G. J.</given-names></name> <name><surname>Treglia</surname><given-names>M.</given-names></name></person-group> (<year>2000</year>). <article-title>Inverting the classroom: a gateway to creating an inclusive learning environment</article-title>. <source>J. Econ. Educ.</source> <volume>31</volume>, <fpage>30</fpage>&#x2013;<lpage>43</lpage>. doi: <pub-id pub-id-type="doi">10.1080/00220480009596759</pub-id></mixed-citation></ref>
<ref id="ref23"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lai</surname><given-names>C.-L.</given-names></name> <name><surname>Hwang</surname><given-names>G.-J.</given-names></name></person-group> (<year>2016</year>). <article-title>A self-regulated flipped classroom approach to improving students&#x2019; learning performance in a mathematics course</article-title>. <source>Comput. Educ.</source> <volume>100</volume>, <fpage>126</fpage>&#x2013;<lpage>140</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.compedu.2016.05.006</pub-id></mixed-citation></ref>
<ref id="ref24"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>S.</given-names></name> <name><surname>Fu</surname><given-names>W.</given-names></name> <name><surname>Liu</surname><given-names>X.</given-names></name> <name><surname>Hwang</surname><given-names>G.-J.</given-names></name></person-group> (<year>2024</year>). <article-title>Effectiveness of flipped classrooms for K&#x2013;12 students: evidence from a three-level meta-analysis</article-title>. <source>Rev. Educ. Res.</source> <volume>95</volume>:<fpage>261732</fpage>. doi: <pub-id pub-id-type="doi">10.3102/00346543241261732</pub-id></mixed-citation></ref>
<ref id="ref25"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lo</surname><given-names>C. K.</given-names></name> <name><surname>Hew</surname><given-names>K. F.</given-names></name></person-group> (<year>2023</year>). <article-title>A review of integrating AI-based chatbots into flipped learning: new possibilities and challenges</article-title>. <source>Front. Educ.</source> <volume>8</volume>:<fpage>1175715</fpage>. doi: <pub-id pub-id-type="doi">10.3389/feduc.2023.1175715</pub-id></mixed-citation></ref>
<ref id="ref26"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lo</surname><given-names>C. K.</given-names></name> <name><surname>Hew</surname><given-names>K. F.</given-names></name> <name><surname>Chen</surname><given-names>G.</given-names></name></person-group> (<year>2017</year>). <article-title>Toward a set of design principles for mathematics flipped classrooms: a synthesis of research in mathematics education</article-title>. <source>Educ. Res. Rev.</source> <volume>22</volume>, <fpage>50</fpage>&#x2013;<lpage>73</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.edurev.2017.08.002</pub-id></mixed-citation></ref>
<ref id="ref27"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lubrick</surname><given-names>M.</given-names></name> <name><surname>Zhou</surname><given-names>G.</given-names></name> <name><surname>Zhang</surname><given-names>J.</given-names></name></person-group> (<year>2019</year>). <article-title>Is the future bright? The potential of lightboard videos for student achievement and engagement in learning</article-title>. <source>Eurasia J. Math. Sci. Technol. Educ.</source> <volume>15</volume>:<fpage>108437</fpage>. doi: <pub-id pub-id-type="doi">10.29333/ejmste/108437</pub-id></mixed-citation></ref>
<ref id="ref28"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Maxwell</surname><given-names>S. E.</given-names></name> <name><surname>Lau</surname><given-names>M. Y.</given-names></name> <name><surname>Howard</surname><given-names>G. S.</given-names></name></person-group> (<year>2015</year>). <article-title>Is psychology suffering from a replication crisis? What does "failure to replicate" really mean?</article-title> <source>Am. Psychol.</source> <volume>70</volume>, <fpage>487</fpage>&#x2013;<lpage>498</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0039400</pub-id>, <pub-id pub-id-type="pmid">26348332</pub-id></mixed-citation></ref>
<ref id="ref29"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mayer</surname><given-names>R. E.</given-names></name> <name><surname>Fiorella</surname><given-names>L.</given-names></name> <name><surname>Stull</surname><given-names>A.</given-names></name></person-group> (<year>2020</year>). <article-title>Five ways to increase the effectiveness of instructional video</article-title>. <source>Educ. Technol. Res. Dev.</source> <volume>68</volume>, <fpage>837</fpage>&#x2013;<lpage>852</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11423-020-09749-6</pub-id></mixed-citation></ref>
<ref id="ref30"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>McDowell</surname><given-names>M.</given-names></name> <name><surname>Jacobs</surname><given-names>P.</given-names></name></person-group> (<year>2017</year>). <article-title>Meta-analysis of the effect of natural frequencies on Bayesian reasoning</article-title>. <source>Psychol. Bull.</source> <volume>143</volume>, <fpage>1273</fpage>&#x2013;<lpage>1312</lpage>. doi: <pub-id pub-id-type="doi">10.1037/bul0000126</pub-id>, <pub-id pub-id-type="pmid">29048176</pub-id></mixed-citation></ref>
<ref id="ref31"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pintrich</surname><given-names>P. R.</given-names></name></person-group> (<year>1999</year>). <article-title>The role of motivation in promoting and sustaining self-regulated learning</article-title>. <source>Int. J. Educ. Res.</source> <volume>31</volume>, <fpage>459</fpage>&#x2013;<lpage>470</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0883-0355(99)00015-4</pub-id></mixed-citation></ref>
<ref id="ref32"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Shrout</surname><given-names>P. E.</given-names></name> <name><surname>Rodgers</surname><given-names>J. L.</given-names></name></person-group> (<year>2018</year>). <article-title>Psychology, science, and knowledge construction: broadening perspectives from the replication crisis</article-title>. <source>Annu. Rev. Psychol.</source> <volume>69</volume>, <fpage>487</fpage>&#x2013;<lpage>510</lpage>. doi: <pub-id pub-id-type="doi">10.1146/annurev-psych-122216-011845</pub-id>, <pub-id pub-id-type="pmid">29300688</pub-id></mixed-citation></ref>
<ref id="ref9001"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Simons</surname><given-names>D. J.</given-names></name></person-group> (<year>2010</year>). <article-title>Monkeying around with the gorillas in our midst: familiarity with an inattentional-blindness task does not improve the detection of unexpected events</article-title>. <source>i-Perception</source> <volume>1</volume>, <fpage>3</fpage>&#x2013;<lpage>6</lpage>.</mixed-citation></ref>
<ref id="ref33"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sotola</surname><given-names>L. K.</given-names></name></person-group> (<year>2022</year>). <article-title>Garbage in, garbage out? Evaluating the evidentiary value of published Meta-analyses using Z-curve analysis</article-title>. <source>Collabra Psychol.</source> <volume>8</volume>:<fpage>32571</fpage>. doi: <pub-id pub-id-type="doi">10.1525/collabra.32571</pub-id></mixed-citation></ref>
<ref id="ref34"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stoeger</surname><given-names>H.</given-names></name> <name><surname>Fleischmann</surname><given-names>S.</given-names></name> <name><surname>Obergriesser</surname><given-names>S.</given-names></name></person-group> (<year>2015</year>). <article-title>Self-regulated learning (SRL) and the gifted learner in primary school: the theoretical basis and empirical findings on a research program dedicated to ensuring that all students learn to regulate their own learning</article-title>. <source>Asia Pac. Educ. Rev.</source> <volume>16</volume>, <fpage>257</fpage>&#x2013;<lpage>267</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s12564-015-9376-7</pub-id></mixed-citation></ref>
<ref id="ref35"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Strelan</surname><given-names>P.</given-names></name> <name><surname>Osborn</surname><given-names>A.</given-names></name> <name><surname>Palmer</surname><given-names>E.</given-names></name></person-group> (<year>2020</year>). <article-title>The flipped classroom: a meta-analysis of effects on student performance across disciplines and education levels</article-title>. <source>Educ. Res. Rev.</source> <volume>30</volume>:<fpage>100314</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.edurev.2020.100314</pub-id></mixed-citation></ref>
<ref id="ref36"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname><given-names>V.</given-names></name> <name><surname>Painho</surname><given-names>M.</given-names></name> <name><surname>Vorobeva</surname><given-names>D.</given-names></name></person-group> (<year>2025</year>). <article-title>Integrating tailored generative AI into the flipped classroom: a pilot implementation in higher education</article-title>. <source>Innov. Educ. Teach. Int.</source>, <volume>62</volume>:<fpage>1</fpage>&#x2013;<lpage>19</lpage>. doi: <pub-id pub-id-type="doi">10.1080/14703297.2025.2523898</pub-id></mixed-citation></ref>
<ref id="ref37"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>van Alten</surname><given-names>D. C.</given-names></name> <name><surname>Phielix</surname><given-names>C.</given-names></name> <name><surname>Janssen</surname><given-names>J.</given-names></name> <name><surname>Kester</surname><given-names>L.</given-names></name></person-group> (<year>2019</year>). <article-title>Effects of flipping the classroom on learning outcomes and satisfaction: a meta-analysis</article-title>. <source>Educ. Res. Rev.</source> <volume>28</volume>:<fpage>100281</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.edurev.2019.05.003</pub-id></mixed-citation></ref>
<ref id="ref38"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>van Alten</surname><given-names>D. C.</given-names></name> <name><surname>Phielix</surname><given-names>C.</given-names></name> <name><surname>Janssen</surname><given-names>J.</given-names></name> <name><surname>Kester</surname><given-names>L.</given-names></name></person-group> (<year>2020a</year>). <article-title>Effects of self-regulated learning prompts in a flipped history classroom</article-title>. <source>Comput. Hum. Behav.</source> <volume>108</volume>:<fpage>106318</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.chb.2020.106318</pub-id></mixed-citation></ref>
<ref id="ref39"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>van Alten</surname><given-names>D. C.</given-names></name> <name><surname>Phielix</surname><given-names>C.</given-names></name> <name><surname>Janssen</surname><given-names>J.</given-names></name> <name><surname>Kester</surname><given-names>L.</given-names></name></person-group> (<year>2020b</year>). <article-title>Self-regulated learning support in flipped learning videos enhances learning outcomes</article-title>. <source>Comput. Educ.</source> <volume>158</volume>:<fpage>104000</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.compedu.2020.104000</pub-id></mixed-citation></ref>
<ref id="ref40"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vosniadou</surname><given-names>S.</given-names></name></person-group> (<year>2020</year>). <article-title>Bridging secondary and higher education. The importance of self-regulated learning</article-title>. <source>Eur. Rev.</source> <volume>28</volume>, <fpage>S94</fpage>&#x2013;<lpage>S103</lpage>. doi: <pub-id pub-id-type="doi">10.1017/s1062798720000939</pub-id></mixed-citation></ref>
<ref id="ref41"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wagner</surname><given-names>M.</given-names></name> <name><surname>Gegenfurtner</surname><given-names>A.</given-names></name> <name><surname>Urhahne</surname><given-names>D.</given-names></name></person-group> (<year>2020</year>). <article-title>Effectiveness of the flipped classroom on student achievement in secondary education: a meta-analysis</article-title>. <source>Z. Padagog. Psychol.</source> <volume>35</volume>, <fpage>11</fpage>&#x2013;<lpage>31</lpage>. doi: <pub-id pub-id-type="doi">10.1024/1010-0652/a000274</pub-id></mixed-citation></ref>
<ref id="ref42"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wagner</surname><given-names>M.</given-names></name> <name><surname>Urhahne</surname><given-names>D.</given-names></name></person-group> (<year>2021</year>). <article-title>Disentangling the effects of flipped classroom instruction in EFL secondary education: when is it effective and for whom?</article-title> <source>Learn. Instr.</source> <volume>75</volume>:<fpage>101490</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.learninstruc.2021.101490</pub-id></mixed-citation></ref>
<ref id="ref43"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wiesner</surname><given-names>P.</given-names></name> <name><surname>Binder</surname><given-names>K.</given-names></name> <name><surname>Krauss</surname><given-names>S.</given-names></name> <name><surname>Steib</surname><given-names>N.</given-names></name> <name><surname>Leusch</surname><given-names>C.</given-names></name></person-group> (<year>2023</year>). <article-title>Sechs verschiedene Darstellungsarten f&#x00FC;r "25%" - und wie man sie ineinander umrechnen kann</article-title>. <source>Stoch. Sch.</source> <volume>43</volume>, <fpage>2</fpage>&#x2013;<lpage>12</lpage>.</mixed-citation></ref>
<ref id="ref44"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Zeidner</surname><given-names>M.</given-names></name> <name><surname>Stoeger</surname><given-names>H.</given-names></name></person-group> (<year>2019</year>) '<article-title>Self-regulated learning (SRL): a guide for the perplexed</article-title>', <source>High Abil. Stud.</source>, vol. <volume>30</volume>, 1&#x2013;2, pp. <fpage>9</fpage>&#x2013;<lpage>51</lpage>.</mixed-citation></ref>
<ref id="ref45"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>F.</given-names></name> <name><surname>Wang</surname><given-names>H.</given-names></name> <name><surname>Zhang</surname><given-names>H.</given-names></name> <name><surname>Sun</surname><given-names>Q.</given-names></name></person-group> (<year>2024</year>). <article-title>The landscape of flipped classroom research: a bibliometrics analysis</article-title>. <source>Front. Educ.</source> <volume>9</volume>:<fpage>1165547</fpage>. doi: <pub-id pub-id-type="doi">10.3389/feduc.2024.1165547</pub-id></mixed-citation></ref>
<ref id="ref46"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhu</surname><given-names>G.</given-names></name></person-group> (<year>2021</year>). <article-title>Is flipping effective? A meta-analysis of the effect of flipped instruction on K-12 students&#x2019; academic achievement</article-title>. <source>Educ. Technol. Res. Dev.</source> <volume>69</volume>, <fpage>733</fpage>&#x2013;<lpage>761</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11423-021-09983-6</pub-id></mixed-citation></ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0002">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2980310/overview">I Kadek Suartama</ext-link>, Ganesha University of Education, Indonesia</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0003">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2969456/overview">Teguh Arie Sandy</ext-link>, Ahli Media Consultant, Indonesia</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3149355/overview">I Gde Wawan Sudatha</ext-link>, Ganesha University of Education, Indonesia</p>
</fn>
</fn-group>
<fn-group>
<fn id="fn0001">
<label>1</label>
<p>The study was part of FALKE-d (<xref ref-type="bibr" rid="ref12">Frei et al., 2020</xref>).</p>
</fn>
</fn-group>
</back>
</article>