<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="methods-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Psychology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1664-1078</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyg.2026.1614844</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Methods</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Multiple imputation and pooling strategies for handling wide-format missing data in latent growth curve modeling</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Jia</surname>
<given-names>Fan</given-names>
</name>
<xref ref-type="aff" rid="aff1"/>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3038771"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yan</surname>
<given-names>Yueqi</given-names>
</name>
<xref ref-type="aff" rid="aff1"/>
<uri xlink:href="https://loop.frontiersin.org/people/3418048"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><institution>Psychological Sciences, University of California, Merced</institution>, <city>Merced</city>, <state>CA</state>, <country country="us">United States</country></aff>
<author-notes>
<corresp id="c001"><label>&#x002A;</label>Correspondence: Fan Jia, <email xlink:href="mailto:fjia3@ucmerced.edu">fjia3@ucmerced.edu</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-18">
<day>18</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>17</volume>
<elocation-id>1614844</elocation-id>
<history>
<date date-type="received">
<day>19</day>
<month>04</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>06</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>23</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2026 Jia and Yan.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Jia and Yan</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-18">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Latent growth curve modeling (LGCM), commonly employed in psychological sciences, often encounters the challenge of missing data, which introduce difficulties into the modeling process. While the full information maximum likelihood (FIML) is the dominant missing data handling technique in practice, an alternative class of techniques, multiple imputation (MI), may be preferable in certain scenarios. With the recent increasing attention shine lights on multilevel MI, we conducted a simulation study examining both standard wide-format (MI-wEMB and MI-wFCS) and multilevel long-format MI methods (MI-llMLM and MI-lqMLM) in comparison with FIML under various missing data conditions and model specifications. Our results indicate that while FIML generally produced unbiased estimates and accurate confidence intervals (CIs), most MI methods demonstrated comparable performance across most conditions. However, the proportion of missing data played a notable role, affecting the performance of the methods to varying extents. We also examined the variation in pooling strategies for the likelihood ratio test (LRT) statistic. The results showed that pooling strategies did not exhibit significant differences in performance, but long-format MI methods displayed concerningly conservative Type I error rates (near zero), regardless of the pooling strategy used. The study further revealed that when the analysis model was misspecified, FIML still maintained the highest power, followed by MI-wEMB, MI-wFCS, and MI-lqMLM. Sample size and missing data proportion had the most significant impact on power. Our findings provide practical guidance for researchers in selecting appropriate missing data approaches for LGCM.</p>
</abstract>
<kwd-group>
<kwd>latent growth curve modeling</kwd>
<kwd>long format</kwd>
<kwd>missing data</kwd>
<kwd>multilevel imputation</kwd>
<kwd>pooling</kwd>
<kwd>wide format</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was not received for this work and/or its publication.</funding-statement>
</funding-group>
<counts>
<fig-count count="12"/>
<table-count count="2"/>
<equation-count count="14"/>
<ref-count count="50"/>
<page-count count="19"/>
<word-count count="11081"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Quantitative Psychology and Measurement</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Latent growth curve modeling (LGCM) is widely used in psychological sciences to understand changes over time. It uses latent constructs to estimate the average coefficients of trajectories, e.g., latent intercept and slopes, accounting for individual variations in these coefficients. Although the multilevel modeling (MLM) approach also investigates the growth trajectory of repeated-measures outcomes of interests, LGCM has some advantages over it. For example, LGCM is a structural equation modeling-based approach, and therefore, it explicitly accounts for measurement errors to test the theoretical models. In addition, LGCM enables researchers to investigate relationship among latent growth components (i.e., latent intercept and slopes) and other variables (e.g., covariates and distal outcomes).</p>
<p>Since missing data has been an inevitable issue in longitudinal studies, researchers who employ LGCM must select appropriate methodological approaches to address this challenge. Typical issues caused by missing data are biased parameter estimates, distorted model fit, and power loss (<xref ref-type="bibr" rid="ref003">Enders, 2022</xref>). Traditional missing data handling approaches, such as listwise deletion and single imputations, have been considered ineffective and problematic. The state-of-arts missing data techniques, such as full information maximum likelihood (FIML) and multiple imputation (MI), have gained increasing popularity in recent decades. FIML is wildly recognized in the fields of latent variable analysis, including LGCM. Previous research revealed when the multivariate normality assumption holds, FIML could produce unbiased parameter estimates and appropriate test statistics, taking into account missing data simultaneously (<xref ref-type="bibr" rid="ref12">Collins et al., 2001</xref>; <xref ref-type="bibr" rid="ref16">Enders and Bandalos, 2001</xref>; <xref ref-type="bibr" rid="ref54">Rubin, 1987</xref>). In contrast, MI is a family of approaches that addresses missing data and perform data analysis in separate steps. While FIML is often the default approach for handling missing data in the LGCM, MI offers several important advantages in many applied research settings. For example, MI can readily accommodate a large number of auxiliary variables that are not part of the analysis model but improve missing data recovery, whereas incorporating numerous auxiliary variables with FIML can be cumbersome and computationally challenging (<xref ref-type="bibr" rid="ref22">Graham, 2003</xref>; <xref ref-type="bibr" rid="ref56">Savalei and Bentler, 2009</xref>). In addition, with complex models or complicated data structures, FIML may fail to converge or become computationally infeasible (<xref ref-type="bibr" rid="ref56">Savalei and Bentler, 2009</xref>). In contrary, MI can often overcome these limitations because the estimation is conducted on completed data sets following imputation (<xref ref-type="bibr" rid="ref18">Enders and Mansolf, 2018</xref>; <xref ref-type="bibr" rid="ref21">Gottschall et al., 2012</xref>). MI also offers greater flexibility in specifying imputation models, allowing it to better accommodate nonnormal or nonlinear relationships (<xref ref-type="bibr" rid="ref1">Asparouhov and Muth&#x00E9;n, 2010</xref>; <xref ref-type="bibr" rid="ref67">White et al., 2011</xref>; <xref ref-type="bibr" rid="ref30">Jia and Wu, 2022</xref>). This article therefore focuses on conditions under which both FIML and MI are practically applicable and directly comparable, in order to examine their relative performance in a controlled setting. Although MI&#x2019;s primary advantages often arise in scenarios where FIML is difficult or impossible to apply, establishing their comparative behavior under shared feasible conditions provides an important foundation for understanding their respective strengths and limitations.</p>
<p>Despite its advantages, MI is less straightforward than FIML. It generally requires three steps: imputation (i.e., generating multiple complete data sets with missing values filled in), analysis (i.e., fitting multiple imputed data sets into the target analysis model), and pooling (i.e., combining the analysis results from these multiple imputed data sets). To ensure unbiased parameter estimates, each step requires to implement appropriate approaches. Generally speaking, the imputation model should align with the research context, the nature of the missing data, and the underlying assumptions of missing data mechanism (we will describe it in the next section). For longitudinal data, the process for selecting an appropriate imputation strategy can be even more intricate. Specific to longitudinal studies, data can be organized in either a wide format or long format. In the wide format, observations across measurement occasions are presented in separate variables. In such data structure, each row stores all observational data for one individual but with a greater number of columns. In the LGCM framework, the most common practice is to perform both imputation and a subsequent data analysis in the wide format.</p>
<p>The long format involves vertically stacking the observations from multiple measurement occasions for each individual, with an additional variable indicating the measurement occasion. This data format is commonly used within the MLM framework. For data organized in long format, several imputation methods suitable for the multilevel data structure have been proposed, especially for cross-sectional analysis (e.g., students clustered within classroom; <xref ref-type="bibr" rid="ref002">Audigier and Resche-Rigon, 2018</xref>; <xref ref-type="bibr" rid="ref9">Carpenter et al., 2011</xref>; <xref ref-type="bibr" rid="ref17">Enders et al., 2020</xref>; <xref ref-type="bibr" rid="ref45">Quartagno and Carpenter, 2016</xref>, <xref ref-type="bibr" rid="ref46">2019</xref>; <xref ref-type="bibr" rid="ref51">Resche-Rigon and White, 2018</xref>; <xref ref-type="bibr" rid="ref66">van Buuren and Groothuis-Oudshoorn, 2011</xref>; <xref ref-type="bibr" rid="ref71">Zhao and Schafer, 2015</xref>). Conceptually, the multilevel imputation approach is appropriate for the longitudinal data for a LGCM model, i.e., repeated measures inherently nested within individuals. However, limited research has examined their performance with such longitudinal data structures. One complication is that such investigation requires data transformation between wide and long formats. Specifically, one needs to convert original data to long format for the multilevel imputation process, then revert imputed data back to wide format to accommodate the requirements of the latent growth analysis model. Given the growing awareness in multilevel MI methods for longitudinal designs and recent software advancements in the MLM framework (e.g., <xref ref-type="bibr" rid="ref17">Enders et al., 2020</xref>), it is timely and relevant to evaluate how these conceptually appropriate multilevel MI methods (a.k.a., <italic>long-format MI</italic>) perform when applied to repeated-measures data in LGCM, compared to standard, single-level <italic>wide-format MI</italic>.</p>
<p>Another recent methodological advancement in MI further motivated this study. While parameter estimates and standard errors can be directly pooled using <xref ref-type="bibr" rid="ref54">Rubin&#x2019;s (1987)</xref> rules, strategies for pooling likelihood ratio test (LRT) statistics and practical fit indices have received comparatively little attention. <xref ref-type="bibr" rid="ref003">Enders (2022)</xref> summarizes two strategies for pooling LRT: D<sub>2</sub> (<xref ref-type="bibr" rid="ref37">Li et al., 1991</xref>) and D<sub>3</sub> (<xref ref-type="bibr" rid="ref41">Meng and Rubin, 1992</xref>), which have been evaluated in a few simulation studies (e.g., <xref ref-type="bibr" rid="ref18">Enders and Mansolf, 2018</xref>; <xref ref-type="bibr" rid="ref39">Liu and Sriutaisuk, 2020</xref>) under different scenarios. In more recent work, <xref ref-type="bibr" rid="ref10">Chan and Meng (2022)</xref> proposed a new LRT statistic pooling strategy, which has been denoted as D<sub>4</sub> and proven at least as effective as D<sub>3</sub> while offering greater efficiency (<xref ref-type="bibr" rid="ref25">Grund et al., 2023</xref>). To our knowledge, none of these pooling approaches has been evaluated within the LGCM framework.</p>
<p>This current article aims to provide researchers with guidance on the best practice in handling missing data using MI when performing a LGCM, including recommendations for selecting appropriate imputation methods (e.g., wide-format vs. long-format) and optimal pooling strategies for model fit evaluation. The remaining of the article is organized as follows. We first introduce the basics and principals of LGCM, and then discuss missing data mechanisms and highlight the difference among commonly used missing data techniques, with a focus on MI. We then delve into the imputation phase in MI, introducing imputation algorithms and imputation models that are suitable for scenarios in the LGCM framework. Additionally, the pooling phase is reviewed, with an emphasis on the pooling strategies for the LRT statistic. Moving forward, we present a simulation study that compared the combinations of these imputation and pooling strategies with FIML. Finally, we provided an empirical example and conclude with practical guidance on implementing these strategies in MI in the context of LGCM.</p>
</sec>
<sec id="sec2">
<label>2</label>
<title>Latent growth curve modeling</title>
<p>A classic application of LGCM is to analyze continuous repeated-measures data collected from a group of individuals and estimate intraindividual (within-person) growth over time [i.e., latent intercept and latent slope(s)], while accounting for variability at interindividual (between-person) levels (<xref ref-type="bibr" rid="ref35">Kohli and Harring, 2013</xref>; <xref ref-type="bibr" rid="ref6">Bollen and Curran, 2006</xref>). A latent intercept captures the initial level; and latent slope(s) usually represent a growth pattern as a polynomial function of time, such as linear, quadratic, cubic, etc. These two types of latent growth factors are measured by their mean levels, individual variances, and covariances between them (<xref ref-type="bibr" rid="ref13">Depaoli et al., 2023</xref>). The repeated measures are indicators of latent growth factors, linked by factor loadings. A typical latent quadratic model, for example, can be presented in matrix form in <xref ref-type="disp-formula" rid="E2">Equation 1</xref>.</p>
<disp-formula id="E1">
<mml:math id="M1">
<mml:mi>y</mml:mi>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x039B;</mml:mi>
<mml:mi>y</mml:mi>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mi>&#x03B7;</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>&#x03B5;</mml:mi>
<mml:mo>,</mml:mo>
</mml:math>
</disp-formula>
<disp-formula id="E2">
<mml:math id="M2">
<mml:mo stretchy="true">[</mml:mo>
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mo>&#x22EE;</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mi>T</mml:mi>
</mml:msub>
</mml:mtd>
</mml:mtr>
</mml:mtable>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo stretchy="true">[</mml:mo>
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mtd>
<mml:mtd>
<mml:msubsup>
<mml:mi>t</mml:mi>
<mml:mn>1</mml:mn>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mtd>
<mml:mtd>
<mml:msubsup>
<mml:mi>t</mml:mi>
<mml:mn>2</mml:mn>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:mtd>
<mml:mtd>
<mml:msubsup>
<mml:mi>t</mml:mi>
<mml:mn>3</mml:mn>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mo>&#x22EE;</mml:mo>
</mml:mtd>
<mml:mtd>
<mml:mo>&#x22EE;</mml:mo>
</mml:mtd>
<mml:mtd>
<mml:mo>&#x22EE;</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mi>T</mml:mi>
</mml:msub>
</mml:mtd>
<mml:mtd>
<mml:msubsup>
<mml:mi>t</mml:mi>
<mml:mi>T</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mtd>
</mml:mtr>
</mml:mtable>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">[</mml:mo>
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mi>I</mml:mi>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
</mml:mtable>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo>+</mml:mo>
<mml:mo stretchy="true">[</mml:mo>
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>&#x03B5;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>&#x03B5;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>&#x03B5;</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mo>&#x22EE;</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>&#x03B5;</mml:mi>
<mml:mi>T</mml:mi>
</mml:msub>
</mml:mtd>
</mml:mtr>
</mml:mtable>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo>,</mml:mo>
</mml:math>
<label>(1)</label>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M3">
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is time code for the <italic>j</italic><sup>th</sup> measurement occasion; <inline-formula>
<mml:math id="M4">
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> represents a vector of outcome for all individuals at the <italic>j</italic><sup>th</sup> measurement occasion; and <inline-formula>
<mml:math id="M5">
<mml:msub>
<mml:mi>&#x03B5;</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is a residual vector at the <italic>j</italic><sup>th</sup> measurement occasion (<italic>j</italic>&#x202F;=&#x202F;1, 2, &#x2026; <italic>T</italic>). The latent intercept, latent linear slope, and latent quadratic slope are denoted by <inline-formula>
<mml:math id="M6">
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mi>I</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math id="M7">
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>, and <inline-formula>
<mml:math id="M8">
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>, respectively. For a linear model, the model is a reduced form of <xref ref-type="disp-formula" rid="E2">Equation 1</xref>, with the <inline-formula>
<mml:math id="M9">
<mml:msub>
<mml:mi>&#x039B;</mml:mi>
<mml:mi>y</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> matrix only containing the first two columns, and <inline-formula>
<mml:math id="M10">
<mml:mi>&#x03B7;</mml:mi>
</mml:math>
</inline-formula> matrix only containing <inline-formula>
<mml:math id="M11">
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mi>I</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math id="M12">
<mml:msub>
<mml:mi>&#x03B7;</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>.</p>
<p>The model fit evaluation is commonly based on the likelihood ratio test (LRT) statistics, which assesses the difference between the model implied and observed covariance matrices and mean vectors. The LRT statistic, denoted <italic>T</italic>, follows a <inline-formula>
<mml:math id="M13">
<mml:msup>
<mml:mi>&#x03C7;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:math>
</inline-formula>distribution assuming data are normally distributed and can be written as follows.</p>
<disp-formula id="E3">
<mml:math id="M14">
<mml:mi>T</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo stretchy="true">[</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03B8;</mml:mi>
<mml:mo stretchy="true">&#x0302;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>l</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03B2;</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo>,</mml:mo>
</mml:math>
<label>(2)</label>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M15">
<mml:mi>l</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03B8;</mml:mi>
<mml:mo stretchy="true">&#x0302;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> is the maximized log-likelihood under the hypothesized model, and <inline-formula>
<mml:math id="M16">
<mml:mi>l</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03B2;</mml:mi>
<mml:mo stretchy="true">&#x02DC;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> is the corresponding log-likelihood of the saturated model (<xref ref-type="bibr" rid="ref5">Bollen, 1989</xref>).</p>
</sec>
<sec id="sec3">
<label>3</label>
<title>Multiple imputation in missing data handling</title>
<p>Data can be missing during the data collection process through various ways. <xref ref-type="bibr" rid="ref004">Rubin (1976)</xref> summarized three primary missing data mechanisms, including missing completely at random (MCAR), missing at random (MAR), and missing not at random (MNAR). MAR occurs when probability of data being missing on a variable is only related to the observed variables. MCAR is sometimes considered as a special case of MAR; the former refers to the situation where the probability of data being missing on a variable is unrelated to its values or any other observed variables in the dataset. These two mechanisms are commonly referred to as &#x201C;ignorable missingness&#x201D; when the condition of &#x201C;distinct parameters&#x201D; holds. That means, the parameters governing the distribution of the data are distinct from those governing the missing data process. In an LGCM, this implies that the joint likelihood can be separated into two parts: a part for the LGCM and a part for the missingness mechanism. Because the missingness part does not contain information about the growth parameters, it does not need to be modeled in order to obtain valid estimates of the growth parameters. In contrast, MNAR, represents a &#x201C;non-ignorable&#x201D; missingness scenario where probability of data being missing on a variable is determined by unobserved values themselves, demanding more intricate methodological approaches for an effective solution. A common type of missingness in longitudinal studies, called <italic>attrition</italic>, happens when participants drop out from a study after initially contributing data in the early measurement occasions. Attrition at later occasions is likely to be informed by the data available from the preceding occasions (<xref ref-type="bibr" rid="ref001">Allison, 2001</xref>), in which case, the missing data due to attrition can reasonably be assumed to be MAR.</p>
<p>In situations where an &#x201C;ignorable&#x201D; missing data mechanism is present (i.e., MCAR or MAR), modern missing data techniques, such as full information maximum likelihood (FIML) or multiple imputation (MI), can effectively recover the missing information. FIML is an approach that estimates the parameters of a statistical model and handle missing data simultaneously. It is based on an iterative process that aims to find the values maximizing the overall log-likelihood, while accounting for the patterns of missing data (<xref ref-type="bibr" rid="ref003">Enders, 2022</xref>). MI, in contrast, typically handle missing data through three steps. In MI, missing values are first imputed multiple times based on a certain parametric or nonparametric model, creating multiple complete datasets (the imputation step). These imputed datasets are subsequently used for the target statistical analysis individually (the analysis step). Then, the results of all the multiple imputed datasets are pooled to generate the final result (the pooling step; <xref ref-type="bibr" rid="ref54">Rubin, 1987</xref>). This multi-step approach could avoid potential convergence problems FIML may have with complex data or models and enables flexibility in incorporating auxiliary variable and handling various types of missing data. However, the implementation of MI could be more challenging than FIML as it requires more complex methodological considerations. For example, researchers need to make decisions on the choices of (1) imputation algorithm, (2) imputation model, and (3) pooling strategies for different types of statistics, especially for the LRT statistic and model fit indices.</p>
<sec id="sec4">
<label>3.1</label>
<title>Imputation algorithms</title>
<p>Imputation algorithms refer to the procedures used to fill in missing data in a dataset. The most well-known imputation algorithms in the missing data literature are distinguished by whether missing values are imputed based on a multivariate distribution or a series of conditional univariate distributions. The first type of algorithms includes the joint modeling (JM; <xref ref-type="bibr" rid="ref58">Schafer, 1997</xref>) and expectation&#x2013;maximization with bootstrapping (EMB; <xref ref-type="bibr" rid="ref26">Honaker et al., 2011</xref>). Both algorithms assume data follow a multivariate normal distribution and are theoretically equivalent (<xref ref-type="bibr" rid="ref15">Enders, 2011</xref>). The JM algorithm uses an iterative Markov Chain Monte Carlo (MCMC) procedure that alternates between drawing imputations for missing values and drawing parameters from their conditional posterior distributions. The EMB algorithm creates a specified number of bootstrapped samples (e.g., 5,000) and then applies the expectation&#x2013;maximization algorithm to obtain maximum likelihood estimates of the mean vector and covariance matrix for each bootstrapped sample. To create each imputed dataset, the algorithm randomly selects one set of parameter estimates from the bootstrapped samples and uses these estimates to impute the missing values.</p>
<p>Another group of imputation algorithms are commonly known as Fully Conditional Specification (FCS; a.k.a., MI by chained equations or MICE; <xref ref-type="bibr" rid="ref65">van Buuren et al., 2006</xref>; <xref ref-type="bibr" rid="ref66">van Buuren and Groothuis-Oudshoorn, 2011</xref>), in which imputation is conducted on a variable-by-variable basis, conditional on all other variables in the dataset. This process is repeated iteratively until missing values for all variables are filled in. The entire procedure is then repeated multiple times to generate <italic>m</italic> imputed datasets. The MICE process can adapt flexibly to accommodate specific characteristics of different incomplete variables.</p>
</sec>
<sec id="sec5">
<label>3.2</label>
<title>Imputation models</title>
<p>Imputation models refer to the statistical models used to estimate the missing values in a dataset. For example, EMB fills missing data through random draws from a multivariate normal distribution using estimated parameters, while FCS imputes missing values using a series of univariate conditional models, each based on the distribution appropriate for the variable being imputed, such as linear regression with normal residuals assumed. In the context of LGCM, data should be organized in the wide format, where the repeated measure at <italic>j</italic><sup>th</sup> measurement occasion is stored as an individual variable (<inline-formula>
<mml:math id="M17">
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>) in the dataset. If one chooses to maintain this wide data structure during imputation, either standard EMB or FCS can be performed, depending on the chosen distribution model, i.e., multivariate normal distribution for EMB or models under univariate normal distributions for FCS. Imputation using EMB can be implemented through R package Amelia (<xref ref-type="bibr" rid="ref26">Honaker et al., 2011</xref>). R package mice (<xref ref-type="bibr" rid="ref65">van Buuren and Groothuis-Oudshoorn, 2011</xref>) or the software Blimp (<xref ref-type="bibr" rid="ref34">Keller and Enders, 2023</xref>) can be used for FCS imputation. In this article, we refer to the imputation strategy that preserves the wide format of data as the wide-format imputation.</p>
<p>In contrast, to account for the dependency of repeated measures within individuals in longitudinal studies, various multilevel imputation approaches, built on different multilevel imputation models, have developed over time and recently gained significant attention in methodological research (e.g., <xref ref-type="bibr" rid="ref002">Audigier and Resche-Rigon, 2018</xref>; <xref ref-type="bibr" rid="ref9">Carpenter et al., 2011</xref>; <xref ref-type="bibr" rid="ref17">Enders et al., 2020</xref>; <xref ref-type="bibr" rid="ref45">Quartagno and Carpenter, 2016</xref>, <xref ref-type="bibr" rid="ref46">2019</xref>; <xref ref-type="bibr" rid="ref51">Resche-Rigon and White, 2018</xref>; <xref ref-type="bibr" rid="ref71">Zhao and Schafer, 2015</xref>). We refer to these types of imputation strategies as the <italic>long-format</italic> imputation, as they impute data while stacking the lower-level records for each upper-level unit, and account for the multilevel nature of data through a restricted model. <xref ref-type="bibr" rid="ref23">Grund et al. (2018)</xref> systematically evaluated several long-format MI approaches that account for clustering data structure (but not necessarily longitudinal data) within multilevel modeling frameworks. Their evaluation compared multivariate-based and FCS imputation methods while varying analysis model complexity, including the incorporation of random effects and nonlinear terms. Based on their simulation results, long-format multilevel MI was recommended in the majority of scenarios. In contrast, <xref ref-type="bibr" rid="ref28">Huque et al. (2018)</xref> compared a broader range of wide-format and long-format imputation methods (implemented in a broader range of software packages) in longitudinal linear regression models, including a panel model and a multilevel random-intercept model. They found that the wide-format MI approaches outperformed the long-format approaches the models examined. <xref ref-type="bibr" rid="ref003">Ender (2022)</xref> demonstrated both wide-format and long-format imputation strategies with a single sample using the Blimp software (<xref ref-type="bibr" rid="ref34">Keller and Enders, 2023</xref>) in comparison with FIML. It shows that the parameter estimates of a latent growth curve model from wide-format imputation is generally comparable but a bit &#x201C;nosier&#x201D; than the other two methods.</p>
<p>The contradictory recommendations from <xref ref-type="bibr" rid="ref23">Grund et al. (2018)</xref> and <xref ref-type="bibr" rid="ref28">Huque et al. (2018)</xref> regarding the performance of wide-format versus long-format imputation methods likely arise from differences in their modeling frameworks. A possible explanation of the discrepancies could be that <xref ref-type="bibr" rid="ref23">Grund et al. (2018)</xref> focused on clustered data scenarios with complex multilevel analysis models that included random slopes, nonlinear effects, and cross-level interactions, where long-format multilevel MI better matched the analysis model&#x2019;s clustered structure and thus enhanced estimation in variance components and interaction estimates. In contrast, <xref ref-type="bibr" rid="ref28">Huque et al. (2018)</xref> examined longitudinal designs with simpler analyses, such as linear mixed models with random intercepts only or panel regression, where wide-format methods more flexibly captured unstructured correlations without the risk of overparameterization in multilevel imputation, leading to better or comparable performance in bias and coverage. This context-dependence underscores that neither wide-format nor long-format imputation is universally superior. Instead, the optimal choice of imputation method should be guided primarily by the degree of congeniality (alignment) between the imputation model and the target analysis model, as well as by the specific characteristics of the data and analysis.</p>
<p>Inspired by the <xref ref-type="bibr" rid="ref18">Enders&#x2019; (2018)</xref> non-simulation-based comparison within the LGCM framework and the recent software development (such as Blimp; (<xref ref-type="bibr" rid="ref34">Keller and Enders, 2023</xref>), the <italic>primary objective</italic> of this article is to systematically investigate the relative performance of wide-format versus long-format imputation methods in the context of LGCM, where the target analysis inherently requires the data to be structured in wide format. Technically, MI in long-format for a LGCM requires data transformation from wide to long formats prior to imputation, and back-transformation for performing a LGCM subsequently. Given that model fit evaluation is a critical component of LGCM, as in other latent variable models, we also assessed the performance of these approaches in estimating the LRT statistic, in addition to their accuracy and precision in estimating model parameters.</p>
</sec>
<sec id="sec6">
<label>3.3</label>
<title>Pooling strategies</title>
<p>Regardless of the imputation methods, after the imputation and analysis steps, the results obtained from each of imputed datasets need to be pooled together. It is straight forward to pool the parameter estimates and their standard errors (<xref ref-type="bibr" rid="ref54">Rubin, 1987</xref>). A final parameter estimate is simply the arithmetic mean of parameter estimates across imputed datasets. The pooled standard error of a parameter estimate (<inline-formula>
<mml:math id="M18">
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mtext mathvariant="italic">pooled</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula>, <xref ref-type="disp-formula" rid="E6">Equation 3</xref>) can be written as a function of within-imputation variance (<inline-formula>
<mml:math id="M19">
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>W</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>) and between-imputation variance (<inline-formula>
<mml:math id="M20">
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>B</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>) with <italic>m</italic> imputed datasets.</p>
<disp-formula id="E4">
<mml:math id="M21">
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>B</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfrac>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>&#x03B8;</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>,</mml:mo>
</mml:math>
</disp-formula>
<disp-formula id="E5">
<mml:math id="M22">
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>W</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>m</mml:mi>
</mml:mfrac>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:msubsup>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
</mml:math>
</disp-formula>
<disp-formula id="E6">
<mml:math id="M23">
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mtext mathvariant="italic">pooled</mml:mtext>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>W</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>B</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mfrac>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>B</mml:mi>
</mml:msub>
<mml:mi>m</mml:mi>
</mml:mfrac>
<mml:mo>.</mml:mo>
</mml:math>
<label>(3)</label>
</disp-formula>
<p>Pooling the LRT statistic statistics across imputed datasets, however, is a more intricate process. <xref ref-type="bibr" rid="ref37">Li et al. (1991)</xref> proposed an approach that pools <italic>m</italic> Wald test statistics to generate a final significance test statistic, which is referred to as the D<sub>2</sub> approach in the missing data analysis literature (<xref ref-type="bibr" rid="ref15">Enders, 2011</xref>). Although developed on a basis of the Wald test statistic, D<sub>2</sub> can be applied to LRT, which is asymptotically equivalent to a Wald test (<xref ref-type="bibr" rid="ref8">Buse, 1982</xref>). Let <inline-formula>
<mml:math id="M24">
<mml:msub>
<mml:mover accent="true">
<mml:mi>T</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mi>W</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> represents the average of <italic>m</italic> Wald test statistics, and the D<sub>2</sub> statistic can be defined as:</p>
<disp-formula id="E7">
<mml:math id="M25">
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mover accent="true">
<mml:mi>T</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mi>W</mml:mi>
</mml:msub>
<mml:mspace width="0.33em"/>
<mml:msup>
<mml:mi>k</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2212;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>m</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>m</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mi mathvariant="italic">ARI</mml:mi>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>+</mml:mo>
<mml:mi mathvariant="italic">ARI</mml:mi>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:math>
</disp-formula>
<p>where <italic>k</italic> is the degree of freedom of LRT (i.e., the difference in the number of free parameters between the hypothesized and the saturated models); and <inline-formula>
<mml:math id="M26">
<mml:mi mathvariant="italic">ARI</mml:mi>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:math>
</inline-formula> is an estimate of the average relative increase in variance due to missing data. The D<sub>2</sub> approach can pool LRT statistics from <italic>m</italic> imputed datasets (<xref ref-type="bibr" rid="ref33">Jorgensen and Rosseel, 2025</xref>) and approximates an <italic>F</italic> distribution across these datasets for significance testing.</p>
<p>The D<sub>3</sub> statistic, developed by <xref ref-type="bibr" rid="ref41">Meng and Rubin (1992)</xref>, involves three steps. First, it averages the LRT statistics from <italic>m</italic> imputed datasets to obtain <inline-formula>
<mml:math id="M27">
<mml:msub>
<mml:mover accent="true">
<mml:mi>T</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mi mathvariant="italic">LR</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>.</p>
<disp-formula id="E8">
<mml:math id="M28">
<mml:msub>
<mml:mover accent="true">
<mml:mi>T</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mi mathvariant="italic">LR</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>m</mml:mi>
</mml:mfrac>
<mml:mspace width="0.33em"/>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:munderover>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
</mml:math>
<label>(4)</label>
</disp-formula>
<p>where the LRT statistics (<inline-formula>
<mml:math id="M29">
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> is the same as in <xref ref-type="disp-formula" rid="E3">Equation 2</xref> for the <italic>i</italic><sup>th</sup> imputed dataset. Second, the analysis model is fit to each imputed dataset with the parameters fixed at the pooled values, and the average LRT statistic (<inline-formula>
<mml:math id="M30">
<mml:msub>
<mml:mover accent="true">
<mml:mi>T</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mtext mathvariant="italic">Constrianed</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula>) is computed in the same way as in <xref ref-type="disp-formula" rid="E8">Equation 4</xref>. The final step is to calculate the pooled likelihood ratio test statistics as follows:</p>
<disp-formula id="E9">
<mml:math id="M31">
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:msub>
<mml:mover accent="true">
<mml:mi>T</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mtext mathvariant="italic">Constrianed</mml:mtext>
</mml:msub>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>+</mml:mo>
<mml:mi mathvariant="italic">ARI</mml:mi>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M32">
<mml:mi mathvariant="italic">ARI</mml:mi>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:math>
</inline-formula> is also an estimate of the average relative increase in variance due to missing data, which is a function of <inline-formula>
<mml:math id="M33">
<mml:msub>
<mml:mover accent="true">
<mml:mi>T</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mi mathvariant="italic">LR</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math id="M34">
<mml:msub>
<mml:mover accent="true">
<mml:mi>T</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mtext mathvariant="italic">Constrianed</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula> and <italic>m</italic>.</p>
<p>The D<sub>4</sub> approach represents the most recent advancement in the field of test statistic pooling strategies (<xref ref-type="bibr" rid="ref10">Chan and Meng, 2022</xref>; <xref ref-type="bibr" rid="ref25">Grund et al., 2023</xref>). This approach first stacks all the imputed dataset on top of one another and then fit the analysis model to the &#x201C;stacked&#x201D; data to obtain the likelihood ratio test statistic (<inline-formula>
<mml:math id="M35">
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mtext mathvariant="italic">stacked</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula>) as described in <xref ref-type="disp-formula" rid="E2">Equation 1</xref>. The D<sub>4</sub> statistic can be written as follows:</p>
<disp-formula id="E10">
<mml:math id="M36">
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mn>4</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:msub>
<mml:mover accent="true">
<mml:mover accent="true">
<mml:mi>T</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mtext mathvariant="italic">Stacked</mml:mtext>
</mml:msub>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo stretchy="true">[</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>+</mml:mo>
<mml:mo>max</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi mathvariant="italic">ARI</mml:mi>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mn>4</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">]</mml:mo>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M37">
<mml:msub>
<mml:mover accent="true">
<mml:mi>T</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mtext mathvariant="italic">Stacked</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula> is computed as <inline-formula>
<mml:math id="M38">
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mtext mathvariant="italic">stacked</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula> divided by <italic>m</italic>; and <inline-formula>
<mml:math id="M39">
<mml:mi mathvariant="italic">ARI</mml:mi>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mn>4</mml:mn>
</mml:msub>
</mml:math>
</inline-formula> is another estimate of the average relative increase in variance.</p>
<p>The methodological research on these pooling strategies remains limited. Liu and Sriutaisuk (<xref ref-type="bibr" rid="ref39">Liu and Sriutaisuk, 2020</xref>) only focused on performance of D<sub>2</sub> with ordinal items in the confirmatory factor analysis. <xref ref-type="bibr" rid="ref18">Enders and Mansolf (2018)</xref> revealed that D<sub>3</sub> was comparable to FIML in estimating LRT statistic in a structural equation model. In the meanwhile, D<sub>3</sub> was criticized for its failure to remain invariant under equivalent parameterizations of the same model and for its inability to ensure a non-negative value (<xref ref-type="bibr" rid="ref10">Chan and Meng, 2022</xref>; <xref ref-type="bibr" rid="ref18">Enders and Mansolf, 2018</xref>). <xref ref-type="bibr" rid="ref10">Chan and Meng (2022)</xref> claimed that D<sub>4</sub> could perform at lease as well as D<sub>3</sub>, as it is invariant to re-parameterization and is assured to have a non-negative value. It was also expected to be more computationally efficient as it does not involve re-evaluating the likelihood function as D<sub>3</sub> does. Less research has focused this most recently proposed pooling strategy, D<sub>4</sub>. So far, none of these pooling strategies, a critical component of MI for latent variable models, have been evaluated in the LGCM framework. Therefore, the <italic>secondary objective</italic> of this article is to evaluate the performance of these pooling strategies when preforming various MI approaches in the LGCM.</p>
</sec>
</sec>
<sec id="sec7">
<label>4</label>
<title>Simulation</title>
<sec id="sec8">
<label>4.1</label>
<title>Design</title>
<p>We conducted three simulation studies to evaluate the performance of various imputation and pooling strategies within the LGCM framework, with FIML serving as the reference method. Although MI&#x2019;s practical advantages commonly arise in contexts where FIML is not feasible (e.g., large number of auxiliary variables, complex models, or non-normal data), we deliberately examined conditions where both methods are practically feasible and directly comparable. Because understanding MI&#x2019;s performance in these scenarios could provide critical insight into its potential benefits in more complex situations where FIML may be impractical or unavailable. In Study 1, data were generated using a linear latent curve growth model with 7 measurement occasions (see <xref ref-type="fig" rid="fig1">Figure 1A</xref>), with population parameters slightly adjusted from those in <xref ref-type="bibr" rid="ref4">Biesanz et al. (2004)</xref>. The analysis model used was the same as the generation model. Five missing data techniques were evaluated in this study:<list list-type="order">
<list-item>
<p>FIML;</p>
</list-item>
<list-item>
<p>MI-wEMB (MI with <italic>w</italic>ide-format data through EMB);</p>
</list-item>
<list-item>
<p>MI-wFCS (MI with <italic>w</italic>ide-format data through FCS);</p>
</list-item>
<list-item>
<p>MI-llMLM (MI with <italic>l</italic>ong-format data and <italic>l</italic>inear <italic>M</italic>ulti<italic>L</italic>evel imputation <italic>M</italic>odel);</p>
</list-item>
<list-item>
<p>MI-lqMLM (MI with <italic>l</italic>ong-format data and <italic>q</italic>uadratic <italic>M</italic>ulti<italic>L</italic>evel imputation <italic>M</italic>odel).</p>
</list-item>
</list></p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Population models: <bold>(A)</bold> linear latent curve growth model; <bold>(B)</bold> quadratic latent curve growth model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Path diagrams A and B show structural equation models. Diagram A has two latent variables, while B has three, each connected to the observed variables with multiple pathways (loadings) and labeled parameter values for means, variances, and covariances.</alt-text>
</graphic>
</fig>
<p>MI-wEMB refers to the wide-format EMB imputation implemented using the R package Amelia (<xref ref-type="bibr" rid="ref26">Honaker et al., 2011</xref>), which assumes a multivariate normal distribution and imputes missing data through the EMB algorithm. MI-wFCS is also a wide-format imputation method; however, it employs a fully conditional specification (FCS) algorithm that imputes missing values on a variable-by-variable basis. MI-wFCS in the present simulation was conducted using Blimp (<xref ref-type="bibr" rid="ref34">Keller and Enders, 2023</xref>), which employs the Bayesian FCS algorithm (10,000 iterations with 5,000 burn-ins), and imputes missing data through a round-robin sequence of regression models. Both MI-llMLM and MI-lqMLM are long-format imputation methods implemented in Blimp (<xref ref-type="bibr" rid="ref34">Keller and Enders, 2023</xref>) that employ fully Bayesian JM algorithm (10,000 iterations with 5,000 burn-ins), and explicitly account for the multilevel structure of the data. MI-llMLM was selected to align with the linear multilevel analysis model. MI-lqMLM was included to represent a scenario in which researchers apply a more complex imputation model (e.g., quadratic) before fitting a simpler nested analysis model (e.g., linear) when there is uncertainty about the functional form of the trajectory, as recommended by <xref ref-type="bibr" rid="ref18">Enders (2018)</xref>. In Blimp, missing values were imputed using a model-based approach, whereby a multilevel growth curve model (linear or quadratic, with random slopes) was specified as the imputation model. For all imputation methods, 100 imputed datasets were generated.</p>
<p>In Study 2 we used a quadratic latent curve growth model with 7 measurement occasions (see <xref ref-type="fig" rid="fig1">Figure 1B</xref>) for data generation, with adapted population values from <xref ref-type="bibr" rid="ref68">Wu and West (2010)</xref>. The analysis model was the same as the generation model. Four missing data techniques were examined: FIML, MI-wEMB, MI-wFCS, and MI-lqMLM.</p>
<p>Study 3 mirrored the Study 2 in terms of data generation and missing data handling approaches. However, this study employed a slightly misspecified analysis model, in which the covariance between the intercept and quadratic slope was incorrectly fixed at zero. For all MI methods in the three studies, the parameter estimates, and standard errors were pooled following the <xref ref-type="bibr" rid="ref54">Rubin&#x2019;s (1987)</xref> Rules; while the test statistics were pooled using the three aforementioned strategies: D<sub>2</sub>, D<sub>3</sub>, and D<sub>4</sub>. The inclusion of model misspecification was theoretically and practically motivated. From a theoretical perspective, missing data handling represents only one component of the overall LGCM analysis process, and its performance should be evaluated not only under ideal conditions but also when the analysis model deviates from the true population model. Methodological research in latent variable modeling commonly investigates inferential behavior under model misspecification in order to assess the robustness of estimation and hypothesis testing procedures. From a practical perspective, researchers rarely know the true model and must draw substantive conclusions under some degree of misspecification. Accordingly, Study 3 was designed to evaluate how different multiple imputation and pooling methods influence the inferential performance of the LRT statistic, specifically its statistical power, under various conditions.</p>
<p><xref ref-type="table" rid="tab1">Table 1</xref> reported the parameter values in the three population models. For all studies, we chose <italic>N</italic>&#x202F;=&#x202F;150, 300, and 600 to represent small, medium, and large sample sizes, respectively. Missing data were introduced based on MCAR and MAR with two levels of missing data proportions. The expected missing data proportion for each measurement occasion (<italic>j</italic>) was determined following either of the two linear functions:</p>
<disp-formula id="E11">
<mml:math id="M40">
<mml:mi>m</mml:mi>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mtext>samll</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>.075</mml:mn>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>,</mml:mo>
</mml:math>
</disp-formula>
<disp-formula id="E12">
<mml:math id="M41">
<mml:mi>m</mml:mi>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mtext>large</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>.175</mml:mn>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>,</mml:mo>
</mml:math>
</disp-formula>
<p>where <italic>j</italic>&#x202F;=&#x202F;1, 2, &#x2026;, 7. Therefore, the proportions on the seven time points were (0, 0.05, 0.1, 0.15, 0.2, 0.25, 0.3) for small missing proportions, and (0, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7) for large missing proportions. The probability of each value (i.e., the <italic>i</italic><sup>th</sup> individual at <italic>j</italic><sup>th</sup> occasion) being missing is determined using logistic regression. Specifically,</p>
<disp-formula id="E13">
<mml:math id="M42">
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:msup>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mspace width="0.33em"/>
<mml:mi mathvariant="normal">j</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msup>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>+</mml:mo>
<mml:msup>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:math>
<label>(5)</label>
</disp-formula>
<p>where <italic>j</italic>&#x202F;=&#x202F;2, &#x2026;, 7; and b<sub>0</sub> varied to achieve the target expected missing data proportion. For MCAR, <italic>b</italic><sub>1</sub> was set at 0, indicating the missing data are not determined by any variable. For MAR, <italic>b</italic><sub>1</sub> was set at 0.4, defining the effect of <inline-formula>
<mml:math id="M43">
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> on log-odds ratio of missingness on <inline-formula>
<mml:math id="M44">
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> (<xref ref-type="bibr" rid="ref18">Enders and Mansolf, 2018</xref>).</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Parameter values in population models.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Parameter</th>
<th align="center" valign="top">Study 1</th>
<th align="center" valign="top">Study 2</th>
<th align="center" valign="top">Study 3</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Mean of intercept</td>
<td align="char" valign="middle" char=".">39.457</td>
<td align="center" valign="middle">1</td>
<td align="center" valign="middle">1</td>
</tr>
<tr>
<td align="left" valign="middle">Mean of linear slope</td>
<td align="char" valign="middle" char=".">8.063</td>
<td align="center" valign="middle">0.3</td>
<td align="center" valign="middle">0.3</td>
</tr>
<tr>
<td align="left" valign="middle">Mean of quadratic slope</td>
<td/>
<td align="center" valign="middle">0.5</td>
<td align="center" valign="middle">0.5</td>
</tr>
<tr>
<td align="left" valign="middle">Variance of intercept</td>
<td align="char" valign="middle" char=".">28.776</td>
<td align="center" valign="middle">3</td>
<td align="center" valign="middle">3</td>
</tr>
<tr>
<td align="left" valign="middle">Variance of linear slope</td>
<td align="char" valign="middle" char=".">8.201</td>
<td align="center" valign="middle">0.3</td>
<td align="center" valign="middle">0.3</td>
</tr>
<tr>
<td align="left" valign="middle">Variance of quadratic slope</td>
<td/>
<td align="center" valign="middle">0.3</td>
<td align="center" valign="middle">0.3</td>
</tr>
<tr>
<td align="left" valign="middle">Covariance of intercept and linear slope</td>
<td align="char" valign="middle" char=".">1.56</td>
<td align="center" valign="middle">0.3</td>
<td align="center" valign="middle">0.3</td>
</tr>
<tr>
<td align="left" valign="middle">Covariance of intercept and quadratic slope</td>
<td/>
<td align="center" valign="middle">0.3</td>
<td align="center" valign="middle">0.3</td>
</tr>
<tr>
<td align="left" valign="middle">Covariance of linear slope and quadratic slope</td>
<td/>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In each study, we fully-crossed these factor levels, and for each condition, the performance of each method was evaluated by aggregating results across 500 replications. Data generation and analysis, including FIML, was conducted using the lavaan package (<xref ref-type="bibr" rid="ref53">Rosseel, 2012</xref>) in R (<xref ref-type="bibr" rid="ref49">R core team, 2021</xref>). R package lavaan.mi (<xref ref-type="bibr" rid="ref33">Jorgensen and Rosseel, 2025</xref>) was used for pooling the results.</p>
</sec>
<sec id="sec9">
<label>4.2</label>
<title>Outcome measures</title>
<sec id="sec10">
<label>4.2.1</label>
<title>Bias</title>
<p>We assessed standardized bias for each parameter estimate in the correct model only. This measure is calculated by taking the difference between the estimated value and the population value and dividing it by the standard deviation of the estimated values across replications. In accordance with <xref ref-type="bibr" rid="ref12">Collins et al. (2001)</xref>, we deemed a standardized bias acceptable when it falls below 0.4.</p>
</sec>
<sec id="sec11">
<label>4.2.2</label>
<title>MSE</title>
<p>Mean squared error (MSE) measures the average squared difference between the estimated value and the population value, providing a quantitative assessment of both the accuracy and precision of a missing data method.</p>
</sec>
<sec id="sec12">
<label>4.2.3</label>
<title>CIC</title>
<p>The 95% confidence interval coverage (CIC) is a proportion of replications, in which the 95% confidence intervals of a certain parameter contain the true population value. CIC is also an valuable tool for evaluating both the accuracy and precision of a quantitative method. A 95% CIC value are usually expected to be higher than 0.90. Following <xref ref-type="bibr" rid="ref7">Bradley&#x2019;s (1978)</xref> &#x201C;liberal criterion,&#x201D; we considered a CIC &#x201C;acceptable&#x201D; if it fell between 0.925 and 0.975.</p>
</sec>
<sec id="sec13">
<label>4.2.4</label>
<title>Type I error rate and power</title>
<p>We finally computed the proportion of replications with a significant LRT statistic (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05) as the Type I error rate in Studies 1 and 2. Because in Studies 1 and 2, the analysis models are correctly specified to match the population model, and therefore the proportion of significant LRT statistic is the estimate of Type I error rate. We considered the Type I error rate to be &#x201C;accurate&#x201D; if it was between 0.025 and 0.075 (<xref ref-type="bibr" rid="ref7">Bradley, 1978</xref>). In contrast, Study 3 introduced model misspecification by constraining the covariance between the intercept and quadratic slope to zero despite a nonzero population value; under this condition, the proportion of significate LRT statistics reflects the statistical power to detect this misspecification.</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="sec14">
<label>5</label>
<title>Results</title>
<sec id="sec15">
<label>5.1</label>
<title>Study 1</title>
<sec id="sec16">
<label>5.1.1</label>
<title>Parameter estimates</title>
<p>In each condition, we computed standardized biases, MSEs and CICs of parameters for the latent intercept and slope, including means, variances and covariance. <xref ref-type="fig" rid="fig2">Figures 2</xref>, <xref ref-type="fig" rid="fig3">3</xref> show that all methods produced unbiased parameter estimates, especially for the means of the latent factors, regardless of sample size, missing data proportion and mechanism. Comparing among the methods, FIML and MI-llMLM produced most accurate parameter estimates for the variances and covariance.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Study 1 results: standardized biases from missing data approaches for the latent means in the linear model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel chart displaying standardized bias of means for intercept and slope in Study 1 across sample sizes and missing data proportions for five methods (FIML, MI-wEMB, MI-wFCS, MI-llMLM, MI-lqMLM) under MCAR and MAR. Red dotted lines mark bias thresholds.</alt-text>
</graphic>
</fig>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Study 1 results: standardized biases from missing data approaches for the latent variances and covariance in the linear model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel chart displaying standardized bias of variances and covariance for intercept and slope in Study 1 across sample sizes and missing data proportions for five methods (FIML, MI-wEMB, MI-wFCS, MI-llMLM, MI-lqMLM) under MCAR and MAR. Red dotted lines mark bias thresholds.</alt-text>
</graphic>
</fig>
<p>We found that all methods produced comparable MSEs.<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref> Sample size had a greater impact on the mean and variance of the latent intercept than other parameters. Other factors did not show a noticeable impact on MSE. All CICs are generally within the acceptable range (i.e., &#x003E;0.90). We found that FIML could stably produce accurate confidence intervals across all conditions for all parameter types (<xref ref-type="fig" rid="fig4">Figures 4</xref>, <xref ref-type="fig" rid="fig5">5</xref>). All MI methods produced generally accurate (i.e., between 0.925 and 0.975) CICs for the mean of latent slope (<xref ref-type="fig" rid="fig4">Figure 4</xref>), variance of latent intercept and covariance between intercept and slope (<xref ref-type="fig" rid="fig5">Figure 5</xref>). The CICs of the mean of intercept can be slightly larger than 0.975, for all MI methods under MAR with the larger missing data proportion (<xref ref-type="fig" rid="fig4">Figure 4</xref>). The CICs for variance of slope could be lower than 0.925 for MI-wEMB and MI-lqMLM, under MAR with the larger missing data proportion (<xref ref-type="fig" rid="fig5">Figure 5</xref>).</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Study 1 results: CICs from missing data approaches for the latent means in the linear model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g004.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel chart displaying confidence interval coverage (CIC) of means for intercept and slope in Study 1 across sample sizes and missing data proportions for five methods (FIML, MI-wEMB, MI-wFCS, MI-llMLM, MI-lqMLM) under MCAR and MAR. Red dotted lines mark "acceptable" CIC range.</alt-text>
</graphic>
</fig>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Study 1 results: CICs from missing data approaches for the latent variances and covariance in the linear model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g005.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel chart displaying confidence interval coverage (CIC) of variances and covariance for intercept and slope in Study 1 across sample sizes and missing data proportions for five methods (FIML, MI-wEMB, MI-wFCS, MI-llMLM, MI-lqMLM) under MCAR and MAR. Red dotted lines mark "acceptable" CIC range.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec17">
<label>5.1.2</label>
<title>Type I error rate</title>
<p><xref ref-type="fig" rid="fig6">Figure 6</xref> presents the Type I error rates for all approaches, including different pooling strategies. We found that the Type I error rates from FIML generally fell within the range of 0.025&#x2013;0.075. Comparing the two wide-format imputation methods, MI-wEMB and MI-wFCS, the Type I error rates of test statistics pooled using D<sub>2</sub>, D<sub>3</sub> and D<sub>4</sub> were mostly within the acceptable range of 0.025&#x2013;0.075 or hovered around its edges. MI-wEMB was more sensitive to conditions where the sample size was small (<italic>N</italic>&#x202F;=&#x202F;150) and the proportion of missing data was large, whereas MI-wFCS demonstrated greater robustness in these challenging scenarios. The relative performance of the three pooling strategies was less clear. However, generally speaking, under MCAR conditions and with the two wide-format imputation methods, D<sub>2</sub> tended to produce slightly higher Type I error rates compared to D<sub>3</sub> and D<sub>4</sub>. Under MAR, D<sub>2</sub> tended to generate slightly smaller Type I error rates than D<sub>3</sub> and D<sub>4</sub>. Interesting but unsurprisingly, the two long-format imputation approaches, MI-llMLM and MI-lqMLM both yielded 0 Type I error rate, regardless of pooling approaches and design factors. This demonstrates a potential limitation of this imputation strategy in LGCM, which pre-assumes the shape of trajectory during imputation.</p>
<fig position="float" id="fig6">
<label>Figure 6</label>
<caption>
<p>Study 1 results: type I error rates from missing data approaches for the linear model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g006.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel chart displaying Type I error rates in Study 1 for different strategies (D2, D3, D4, Direct FIML) across methods (FIML, MI-wEMB, MI-wFCS, MI-llMLM, MI-lqMLM) under MCAR and MAR, across sample sizes and missing data proportions. Red dotted lines mark "accurate" range of Type I error rate.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec id="sec18">
<label>5.2</label>
<title>Study 2</title>
<sec id="sec19">
<label>5.2.1</label>
<title>Parameter estimates</title>
<p>In this study we focus on a latent quadratic growth model. Similar to the findings from Study 1, the standardized biases from all methods fell within the acceptable range (i.e., &#x003E; &#x2212;0.4 and &#x003C;0.4), except that for MI-wFCS the linear slope variance exceeded this range when the proportion of missing data was large. Overall, FIML and MI-lqMLM produced the most accurate parameter estimates. The MSEs from all methods were comparable across all conditions. A common pattern observed across methods was that when the sample size was small (<italic>N</italic>&#x202F;=&#x202F;150), the MSEs for intercept variance were substantially larger than those for other parameters. The CICs were generally within the acceptable range (i.e., &#x003E;0.90), with FIML yielding the most accurate CICs for nearly all parameters under most conditions. However, for MI-wEMB and MI-lqMLM, CICs associated with the latent linear slope (mean, variance, covariances) were heavily impacted by the proportion of missing data or missing data mechanism (see <xref ref-type="fig" rid="fig7">Figures 7</xref>&#x2013;<xref ref-type="fig" rid="fig9">9</xref>). Specifically, for these methods, the CICs for the mean of the linear slope dropped below 0.925 or even below 0.90, under a larger proportion of MAR (<xref ref-type="fig" rid="fig7">Figure 7</xref>). The CICs for the variance of the linear slope were even lower for MI-wEMB (<xref ref-type="fig" rid="fig8">Figure 8</xref>). Additionally, for MI-wEMB and MI-lqMLM, overly small CICs were observed for covariances between the linear slope and both the intercept and quadratic slopes under a larger proportion of MAR (<xref ref-type="fig" rid="fig9">Figure 9</xref>). In contrast, MI-wFCS tended to generate higher CICs (&#x003E;0.975) for parameters associated with the intercept and quadratic slopes.</p>
<fig position="float" id="fig7">
<label>Figure 7</label>
<caption>
<p>Study 2 results: CICs from missing data approaches for the latent means of in the quadratic model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g007.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Grouped line graphs compare CIC of means in Study 2 by method (FIML, MI-wEMB, MI-wFCS, MI-IMLM), missing data mechanism (MCAR, MAR), sample size, and missing data proportion. Triangle, square, and plus symbols represent mean of intercept, linear, and quadratic slopes, respectively. Under both MCAR and MAR, mean of intercept is generally high across panels, while means of linear and quadratic slopes vary more, especially at high missing data proportions and small sample size. Red dotted lines indicate reference values at 0.95 and 1.00. Legend identifies symbol meanings.</alt-text>
</graphic>
</fig>
<fig position="float" id="fig8">
<label>Figure 8</label>
<caption>
<p>Study 2 results: CICs from missing data approaches for the latent variances of in the quadratic model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g008.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Grouped dot plot comparing CIC of variances for intercept, linear slope, and quadratic slope (displayed as triangles, squares, and plus symbols) under MCAR and MAR conditions across FIML, MI-wEMB, MI-wFCS, and MI-MMM methods, with different sample sizes and missing data proportions on the x-axis and a vertical range from zero point eight five to one on the y-axis; parameter legend is present on the right.</alt-text>
</graphic>
</fig>
<fig position="float" id="fig9">
<label>Figure 9</label>
<caption>
<p>Study 2 results: CICs from missing data approaches for the latent covariances of in the quadratic model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g009.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Scatterplot matrix with twelve panels comparing CIC of covariances in Study 2 under MCAR and MAR missing data mechanisms, with FIML, MI-wEMB, MI-wFCS, and MI-0MIMI methods. X-axis shows sample size and missing data proportion; Y-axis shows CIC values from 0.85 to 1.00. Different shapes represent three types of covariance parameters: intercept-linear (triangle), intercept-quadratic (square), and linear-quadratic (plus sign). Data points cluster near CIC of 0.95, with visual grouping by method and condition. Legend and gridlines aid panel interpretation.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec20">
<label>5.2.2</label>
<title>Type I error rate</title>
<p>With the correctly specified analysis model, the Type I error rates for all methods remained &#x003C;0.10. However, different patterns were observed (see <xref ref-type="fig" rid="fig10">Figure 10</xref>). FIML yielded the most accurate Type I error rates. Comparing between the two wide-format MI methods, MI-wEMB and MI-wFCS, the Type I error rates for test statistics pooled using D<sub>2</sub>, D<sub>3</sub> and D<sub>4</sub> fell within 0.025&#x2013;0.075 or hovered around the edges, with only a few exceptions, particularly in cases with a large proportion of missing data. Similar to Study 1, the long-format MI method, MI-lqMLM, constantly produced Type I error rates of 0, regardless of pooling strategies or design factors.</p>
<fig position="float" id="fig10">
<label>Figure 10</label>
<caption>
<p>Study 2 results: type I error rates from missing data approaches for the quadratic model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g010.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Grid of scatter plots comparing Type I error rates by strategy under different conditions, with columns for missing data mechanisms (MCAR, MAR) and rows for analysis methods (FIML, MI-wEMB, MI-wFCS, MI-wMIM). Error rates are plotted for strategies D2, D3, D4, and Direct across varying sample sizes and proportions of missing data. Red and blue dashed lines indicate reference thresholds. Direct strategy shows higher error rates with FIML, while differences between strategies and methods emerge under MI conditions. Legend at right distinguishes strategies with distinct symbols.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec id="sec21">
<label>5.3</label>
<title>Study 3</title>
<sec id="sec22">
<label>5.3.1</label>
<title>Power</title>
<p>In Study 3, we examined the power of various test statistics in detecting model misspecification under MAR. <xref ref-type="fig" rid="fig11">Figure 11</xref> presents the power values from the D<sub>2</sub> pooling strategy for three MI approaches (i.e., MI-wEMB, MI-wFCS and MI-lqMLM), compared to those from FIML. We found that FIML exhibited the highest power with the large proportion of missing data, followed by MI-wEMB, MI-wFCS and MI-lqMLM. The impact of sample size was also noticeable. Generally, for the same proportion of missing data, power increased as sample size grew. As sample size increased, power difference among FIML and MI approaches diminished significantly. <xref ref-type="fig" rid="fig12">Figure 12</xref> presents a similar comparison using the D<sub>4</sub> pooling strategy with FIML. While D<sub>4</sub> tended to be more vulnerable to smaller sample sizes, it exhibited the same pattern observed with D<sub>2</sub>. Furthermore, with larger sample sizes, the power values for D<sub>2</sub> and D<sub>4</sub> converged. Power values from D<sub>3</sub> were nearly identical to those with D<sub>4</sub>.</p>
<fig position="float" id="fig11">
<label>Figure 11</label>
<caption>
<p>Study 3 results: power of D<sub>2</sub> test statistic comparing with FIML in detecting misspecification in quadratic model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g011.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Scatter plot comparing power of four statistical methods&#x2014;FIML, MI-wEMB, MI-wFCS, and MI-lqMLM&#x2014;across combinations of sample size and missing data proportion, with power on the y-axis, sample conditions on the x-axis, and a reference line at 0.8.</alt-text>
</graphic>
</fig>
<fig position="float" id="fig12">
<label>Figure 12</label>
<caption>
<p>Study 3 results: power of D<sub>4</sub> test statistic comparing with FIML in detecting misspecification in quadratic model.</p>
</caption>
<graphic xlink:href="fpsyg-17-1614844-g012.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Scatter plot showing power values for four statistical methods across combinations of sample size and missing data proportion. FIML, MI-wEMB, MI-wFCS, and MI-lqMLM are represented by different markers. Power is plotted on the vertical axis from zero to one, with a red dotted line at approximately zero point eight indicating a reference threshold. Sample size and missing data proportion groups appear on the horizontal axis as 150_0.3, 150_0.7, 300_0.3, 300_0.7, 600_0.3, and 600_0.7.</alt-text>
</graphic>
</fig>
</sec>
</sec>
</sec>
<sec id="sec23">
<label>6</label>
<title>Empirical example</title>
<p>In this section, we applied the aforementioned imputation approaches and pooling strategies to a real-world data set for demonstration. The data were obtained from the Early Childhood Longitudinal Studies Program (ECLS-K: 2011 Kindergarten&#x2013;Fifth Grade; <xref ref-type="bibr" rid="ref42">Mulligan et al., 2019</xref>; <xref ref-type="bibr" rid="ref63">Tourangeau et al., 2019</xref>). This national data set contains multisource information that offers a broad and multifaceted view of young children&#x2019;s early childhood experiences at home and in school. The sample consists of children who either entered kindergarten for the first time or repeated kindergarten during the 2010&#x2013;11 school year. We selected data collected during the fall semesters from kindergarten through second grade, and the spring semester from second grade through third grade. Among all the outcome measures related to children&#x2019;s home and school experiences, our primary focus was on their trajectory of mathematics achievement. For demonstration purposes, we randomly selected 600 children who had complete data on their math item response theory (IRT) scores at all measurement points. We then imposed attrition under MAR at all time points except for the first one, following <xref ref-type="disp-formula" rid="E13">Equation 5</xref>, with b<sub>1</sub> set at 0.4, and missing data proportions of five measurement occasions set at (0, 0.12, 0.24. 0.30, 0.36), respectively. At each time point, the probability of a value being missing is impacted by the values observed at the immediately preceding time point. We fit a quadratic latent growth curve model to the data. Then we intended to center time around the middle point and wrote loading matrix (<inline-formula>
<mml:math id="M45">
<mml:mi>&#x039B;</mml:mi>
</mml:math>
</inline-formula>) as follows:</p>
<disp-formula id="E14">
<mml:math id="M46">
<mml:mi>&#x039B;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo>&#x2223;</mml:mo>
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.5</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mn>2.25</mml:mn>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>.5</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mn>.25</mml:mn>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mn>0.5</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mn>.25</mml:mn>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mn>1</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mn>2</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mn>4</mml:mn>
</mml:mtd>
</mml:mtr>
</mml:mtable>
<mml:mo>&#x2223;</mml:mo>
<mml:mo>,</mml:mo>
</mml:math>
</disp-formula>
<p>where the three columns represent the loadings for intercept, the liner slope and the quadratic slope, respectively. The analysis results are shown in the <xref ref-type="table" rid="tab2">Table 2</xref>. The parameter estimates obtained from all MI methods were comparable to those from FIML.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Results from empirical example: parameter estimate (standard error) and LRT statistic <inline-formula>
<mml:math id="M47">
<mml:msup>
<mml:mi>&#x03C7;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:math>
</inline-formula></p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Parameter</th>
<th align="center" valign="top">Type</th>
<th align="center" valign="top">FIML</th>
<th align="center" valign="top">MI-wEMB</th>
<th align="center" valign="top">MI-wFCS</th>
<th align="center" valign="top">MI-lqMLM</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" colspan="6">Mean</td>
</tr>
<tr>
<td rowspan="3"/>
<td align="center" valign="middle">Int.</td>
<td align="center" valign="middle">0.339 (0.017)</td>
<td align="center" valign="middle">0.382 (0.020)</td>
<td align="center" valign="middle">0.340 (0.021)</td>
<td align="center" valign="middle">0.346 (0.020)</td>
</tr>
<tr>
<td align="center" valign="middle">S1</td>
<td align="center" valign="middle">0.784 (0.006)</td>
<td align="center" valign="middle">0.783 (0.006)</td>
<td align="center" valign="middle">0.784 (0.006)</td>
<td align="center" valign="middle">0.784 (0.006)</td>
</tr>
<tr>
<td align="center" valign="middle">S2</td>
<td align="center" valign="middle">&#x2212;0.124 (0.003)</td>
<td align="center" valign="middle">&#x2212;0.124 (0.003)</td>
<td align="center" valign="middle">&#x2212;0.126 (0.003)</td>
<td align="center" valign="middle">&#x2212;0.126 (0.003)</td>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Variance</td>
</tr>
<tr>
<td rowspan="3"/>
<td align="center" valign="middle">Int.</td>
<td align="center" valign="middle">0.262 (0.014)</td>
<td align="center" valign="middle">0.261 (0.015)</td>
<td align="center" valign="middle">0.264 (0.015)</td>
<td align="center" valign="middle">0.264 (0.015)</td>
</tr>
<tr>
<td align="center" valign="middle">S1</td>
<td align="center" valign="middle">0.015 (0.002)</td>
<td align="center" valign="middle">0.015 (0.002)</td>
<td align="center" valign="middle">0.015 (0.002)</td>
<td align="center" valign="middle">0.015 (0.002)</td>
</tr>
<tr>
<td align="center" valign="middle">S2</td>
<td align="center" valign="middle">0.003 (0.001)</td>
<td align="center" valign="middle">0.003 (0.001)</td>
<td align="center" valign="middle">0.003 (0.001)</td>
<td align="center" valign="middle">0.003 (0.001)</td>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Covariance</td>
</tr>
<tr>
<td rowspan="3"/>
<td align="center" valign="middle">Int. with S1</td>
<td align="center" valign="middle">&#x2212;0.024 (0.003)</td>
<td align="center" valign="middle">&#x2212;0.028 (0.003)</td>
<td align="center" valign="middle">&#x2212;0.023 (0.003)</td>
<td align="center" valign="middle">&#x2212;0.024 (0.003)</td>
</tr>
<tr>
<td align="center" valign="middle">Int. with S2</td>
<td align="center" valign="middle">0.000 (0.002)</td>
<td align="center" valign="middle">0.000 (0.001)</td>
<td align="center" valign="middle">0.000 (0.002)</td>
<td align="center" valign="middle">0.001 (0.002)</td>
</tr>
<tr>
<td align="center" valign="middle">S1 with S2</td>
<td align="center" valign="middle">&#x2212;0.003 (0.001)</td>
<td align="center" valign="middle">&#x2212;0.004 (0.001)</td>
<td align="center" valign="middle">&#x2212;0.004 (0.001)</td>
<td align="center" valign="middle">&#x2212;0.004 (0.001)</td>
</tr>
<tr>
<td align="left" valign="middle"><inline-formula>
<mml:math id="M48">
<mml:msup>
<mml:mi>&#x03C7;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:math>
</inline-formula> (<italic>df</italic>&#x202F;=&#x202F;6)</td>
<td/>
<td align="center" valign="middle">131.090</td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td rowspan="3"/>
<td align="center" valign="middle">D<sub>2</sub></td>
<td rowspan="3"/>
<td align="center" valign="middle">131.304</td>
<td align="center" valign="middle">120.319</td>
<td align="center" valign="middle">75.281</td>
</tr>
<tr>
<td align="center" valign="middle">D<sub>3</sub></td>
<td align="center" valign="middle">125.178</td>
<td align="center" valign="middle">125.217</td>
<td align="center" valign="middle">70.161</td>
</tr>
<tr>
<td align="center" valign="middle">D<sub>4</sub></td>
<td align="center" valign="middle">125.177</td>
<td align="center" valign="middle">125.219</td>
<td align="center" valign="middle">70.161</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Int., intercept; S1, linear slope of first phase; S2, linear slope of second phase.</p>
</table-wrap-foot>
</table-wrap>
<p>In the empirical analysis, the LRT statistic evaluates the fit of the LGCM (null hypothesis) against the corresponding saturated model (alternative hypothesis). FIML yields the conventional model LRT statistic, whereas each multiple imputation method pools the LRT statistics generated from regular maximum likelihood across imputations using the D<sub>2</sub>, D<sub>3</sub>, and D<sub>4</sub> pooling procedures. The D<sub>2</sub> test statistics with MI-wEMB were most similar to that from FIML, while the D<sub>3</sub> and D<sub>4</sub> methods with MI-wEMB and all pooling methods with MI-wFCS yielded lower LRT statistics values. The lowest LRT statistic values were found from all pooling approaches with MI-lqMLM. These results were consistent with the simulation results from Study 2.</p>
</sec>
<sec sec-type="discussion" id="sec24">
<label>7</label>
<title>Discussion</title>
<p>The current study evaluated the efficacy of various MI approaches applied to wide- and long-format data in estimating parameters and assessing model fit in linear and quadratic latent growth curve models. Our aim was to offer researchers practical guidance for handling missing data within this specific modeling framework.</p>
<p>Our analysis revealed that, similar to FIML, the MI approaches consistently yielded unbiased parameter estimates and comparable MSEs cross all examined parameters. Specifically, all methods performed well in accurately estimating the means, variances, and covariances of the growth factors. However, divergent patterns emerged in CIC. For the linear growth model, CICs for the latent variance of the linear slope occasionally fell below 0.925 when using MI-wEMB and MI-lqMLM, particularly under higher levels of missingness in MAR conditions. For the quadratic model, larger proportions of missing data also led to overly liberal CICs (i.e., &#x003C; 0.925) for MI-wEMB and MI-lqMLM, particularly for parameters related to the linear slope.</p>
<p>Model fit evaluation was one of the two central objects of our study. To assess model fit, we examined three pooled test statistics (D<sub>2</sub>, D<sub>3</sub>, and D<sub>4</sub>) obtained from the MI methods, and compared them with the FIML LRT statistic. When the analysis model was correctly specified, the Type I error rates of the pooled test statistics from the wide-format MI methods (MI-wEMB and MI-wFCS) were generally comparable to those produced by FIML. In contrast, the long-format MI methods (MI-llMLM and MI-lqMLM) yielded near-zero Type I error rates, indicating an overly conservative tendency. Under the quadratic model misspecification, where a latent covariance was incorrectly fixed to zero, MI-wEMB and MI-wFCS demonstrated the second- and third-highest power, respectively, to detect misspecification with smaller sample sizes, ranking just below FIML. As expected from the correct-model results, the long-format MI-lqMLM showed the lowest power. Further comparison under model misspecification revealed that the D<sub>2</sub> test statistics from MI-wEMB produced power values comparable to FIML, whereas D<sub>3</sub> and D<sub>4</sub> consistently yielded lower power values.</p>
<p>Overall, unlike the wide-format imputation methods (MI-wEMB and MI-wFCS), the long-format methods (MI-llMLM and MI-lqMLM) performed poorly in model fit evaluation. This shortfall likely stems from the long-format methods&#x2019; transformation of data into long format prior to imputation, followed by the specification of a parametric linear (MI-llMLM) or quadratic (MI-lqMLM) mixed-effects model. These impose greater constraints than less parametric wide-format approaches (no transformation needed), which permits an unstructured covariance matrix across time points without assuming specific random-effects distributions (as in MI-wEMB), or imputes missing values in time points sequentially based on Bayesian regression (as in MI-wFCS). Consequently, the constrained imputation model in long-format methods compels imputed values to adhere closely to the assumed trajectory and clustering structure, thereby reducing unexplained variability in the completed datasets more than a less restrictive model would.</p>
<p>This study provides practical guidance for researchers to select the appropriate approach dealing with missing data in the context of the LGCM framework. Given the growing attention to multilevel long-format imputation methods in recent literature (e.g., <xref ref-type="bibr" rid="ref46">Quartagno and Carpenter, 2019</xref>; <xref ref-type="bibr" rid="ref51">Resche-Rigon and White, 2018</xref>; <xref ref-type="bibr" rid="ref002">Audigier and Resche-Rigon, 2018</xref>; <xref ref-type="bibr" rid="ref17">Enders et al., 2020</xref>; <xref ref-type="bibr" rid="ref23">Grund et al., 2018</xref>), it is important to explore how these approaches can be effectively extended to the LGCM, particularly in addressing the inherent clustered data structure. Building on our findings, we highlight key insights as follows to support better methodological decision-making and identifying promising directions for future studies.</p>
<p>While our results indicate that FIML performs best under the specific conditions examined, this does not diminish the importance of MI in many real-world applications where FIML cannot be reliably implemented. MI is preferable in several key scenarios: when researchers require complete datasets for secondary analyses, encounter convergence issues with FIML (which are common in repeat measures designs), or need to incorporate auxiliary variables not included in the final analysis model. While MI&#x2019;s stepwise approach yielded comparable results in most cases and offers greater flexibility, it requires careful specification of the imputation model and thoughtful selection of pooling strategies.</p>
<p>Despite differences observed in parameter estimates and model fit statistics, MI methods generally served as viable alternatives to FIML. All examined MI approaches generated unbiased parameter estimates, with MI-wFCS (implemented via Blimp) standing out for its robust performance, producing accurate CICs across all parameters and demonstrating minimal sensitivity to both the mechanism and proportion of missing data. MI-wEMB exhibited greater power in LRT overall than other MI methods. For model fit evaluation, the D<sub>2</sub> test statistic paired with MI-wEMB most closely approximated FIML&#x2019;s ability to detect misspecification in latent factor covariances, whereas D<sub>3</sub> and D<sub>4</sub> required larger sample sizes to perform adequately. Notably, as sample size increased, the difference in power among imputation and pooling methods diminished substantially.</p>
<p>The long-format multilevel imputation is particularly appealing for complex LGCMs with a large number of time points or nonlinear trajectories, as it can, in theory, account for within-person dependencies and between-person heterogeneity through the specification of random effects during the imputation phase. However, our findings under the examined conditions indicate that these theoretical advantages, primarily derived from the multilevel modeling framework, did not translate into clear practical benefits over standard wide-format imputation approaches in LGCM. The long-format imputation methods examined in this study showed outstanding performance in parameter recovery relative to their wide-format counterparts, however, they could be more sensitive to missing data proportion when estimating CIs. More critically, the long-format imputation methods associated with the D<sub>2</sub>, D<sub>3</sub>, or D<sub>4</sub> pooling strategies produced near-zero Type I error rates. This result likely arose because the imputed values were generated deterministically and were overly consistent with the analysis model (e.g., linear or quadratic). Without valid between-imputation variability, these pooling strategies tended to underestimate the true uncertainty associated with the missing data. As a result, the pooled LRT statistics became overly conservative and were unlikely to reject the null hypothesis, even when they should have. This conservativeness not only deflated the Type I error rate but also severely reduced statistical power, limiting the ability to detect model misspecifications when they existed.</p>
<p>It is important to acknowledge the limitations of our findings within the context of the specific LGCMs and conditions examined. First, the conclusions may not generalize to alternative model configurations, such as conditional growth curve models with covariates, multivariate growth curve models, or multilevel latent growth curve models with additional hierarchical levels. Further research is needed to investigate these extensions. Second, the observed performance of MI methods may not hold across different types of model misspecifications. While our study focused on misspecification in the analysis model, misspecification can potentially arise in both the imputation and analysis models. The performance of long-format multilevel imputation under various misspecification scenarios presents an intriguing avenue for future investigation. Third, in our simulation, we focus exclusively on conditions allowing a straightforward head-to-head comparison of FIML and MI (e.g., no auxiliary variables under MCAR and few auxiliary variables under MAR), where both approaches are easily implemented and should be equally efficient in theory. However, as documented by <xref ref-type="bibr" rid="ref56">Savalei and Bentler (2009)</xref>, MI generally provides more straightforward inclusion of a large number of auxiliary variables, while FIML often requires saturated-correlates modeling with auxiliary variables that could substantially increase complexity and compromise convergence. This important practical distinction suggests avenues for future research, such as targeted comparisons of MI and saturated-correlates FIML in LGCMs with many auxiliaries or under conditions that challenge FIML convergence. Fourth, our simulation was conducted under the assumption of data normality, utilizing ML or FIML estimators. However, when normality is violated, methodological adjustments become critical. Nonnormality can introduce significant challenges, including biased standard errors, inaccurate test statistics, and potentially misleading fit indices. An important direction for future research involves exploring how different imputation and pooling strategies address nonnormality in LGCM. Fifth, our evaluation on long-format multilevel imputation was limited to the approaches available in Blimp (<xref ref-type="bibr" rid="ref17">Enders et al., 2020</xref>; <xref ref-type="bibr" rid="ref34">Keller and Enders, 2023</xref>) and did not include more recent or alternative substantive-model-compatible (SMC) imputation developments for multilevel data, such as the SMC-JM approach in the R package jomo (<xref ref-type="bibr" rid="ref47">Quartagno and Carpenter, 2022</xref>; <xref ref-type="bibr" rid="ref48">2023</xref>), and the sequential modeling approach in the R package mdmb (<xref ref-type="bibr" rid="ref24">Grund et al., 2021</xref>). Future research could incorporate direct comparisons of these methods under conditions similar to or more extreme than those examined in our study, to further inform methodological choices for handling complex missing data. Finally, the pooling strategies employed in this study did not appear to be well-suited for long-format multilevel imputation approaches. The observed deflated Type I error rates and reduced statistical power highlight the need for further methodological investigation and the development of more targeted post-imputation techniques.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec25">
<title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found at: <ext-link xlink:href="https://nces.ed.gov/ecls/dataproducts.asp" ext-link-type="uri">https://nces.ed.gov/ecls/dataproducts.asp</ext-link>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="ethics-statement" id="sec26">
<title>Ethics statement</title>
<p>Ethical approval was not required for the study involving humans in accordance with the local legislation and institutional requirements. Written informed consent to participate in this study was not required from the participants or the participants&#x2019; legal guardians/next of kin in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec sec-type="author-contributions" id="sec27">
<title>Author contributions</title>
<p>FJ: Methodology, Writing &#x2013; original draft, Conceptualization, Investigation, Visualization, Writing &#x2013; review &#x0026; editing, Formal analysis. YY: Writing &#x2013; original draft, Methodology, Conceptualization, Investigation, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="COI-statement" id="sec28">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec29">
<title>Generative AI statement</title>
<p>The author(s) declared that Generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec30">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="ref001"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Allison</surname><given-names>P. D.</given-names></name></person-group> (<year>2001</year>). <source>Missing Data</source>, <publisher-loc>Thousand Oaks, CA</publisher-loc>: <publisher-name>Sage</publisher-name>.</mixed-citation></ref>
<ref id="ref1"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Asparouhov</surname><given-names>T.</given-names></name> <name><surname>Muth&#x00E9;n</surname><given-names>B</given-names></name></person-group>. (<year>2010</year>). Multiple imputation with Mplus. Technical Report. Available online at: <ext-link xlink:href="https://www.statmodel.com" ext-link-type="uri">https://www.statmodel.com</ext-link> (accessed September, 18, 2021)</mixed-citation></ref>
<ref id="ref002"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Audigier</surname><given-names>V.</given-names></name> <name><surname>Resche-Rigon</surname><given-names>M.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x201C;Micemd&#x201D;: multiple imputation by chained equations with multilevel data</article-title>. Available online at: <ext-link xlink:href="https://CRAN.R-project.org/package=micemd" ext-link-type="uri">https://CRAN.R-project.org/package=micemd</ext-link>.</mixed-citation></ref>
<ref id="ref4"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Biesanz</surname><given-names>J. C.</given-names></name> <name><surname>Deeb-Sossa</surname><given-names>N.</given-names></name> <name><surname>Papadakis</surname><given-names>A. A.</given-names></name> <name><surname>Bollen</surname><given-names>K. A.</given-names></name> <name><surname>Curran</surname><given-names>P. J.</given-names></name></person-group> (<year>2004</year>). <article-title>The role of coding time in estimating and interpreting growth curve models</article-title>. <source>Psychol. Methods</source> <volume>9</volume>, <fpage>30</fpage>&#x2013;<lpage>52</lpage>. doi: <pub-id pub-id-type="doi">10.1037/1082-989X.9.1.30</pub-id>, <pub-id pub-id-type="pmid">15053718</pub-id></mixed-citation></ref>
<ref id="ref5"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Bollen</surname><given-names>K. A.</given-names></name></person-group> (<year>1989</year>). <source>Structural Equations with Latent Variables</source>, <volume>210</volume> <publisher-loc>New York, NY</publisher-loc>: <publisher-name>John Wiley &#x0026; Sons</publisher-name>.</mixed-citation></ref>
<ref id="ref6"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Bollen</surname><given-names>K. A.</given-names></name> <name><surname>Curran</surname><given-names>P. J.</given-names></name></person-group> (<year>2006</year>). <source>Latent curve Models: A Structural Equation Perspective</source>. <publisher-loc>Hoboken, NJ</publisher-loc>: <publisher-name>John Wiley &#x0026; Sons</publisher-name>.</mixed-citation></ref>
<ref id="ref7"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bradley</surname><given-names>J. V.</given-names></name></person-group> (<year>1978</year>). <article-title>Robustness?</article-title> <source>Br. J. Math. Stat. Psychol.</source> <volume>31</volume>, <fpage>144</fpage>&#x2013;<lpage>152</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.2044-8317.1978.tb00581.x</pub-id></mixed-citation></ref>
<ref id="ref8"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Buse</surname><given-names>A.</given-names></name></person-group> (<year>1982</year>). <article-title>The likelihood ratio, Wald, and Lagrange multiplier tests: an expository note</article-title>. <source>Am. Stat.</source> <volume>36</volume>, <fpage>153</fpage>&#x2013;<lpage>157</lpage>. doi: <pub-id pub-id-type="doi">10.1080/00031305.1982.10482817</pub-id></mixed-citation></ref>
<ref id="ref9"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Carpenter</surname><given-names>J. R.</given-names></name> <name><surname>Goldstein</surname><given-names>H.</given-names></name> <name><surname>Kenward</surname><given-names>M. G.</given-names></name></person-group> (<year>2011</year>). <article-title>REALCOM-IMPUTE software for multilevel multiple imputation with mixed response types</article-title>. <source>J. Stat. Softw.</source> <volume>45</volume>, <fpage>1</fpage>&#x2013;<lpage>14</lpage>. doi: <pub-id pub-id-type="doi">10.18637/jss.v045.i05</pub-id></mixed-citation></ref>
<ref id="ref10"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chan</surname><given-names>K. W.</given-names></name> <name><surname>Meng</surname><given-names>X.-L.</given-names></name></person-group> (<year>2022</year>). <article-title>Multiple improvements of multiple imputation likelihood ratio tests</article-title>. <source>Stat. Sin.</source> <volume>2022</volume>, <fpage>1489</fpage>&#x2013;<lpage>1514</lpage>. doi: <pub-id pub-id-type="doi">10.5705/ss.202019.0314</pub-id></mixed-citation></ref>
<ref id="ref12"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Collins</surname><given-names>L. M.</given-names></name> <name><surname>Schafer</surname><given-names>J. L.</given-names></name> <name><surname>Kam</surname><given-names>C. M.</given-names></name></person-group> (<year>2001</year>). <article-title>A comparison of inclusive and restrictive strategies in modern missing data procedures</article-title>. <source>Psychol. Methods</source> <volume>6</volume>, <fpage>330</fpage>&#x2013;<lpage>351</lpage>. doi: <pub-id pub-id-type="doi">10.1037/1082-989X.6.4.330</pub-id>, <pub-id pub-id-type="pmid">11778676</pub-id></mixed-citation></ref>
<ref id="ref13"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Depaoli</surname><given-names>S.</given-names></name> <name><surname>Jia</surname><given-names>F.</given-names></name> <name><surname>Heo</surname><given-names>I.</given-names></name></person-group> (<year>2023</year>). <article-title>Detecting model misspecification in Bayesian piecewise growth models</article-title>. <source>Struct. Equ. Model. Multidiscip. J.</source> <volume>30</volume>, <fpage>574</fpage>&#x2013;<lpage>591</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10705511.2022.2144865</pub-id></mixed-citation></ref>
<ref id="ref14"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Enders</surname><given-names>C. K.</given-names></name></person-group> (<year>2001</year>). <article-title>A primer on maximum likelihood algorithms available for use with missing data</article-title>. <source>Struct. Equ. Model.</source> <volume>8</volume>, <fpage>128</fpage>&#x2013;<lpage>141</lpage>. doi: <pub-id pub-id-type="doi">10.1207/S15328007SEM0801_7</pub-id></mixed-citation></ref>
<ref id="ref15"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Enders</surname><given-names>C. K.</given-names></name></person-group> (<year>2011</year>). <article-title>Analyzing longitudinal data with missing values</article-title>. <source>Rehabil. Psychol.</source> <volume>56</volume>, <fpage>267</fpage>&#x2013;<lpage>288</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0025579</pub-id>, <pub-id pub-id-type="pmid">21967118</pub-id></mixed-citation></ref>
<ref id="ref003"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Enders</surname><given-names>C. K.</given-names></name></person-group> (<year>2022</year>). <source>Applied missing data analysis (2nd ed.)</source>. <publisher-name>The Guilford Press</publisher-name>.</mixed-citation></ref>
<ref id="ref16"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Enders</surname><given-names>C. K.</given-names></name> <name><surname>Bandalos</surname><given-names>D. L.</given-names></name></person-group> (<year>2001</year>). <article-title>The relative performance of full information maximum likelihood estimation for missing data in structural equation models</article-title>. <source>Struct. Equ. Model. Multidiscip. J.</source> <volume>8</volume>, <fpage>430</fpage>&#x2013;<lpage>457</lpage>. doi: <pub-id pub-id-type="doi">10.1207/S15328007SEM0803_5</pub-id></mixed-citation></ref>
<ref id="ref17"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Enders</surname><given-names>C. K.</given-names></name> <name><surname>Du</surname><given-names>H.</given-names></name> <name><surname>Keller</surname><given-names>B. T.</given-names></name></person-group> (<year>2020</year>). <article-title>A model-based imputation procedure for multilevel regression models with random coefficients, interaction effects, and nonlinear terms</article-title>. <source>Psychol. Methods</source> <volume>25</volume>, <fpage>88</fpage>&#x2013;<lpage>112</lpage>. doi: <pub-id pub-id-type="doi">10.1037/met0000228</pub-id>, <pub-id pub-id-type="pmid">31259566</pub-id></mixed-citation></ref>
<ref id="ref18"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Enders</surname><given-names>C. K.</given-names></name> <name><surname>Mansolf</surname><given-names>M.</given-names></name></person-group> (<year>2018</year>). <article-title>Assessing the fit of structural equation models with multiply imputed data</article-title>. <source>Psychol. Methods</source> <volume>23</volume>, <fpage>76</fpage>&#x2013;<lpage>93</lpage>. doi: <pub-id pub-id-type="doi">10.1037/met0000102</pub-id>, <pub-id pub-id-type="pmid">27893216</pub-id></mixed-citation></ref>
<ref id="ref21"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gottschall</surname><given-names>A. C.</given-names></name> <name><surname>West</surname><given-names>S. G.</given-names></name> <name><surname>Enders</surname><given-names>C. K.</given-names></name></person-group> (<year>2012</year>). <article-title>A comparison of item-level and scale-level multiple imputation for questionnaire batteries</article-title>. <source>Multivar. Behav. Res.</source> <volume>47</volume>, <fpage>1</fpage>&#x2013;<lpage>25</lpage>. doi: <pub-id pub-id-type="doi">10.1080/00273171.2012.640589</pub-id></mixed-citation></ref>
<ref id="ref22"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Graham</surname><given-names>J. W.</given-names></name></person-group> (<year>2003</year>). <article-title>Adding missing-data-relevant variables to FIML-based structural equation models</article-title>. <source>Struct. Equ. Model. Multidiscip. J.</source> <volume>10</volume>, <fpage>80</fpage>&#x2013;<lpage>100</lpage>. doi: <pub-id pub-id-type="doi">10.1207/S15328007SEM1001_4</pub-id></mixed-citation></ref>
<ref id="ref23"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Grund</surname><given-names>S.</given-names></name> <name><surname>L&#x00FC;dtke</surname><given-names>O.</given-names></name> <name><surname>Robitzsch</surname><given-names>A.</given-names></name></person-group> (<year>2018</year>). <article-title>Multiple imputation of missing data for multilevel models: simulations and recommendations</article-title>. <source>Organ. Res. Methods</source> <volume>21</volume>, <fpage>111</fpage>&#x2013;<lpage>149</lpage>.</mixed-citation></ref>
<ref id="ref24"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Grund</surname><given-names>S.</given-names></name> <name><surname>L&#x00FC;dtke</surname><given-names>O.</given-names></name> <name><surname>Robitzsch</surname><given-names>A.</given-names></name></person-group> (<year>2021</year>). <article-title>Multiple imputation of missing data in multilevel models with the R package mdmb: a flexible sequential modeling approach</article-title>. <source>Behav. Res. Methods</source> <volume>53</volume>, <fpage>2631</fpage>&#x2013;<lpage>2649</lpage>. doi: <pub-id pub-id-type="doi">10.3758/s13428-020-01530-0</pub-id></mixed-citation></ref>
<ref id="ref25"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Grund</surname><given-names>S.</given-names></name> <name><surname>L&#x00FC;dtke</surname><given-names>O.</given-names></name> <name><surname>Robitzsch</surname><given-names>A.</given-names></name></person-group> (<year>2023</year>). <article-title>Pooling methods for likelihood ratio tests in multiply imputed data sets</article-title>. <source>Psychol. Methods</source> <volume>28</volume>, <fpage>1207</fpage>&#x2013;<lpage>1221</lpage>. doi: <pub-id pub-id-type="doi">10.1177/1094428117703686</pub-id>, <pub-id pub-id-type="pmid">37104764</pub-id></mixed-citation></ref>
<ref id="ref26"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Honaker</surname><given-names>J.</given-names></name> <name><surname>King</surname><given-names>G.</given-names></name> <name><surname>Blackwell</surname><given-names>M.</given-names></name></person-group> (<year>2011</year>). <article-title>Amelia II: a program for missing data</article-title>. <source>J. Stat. Softw.</source> <volume>45</volume>, <fpage>1</fpage>&#x2013;<lpage>47</lpage>. doi: <pub-id pub-id-type="doi">10.18637/jss.v045.i07</pub-id></mixed-citation></ref>
<ref id="ref28"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Huque</surname><given-names>M. H.</given-names></name> <name><surname>Carlin</surname><given-names>J. B.</given-names></name> <name><surname>Simpson</surname><given-names>J. A.</given-names></name> <name><surname>Lee</surname><given-names>K. J.</given-names></name></person-group> (<year>2018</year>). <article-title>A comparison of multiple imputation methods for missing data in longitudinal studies</article-title>. <source>BMC Med. Res. Methodol.</source> <volume>18</volume>:<fpage>168</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12874-018-0615-</pub-id></mixed-citation></ref>
<ref id="ref30"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jia</surname><given-names>F.</given-names></name> <name><surname>Wu</surname><given-names>W.</given-names></name></person-group> (<year>2022</year>). <article-title>A comparison of multiple imputation strategies to deal with missing nonnormal data in structural equation modeling</article-title>. <source>Behav. Res. Methods</source> <volume>55</volume>, <fpage>3100</fpage>&#x2013;<lpage>3119</lpage>. doi: <pub-id pub-id-type="doi">10.3758/s13428-022-01936-y</pub-id></mixed-citation></ref>
<ref id="ref33"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Jorgensen</surname><given-names>T.</given-names></name> <name><surname>Rosseel</surname><given-names>Y.</given-names></name></person-group> (<year>2025</year>). Lavaan.mi: fit structural equation models to multiply imputed data (version 0.1-0) [computer software]. Available online at: <ext-link xlink:href="https://cran.r-project.org/web/packages/lavaan.mi/index.html" ext-link-type="uri">https://cran.r-project.org/web/packages/lavaan.mi/index.html</ext-link> (Accessed February 7, 2025).</mixed-citation></ref>
<ref id="ref34"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Keller</surname><given-names>B. T.</given-names></name> <name><surname>Enders</surname><given-names>C. K.</given-names></name></person-group> (<year>2023</year>). Blimp user&#x2019;s guide (Version 3). Available online at: <ext-link xlink:href="https://www.appliedmissingdata.com/blimp" ext-link-type="uri">https://www.appliedmissingdata.com/blimp</ext-link> (Accessed February 7, 2025).</mixed-citation></ref>
<ref id="ref35"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kohli</surname><given-names>N.</given-names></name> <name><surname>Harring</surname><given-names>J. R.</given-names></name></person-group> (<year>2013</year>). <article-title>Modeling growth in latent variables using a piecewise function</article-title>. <source>Multivar. Behav. Res.</source> <volume>48</volume>, <fpage>370</fpage>&#x2013;<lpage>397</lpage>. doi: <pub-id pub-id-type="doi">10.1080/00273171.2013.778191</pub-id>, <pub-id pub-id-type="pmid">26741847</pub-id></mixed-citation></ref>
<ref id="ref37"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>K.-H.</given-names></name> <name><surname>Meng</surname><given-names>X.-L.</given-names></name> <name><surname>Raghunathan</surname><given-names>T. E.</given-names></name> <name><surname>Rubin</surname><given-names>D. B.</given-names></name></person-group> (<year>1991</year>). <article-title>Significance levels from repeated p-values with multiply-imputed data</article-title>. <source>Stat. Sin.</source> <volume>1</volume>, <fpage>65</fpage>&#x2013;<lpage>92</lpage>. Available online at: <ext-link xlink:href="https://www.jstor.org/stable/24303994" ext-link-type="uri">https://www.jstor.org/stable/24303994</ext-link></mixed-citation></ref>
<ref id="ref39"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>Y.</given-names></name> <name><surname>Sriutaisuk</surname><given-names>S.</given-names></name></person-group> (<year>2020</year>). <article-title>Evaluation of model fit in structural equation models with ordinal missing data: an examination of the D2 method</article-title>. <source>Struct. Equ. Model.</source> <volume>27</volume>, <fpage>561</fpage>&#x2013;<lpage>583</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10705511.2019.1662307</pub-id></mixed-citation></ref>
<ref id="ref41"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Meng</surname><given-names>X.-L.</given-names></name> <name><surname>Rubin</surname><given-names>D. B.</given-names></name></person-group> (<year>1992</year>). <article-title>Performing likelihood ratio tests with multiply-imputed data sets</article-title>. <source>Biometrika</source> <volume>79</volume>, <fpage>103</fpage>&#x2013;<lpage>111</lpage>. doi: <pub-id pub-id-type="doi">10.1093/biomet/79.1.103</pub-id></mixed-citation></ref>
<ref id="ref42"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Mulligan</surname><given-names>G. M.</given-names></name> <name><surname>McCarroll</surname><given-names>J. C.</given-names></name> <name><surname>Flanagan</surname><given-names>K. D.</given-names></name> <name><surname>McPhee</surname><given-names>C.</given-names></name></person-group> (<year>2019</year>). <source>Findings from the Fifth-Grade Round of the Early Childhood Longitudinal Study, Kindergarten Class of 2010&#x2013;11 (ECLS-K: 2011). First look. NCES 2019-130</source>. <publisher-loc>Washington, DC</publisher-loc>: <publisher-name>National Center for Education Statistics</publisher-name>. Available online at: <ext-link xlink:href="https://eric.ed.gov/?id=ED592787" ext-link-type="uri">https://eric.ed.gov/?id=ED592787</ext-link> (Accessed March 24, 2025).</mixed-citation></ref>
<ref id="ref45"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Quartagno</surname><given-names>M.</given-names></name> <name><surname>Carpenter</surname><given-names>J. R.</given-names></name></person-group> (<year>2016</year>). <article-title>Multiple imputation for IPD meta-analysis: allowing for heterogeneity and studies with missing covariates</article-title>. <source>Stat. Med.</source> <volume>35</volume>, <fpage>2938</fpage>&#x2013;<lpage>2954</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sim.6837</pub-id>, <pub-id pub-id-type="pmid">26681666</pub-id></mixed-citation></ref>
<ref id="ref46"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Quartagno</surname><given-names>M.</given-names></name> <name><surname>Carpenter</surname><given-names>J. R.</given-names></name></person-group> (<year>2019</year>). <article-title>Multiple imputation for discrete data: evaluation of the joint latent normal model</article-title>. <source>Biom. J.</source> <volume>61</volume>, <fpage>1003</fpage>&#x2013;<lpage>1019</lpage>. doi: <pub-id pub-id-type="doi">10.1002/bimj.201800222</pub-id>, <pub-id pub-id-type="pmid">30868652</pub-id></mixed-citation></ref>
<ref id="ref47"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Quartagno</surname><given-names>M.</given-names></name> <name><surname>Carpenter</surname><given-names>J. R.</given-names></name></person-group> (<year>2022</year>). <article-title>Substantive model compatible multilevel multiple imputation: a joint modeling approach</article-title>. <source>Stat. Med.</source> <volume>41</volume>, <fpage>5000</fpage>&#x2013;<lpage>5015</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sim.9549</pub-id>, <pub-id pub-id-type="pmid">35959539</pub-id></mixed-citation></ref>
<ref id="ref48"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Quartagno</surname><given-names>M.</given-names></name> <name><surname>Carpenter</surname><given-names>J. R.</given-names></name></person-group> (<year>2023</year>). Jomo: a package for multilevel joint modelling multiple imputation. Available online at: <ext-link xlink:href="https://CRAN.R-project.org/package=jomo" ext-link-type="uri">https://CRAN.R-project.org/package=jomo</ext-link> (Accessed February 10, 2025).</mixed-citation></ref>
<ref id="ref49"><mixed-citation publication-type="other"><person-group person-group-type="author"><collab id="coll1">R Core Team</collab></person-group> (<year>2021</year>). <source>R: A Language and Environment for Statistical Computing</source>. <publisher-name>R Foundation for Statistical Computing</publisher-name>, <publisher-loc>Vienna, Austria</publisher-loc>. Available online at: <ext-link xlink:href="https://www.R-project.org/" ext-link-type="uri">https://www.R-project.org/</ext-link>. (Accessed June 30, 2023).</mixed-citation></ref>
<ref id="ref51"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Resche-Rigon</surname><given-names>M.</given-names></name> <name><surname>White</surname><given-names>I. R.</given-names></name></person-group> (<year>2018</year>). <article-title>Multiple imputation by chained equations for systematically and sporadically missing multilevel data</article-title>. <source>Stat. Methods Med. Res.</source> <volume>27</volume>, <fpage>1634</fpage>&#x2013;<lpage>1649</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0962280216666564</pub-id>, <pub-id pub-id-type="pmid">27647809</pub-id></mixed-citation></ref>
<ref id="ref53"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rosseel</surname><given-names>Y.</given-names></name></person-group> (<year>2012</year>). <article-title>Lavaan: an R package for structural equation modeling</article-title>. <source>J. Stat. Softw.</source> <volume>48</volume>, <fpage>1</fpage>&#x2013;<lpage>36</lpage>. doi: <pub-id pub-id-type="doi">10.18637/jss.v048.i02</pub-id></mixed-citation></ref>
<ref id="ref004"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rubin</surname><given-names>D. B.</given-names></name></person-group> (<year>1976</year>). <article-title>Inference and missing data</article-title>. <source>Biometrika</source>, <volume>63</volume>, <fpage>581</fpage>&#x2013;<lpage>592</lpage>.</mixed-citation></ref>
<ref id="ref54"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Rubin</surname><given-names>D. B.</given-names></name></person-group> (<year>1987</year>). <source>Multiple Imputation for Nonresponse in Surveys</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>John Wiley &#x0026; Sons</publisher-name>.</mixed-citation></ref>
<ref id="ref56"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Savalei</surname><given-names>V.</given-names></name> <name><surname>Bentler</surname><given-names>P. M.</given-names></name></person-group> (<year>2009</year>). <article-title>A two-stage approach to missing data: theory and application to auxiliary variables</article-title>. <source>Struct. Equ. Model. Multidiscip. J.</source> <volume>16</volume>, <fpage>477</fpage>&#x2013;<lpage>497</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10705510903008238</pub-id></mixed-citation></ref>
<ref id="ref58"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Schafer</surname><given-names>J. L.</given-names></name></person-group> (<year>1997</year>). <source>Analysis of Incomplete Multivariate Data</source>. <publisher-loc>Boca Raton, FL</publisher-loc>: <publisher-name>CRC press</publisher-name>.</mixed-citation></ref>
<ref id="ref63"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Tourangeau</surname><given-names>K.</given-names></name> <name><surname>Nord</surname><given-names>C.</given-names></name> <name><surname>L&#x00EA;</surname><given-names>T.</given-names></name> <name><surname>Wallner-Allen</surname><given-names>K.</given-names></name> <name><surname>Vaden-Kiernan</surname><given-names>N.</given-names></name> <name><surname>Blaker</surname><given-names>L.</given-names></name> <etal/></person-group>. (<year>2019</year>). <source>Early childhood longitudinal study, kindergarten class of 2010&#x2013;11 (ECLS-K: 2011) user&#x2019;s manual for the ECLS-K: 2011 kindergarten&#x2013;fifth grade data file and electronic codebook, public version (NCES 2019&#x2013;051)</source>. <publisher-loc>Washington, DC</publisher-loc>: <publisher-name>U.S. Department of Education, National Center for Education Statistics</publisher-name>.</mixed-citation></ref>
<ref id="ref65"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>van Buuren</surname><given-names>S.</given-names></name> <name><surname>Brand</surname><given-names>J. P. L.</given-names></name> <name><surname>Groothuis-Oudshoorn</surname><given-names>C.</given-names></name> <name><surname>Rubin</surname><given-names>D. B.</given-names></name></person-group> (<year>2006</year>). <article-title>Fully conditional specification in multivariate imputation</article-title>. <source>J. Stat. Comput. Simul.</source> <volume>76</volume>, <fpage>1049</fpage>&#x2013;<lpage>1064</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10629360600810434</pub-id></mixed-citation></ref>
<ref id="ref66"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>van Buuren</surname><given-names>S.</given-names></name> <name><surname>Groothuis-Oudshoorn</surname><given-names>K.</given-names></name></person-group> (<year>2011</year>). <article-title>Mice: multivariate imputation by chained equations in R</article-title>. <source>J. Stat. Softw.</source> <volume>45</volume>, <fpage>1</fpage>&#x2013;<lpage>67</lpage>. doi: <pub-id pub-id-type="doi">10.18637/jss.v045.i03</pub-id></mixed-citation></ref>
<ref id="ref67"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>White</surname><given-names>I. R.</given-names></name> <name><surname>Royston</surname><given-names>P.</given-names></name> <name><surname>Wood</surname><given-names>A. M.</given-names></name></person-group> (<year>2011</year>). <article-title>Multiple imputation using chained equations: issues and guidance for practice</article-title>. <source>Stat. Med.</source> <volume>30</volume>, <fpage>377</fpage>&#x2013;<lpage>399</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sim.4067</pub-id>, <pub-id pub-id-type="pmid">21225900</pub-id></mixed-citation></ref>
<ref id="ref68"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname><given-names>W.</given-names></name> <name><surname>West</surname><given-names>S. G.</given-names></name></person-group> (<year>2010</year>). <article-title>Sensitivity of fit indices to misspecification in growth curve models</article-title>. <source>Multivar. Behav. Res.</source> <volume>45</volume>, <fpage>420</fpage>&#x2013;<lpage>452</lpage>. doi: <pub-id pub-id-type="doi">10.1080/00273171.2010.483378</pub-id>, <pub-id pub-id-type="pmid">26760488</pub-id></mixed-citation></ref>
<ref id="ref71"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Zhao</surname><given-names>J. H.</given-names></name> <name><surname>Schafer</surname><given-names>J. L.</given-names></name></person-group> (<year>2015</year>). pan: multiple imputation for multivariate panel or clustered data. Available online at: <ext-link xlink:href="https://cran.r-project.org/web/packages/pan/pan.pdf" ext-link-type="uri">https://cran.r-project.org/web/packages/pan/pan.pdf</ext-link> (Accessed February 10, 2025).</mixed-citation></ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0002">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/22411/overview">Holmes Finch</ext-link>, Ball State University, United States</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0003">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/916834/overview">Yutian Tang Thompson</ext-link>, University of Oklahoma Health Sciences Center, United States</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/585081/overview">Ricardo Olmos</ext-link>, Autonomous University of Madrid, Spain</p>
</fn>
</fn-group>
<fn-group>
<fn id="fn0001">
<label>1</label>
<p>Complete results, including MSE, as well as the code for simulation and analysis in empirical example are available in OSF (<ext-link xlink:href="https://osf.io/3bswx/overview" ext-link-type="uri">https://osf.io/3bswx/overview</ext-link>).</p>
</fn>
</fn-group>
</back>
</article>