<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychol.</journal-id>
<journal-title>Frontiers in Psychology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychol.</abbrev-journal-title>
<issn pub-type="epub">1664-1078</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyg.2025.1499076</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Psychology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Comparing raw score difference, multilevel modeling, and structural equation modeling methods for estimating discrepancy in dyads</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>McEnturff</surname> <given-names>Amber</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Chen</surname> <given-names>Qi</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/11028/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Henson</surname> <given-names>Robin K.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/45638/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Glaman</surname> <given-names>Ryan</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/401597/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Luo</surname> <given-names>Wen</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/430888/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Alexandria City Public Schools</institution>, <addr-line>Alexandria, VA</addr-line>, <country>United States</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Educational Psychology, University of North Texas</institution>, <addr-line>Denton, TX</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Educational Leadership and Technology, Tarleton State University</institution>, <addr-line>Stephenville, TX</addr-line>, <country>United States</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Educational Psychology, Texas A&#x0026;M University</institution>, <addr-line>College Station, TX</addr-line>, <country>United States</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0001">
<p>Edited by: Wenchao Ma, University of Minnesota Twin Cities, United States</p>
</fn>
<fn fn-type="edited-by" id="fn0002">
<p>Reviewed by: Max Auerswald, University of Ulm, Germany</p>
<p>Jiun-Yu Wu, Southern Methodist University, United States</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Amber McEnturff, <email>amber.mcenturff@acps.k12.va.us</email>;Qi Chen, <email>qi.chen@unt.edu</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>19</day>
<month>06</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1499076</elocation-id>
<history>
<date date-type="received">
<day>20</day>
<month>09</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>22</day>
<month>04</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 McEnturff, Chen, Henson, Glaman and Luo.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>McEnturff, Chen, Henson, Glaman and Luo</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Dyadic data analysis is commonly used in psychological research involving pairs of individuals in a nested relationship, such as parent and child, student and teacher, and pairs of spouses. There are several methods for calculating dyadic discrepancy (i.e., difference) scores, and purpose of the present study was to explore which of these methods produced the most accurate discrepancy estimates and most accurate outcome prediction.</p>
</sec>
<sec>
<title>Methods</title>
<p>Using a Monte Carlo simulation, the present study compared three methods for estimating discrepancy scores in dyad pairs: raw score difference (RSD), empirical Bayes estimates from multilevel modeling (MLM), and factor scores from structural equation modeling (SEM). Design factors for this simulation included intraclass correlation (ICC), cluster number, reliability estimates, effect size of discrepancy, and effect size variance.</p>
</sec>
<sec>
<title>Results</title>
<p>Results suggest discrepancy estimates from MLM had poor reliability compared to RSD and SEM methods. These findings were driven primarily by having a high ICC, high effect size variance, and low number of clusters. None of the design factors had an appreciable impact on either the RSD or SEM estimates.</p>
</sec>
<sec>
<title>Discussion</title>
<p>RSD and SEM methods performed similarly, and are recommended for practical use in estimating discrepancy values. MLM is not recommended as it featured comparatively poor reliability.</p>
</sec>
</abstract>
<kwd-group>
<kwd>dyadic analysis</kwd>
<kwd>dyadic discrepancy</kwd>
<kwd>multilevel modeling</kwd>
<kwd>structural equation modeling</kwd>
<kwd>Monte Carlo simulation</kwd>
</kwd-group>
<counts>
<fig-count count="11"/>
<table-count count="5"/>
<equation-count count="15"/>
<ref-count count="48"/>
<page-count count="20"/>
<word-count count="13789"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Quantitative Psychology and Measurement</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>This study&#x2019;s purpose was to determine the best way to measure the difference between members of a dyad, or two people, on a psychological construct (i.e., relationship satisfaction). Because there are several methods used in the literature and no clear consensus on the best approach, a Monte Carlo simulation compared three of these methods across a variety of potential research conditions, including variations on intraclass correlation (ICC), cluster number, reliability, effect size, and effect size variance.</p>
<p><xref ref-type="bibr" rid="ref38">Sayer and Klute (2005)</xref> defined a dyad as &#x201C;two individuals&#x201D; &#x201C;nested in a relationship&#x201D; (p. 291). Common examples of dyads include parent and child, employee and supervisor, or student and professor. Dyadic discrepancy is defined as the degree to which two individuals nested in a relationship differ on some construct of interest. The construct could be virtually any psychological or educational measure, such as depression, intelligence, or personality. For example, if each member of a heterosexual married couple completes an assessment of marital satisfaction, the scores may reveal that a wife has a much higher level of marital satisfaction than her husband. The difference in levels of marital satisfaction between the husband and wife is the dyadic discrepancy. The discrepancy score represents both the magnitude (size) and direction (which dyad member has a higher score) of the difference.</p>
<p>In addition to understanding the discrepancy itself, it may be useful to understand the relationship between the discrepancy and some other variable. Following the marital satisfaction scenario, the amount of discrepancy may be related to the effectiveness of couples&#x2019; counseling. Therefore, the focus of this study includes both the estimation of discrepancy and its relationship with another variable.</p>
<p>The importance of accurate discrepancy estimation lies in both the prevalence of research using dyads and the implications of inaccurate discrepancy estimation. Dyadic discrepancy is studied in multiple areas of psychology. For example, the acculturation gap (<xref ref-type="bibr" rid="ref12">Costigan and Dokis, 2006</xref>) is a type of dyadic discrepancy that may occur between parent and child when one member of the dyad acculturates to a new culture at a different level than the other member. The discrepancy represents the size of the acculturation gap and the direction (whether parent or child has become more acculturated than the other). Acculturation gap may predict child maladjustment (<xref ref-type="bibr" rid="ref22">Kim et al., 2013</xref>). In this example, accurate discrepancy estimation is important for understanding the relationship between the acculturation gap and outcomes like child maladjustment, which may then impact family interventions.</p>
<p>As another example, dyadic discrepancy has also been applied in end-of-life care research. For example, <xref ref-type="bibr" rid="ref39">Schmid et al. (2010)</xref> analyzed the relationship between the discrepancy in desire for medical intervention and family demographic characteristics to learn which families were most at risk for having a large discrepancy between the patients&#x2019; actual medical care wishes and how the family perceived them. Like the acculturation example, a better understanding of the relationship between the discrepancy and family characteristics can guide recommendations about interventions that prepare families for end-of-life care decisions. Other examples discrepancy research include: marital satisfaction discrepancy related to psychological adjustment to widowhood (<xref ref-type="bibr" rid="ref001">Carr and Boerner, 2009</xref>); informant discrepancies between reporters of child psychological behavior related to the diagnosis of the child (<xref ref-type="bibr" rid="ref15">De Los Reyes and Kazdin, 2004</xref>); and, discrepancies between parent and child educational expectations related to adolescent adjustment (<xref ref-type="bibr" rid="ref43">Wang and Benner, 2013</xref>). Accurate and consistent discrepancy score estimation is the first step to understanding the relationship between discrepancy and other variables.</p>
<sec id="sec2">
<label>1.1</label>
<title>Conceptualization of dyad discrepancies</title>
<p>Importantly, there are different ways to conceptualize dyadic discrepancy, such as idiographic versus nomothetic measures of discrepancy. The idiographic approach computes discrepancy for each dyad separately and can be compared among dyads. Following the marriage example, each couple would have its own marital satisfaction discrepancy score.</p>
<p>In the nomothetic approach, a single discrepancy estimate is computed across all dyads. Using marriage, the discrepancy would be a single measure, that might, for example, reflect a general trend where husbands tended to be more or less satisfied in their marriages than wives. Idiographic discrepancies can be summarized using descriptive statistics such as mean or standard deviation and used in a nomothetic approach (<xref ref-type="bibr" rid="ref19">Kenny et al., 2006a</xref>).</p>
<p>The goal of a dyadic analysis might be to build generalizable knowledge about marital satisfaction (nomothetic) or to better understand the marital satisfaction of individual dyads (idiographic). As described by <xref ref-type="bibr" rid="ref42">Steele et al. (2013)</xref>, analyses could combine both nomothetic and idiographic approaches. They stated, &#x201C;&#x2026;we need methods that allow individual trajectories to emerge while simultaneously looking to a common point of comparison&#x201D; (p. 676). The methods compared in this study output a single idiographic discrepancy measure for each dyad. The discrepancy can then be used to answer idiographic or nomothetic research questions.</p>
<p>Another conceptual issue is the difference between distinguishable and indistinguishable dyads (<xref ref-type="bibr" rid="ref002">Gonzalez and Griffin, 1997</xref>). Distinguishable dyads are differentiable by some trait that is of interest in the research. In marital satisfaction, a heterosexual married couple would be considered distinguishable, for example, by role (husband and wife), gender, and potentially other variables such as employment status (where one works and one does not). Indistinguishable dyads have no distinguishing factor between them, such as identical twins. Other dyads that could be distinguishable, like husband and wife, may be treated as indistinguishable if role, gender, or other distinguishing factor is not of interest to the research study. For distinguishable dyads, both the size (how different are the members of a dyad) and direction (which dyad member has the higher score) of the discrepancy must be used in the analysis. For indistinguishable dyads, only the size of the discrepancy matters, and some statistics would be inappropriate for such data. For example, Pearson <italic>r</italic> should not be computed for indistinguishable dyads because <italic>r</italic> requires paired data with specific groups, where each score in the pair must belong to a particular group. Pearson <italic>r</italic> could mathematically be computed as a measure of association between a group of dyads, but <italic>r</italic> would depend on how each dyad member was assigned to a group, which would be an arbitrary decision that alters the value of <italic>r</italic> when changed. Therefore, it is important to ensure measures computed for dyadic data appropriately take distinguishability into account.</p>
<p>Another issue impacting the computation of dyadic discrepancy is whether a single score or composite scale score is used. In some discrepancy models, the construct of interest is represented by a single score from each dyad member, which may be a single item score or a composite scale score generated from multiple items in a separate analysis of the measurement model. Conversely, some models, such as structural equation models, use item-level data and incorporate the measurement model and discrepancy model into one analysis (<xref ref-type="bibr" rid="ref33">Newsom, 2002</xref>). The scope of this research is limited to the single-score case. Whether a single score or item-level data is used, measurement invariance is assumed before calculating discrepancy scores. Confirmation of measurement invariance ensures that measures are indeed tapping the same construct when used with two different populations (<xref ref-type="bibr" rid="ref36">Russell et al., 2016</xref>).</p>
<p>In summary, when choosing discrepancy calculation methods, it is important to consider whether the research is idiographic or nomothetic in nature, whether dyads are distinguishable or indistinguishable within the context of the research question, and what kind of numerical data will be used to compute the discrepancy (a single score or multiple scores).</p>
</sec>
<sec id="sec3">
<label>1.2</label>
<title>Discrepancy estimation methods</title>
<p>Three methods for estimating discrepancy were identified that fit into the theoretical framework described above; that is, they provide an idiographic measure of discrepancy (an individual score for each dyad), they may be used for distinguishable or indistinguishable dyads, and they use the composite score rather than individual item scores. The three methods are the raw score difference (RSD), the empirical Bayes discrepancy (EBD) estimate from multilevel modeling (MLM), and the factor score from structural equation modeling (SEM). In this section, each method is described in detail, and reasons for not including other discrepancy methods are also provided. Throughout this section, the symbols <italic>X</italic> and <italic>Y</italic> are used to represent scores from dyad members <italic>A</italic> and <italic>B</italic>, respectively.</p>
<sec id="sec4">
<label>1.2.1</label>
<title>Raw score difference</title>
<p>The RSD is computed by subtracting one raw score from another, as shown in <xref ref-type="disp-formula" rid="EQ1">Equation 1</xref>:</p>
<disp-formula id="EQ1">
<label>(1)</label>
<mml:math id="M1">
<mml:mi mathvariant="italic">RSD</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>Y</mml:mi>
</mml:math>
</disp-formula>
<p>The RSD is easily interpretable; a value of 0 represents lack of discrepancy between the dyad members (<xref ref-type="bibr" rid="ref17">Guion et al., 2009</xref>).</p>
<p>RSD has been criticized for having low reliability (<xref ref-type="bibr" rid="ref13">Cronbach and Furby, 1970</xref>). Reliability is the overall consistency of a measure and, according to classical test theory, is the true score variance divided by observed score variance (<xref ref-type="bibr" rid="ref16">DeVellis, 2006</xref>). In applied research, where it is not possible to know true score variance, reliability is estimated using methods such as test&#x2013;retest or inter-rater reliability. Using Monte Carlo simulation methods, however, it is possible to compute the true measure of reliability because both true score and observed score variances are known.</p>
<p>The formula for estimating reliability of RSD based on its components (raw scores from each dyad member) has several variations (<xref ref-type="bibr" rid="ref27">Lord, 1963</xref>). The formula suggested by Lord assumes uncorrelated error variance, which is likely to be violated in dyads due to the dependency of dyad members on one another. Thus, to illustrate the reliability issue with RSD scores, a formula allowing correlated error variances was used. <xref ref-type="bibr" rid="ref45">Williams and Zimmerman&#x2019;s (1977)</xref> formula was used in a pre-test post-test design context, but it can be interpreted in the dyadic discrepancy context by thinking of <italic>X</italic> and <italic>Y</italic> as scores from each member of a dyad, respectively. The formula for reliability is shown in <xref ref-type="disp-formula" rid="EQ2">Equation 2</xref>:</p>
<disp-formula id="EQ2">
<label>(2)</label>
<mml:math id="M2">
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">DD</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mtable columnalign="left">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">XX</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msub>
<mml:mtext mathvariant="italic">VarX</mml:mtext>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">YY</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msub>
<mml:mtext mathvariant="italic">VarY</mml:mtext>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>2</mml:mn>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mi mathvariant="italic">XY</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>&#x03C3;</mml:mi>
<mml:mi>X</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>&#x03C3;</mml:mi>
<mml:mi>Y</mml:mi>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mo>+</mml:mo>
<mml:mn>2</mml:mn>
<mml:mi>&#x03C1;</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi>X</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi>Y</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:msub>
<mml:mi>&#x03C3;</mml:mi>
<mml:mi>X</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>&#x03C3;</mml:mi>
<mml:mi>Y</mml:mi>
</mml:msub>
<mml:msqrt>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">XX</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mrow>
<mml:mi mathvariant="italic">YY</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
</mml:msqrt>
</mml:mtd>
</mml:mtr>
</mml:mtable>
<mml:mrow>
<mml:mtext mathvariant="italic">VarX</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext mathvariant="italic">VarY</mml:mtext>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>2</mml:mn>
<mml:msub>
<mml:mi>&#x03C1;</mml:mi>
<mml:mi mathvariant="italic">XY</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>&#x03C3;</mml:mi>
<mml:mi>X</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>&#x03C3;</mml:mi>
<mml:mi>Y</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:math>
</disp-formula>
<p>where <italic>&#x03C1;<sub>DD&#x2019;</sub></italic> is the reliability of RSD, <italic>&#x03C1;<sub>XX&#x2019;</sub></italic> and <italic>&#x03C1;<sub>YY&#x2019;</sub></italic> are the reliabilities of <italic>X</italic> and <italic>Y</italic> (e.g., reliabilities of the raw scores for dyad member <italic>X</italic> and dyad member <italic>Y</italic>, respectively), Var <italic>X</italic> and Var <italic>Y</italic> are the variances of <italic>X</italic> and <italic>Y</italic>, respectively, <italic>&#x03C1;<sub>XY</sub></italic> is the correlation between <italic>X</italic> and <italic>Y</italic>, <italic>&#x03C3;<sub>X</sub></italic> and <italic>&#x03C3;<sub>Y</sub></italic> are the standard deviations of <italic>X</italic> and <italic>Y</italic>, respectively, and <italic>&#x03C1;</italic>(<italic>E<sub>X</sub>, E<sub>Y</sub></italic>) is the correlation between the error variances of <italic>X</italic> and <italic>Y</italic>. As demonstrated in this formula, anything that makes the numerator larger in the formula above increases the reliability of RSD, thus mitigating the reliability issue of RSD and making RSD a viable option for discrepancy estimation. These include higher reliabilities of <italic>X</italic> and <italic>Y</italic> and smaller correlation between <italic>X</italic> and <italic>Y</italic>.</p>
<p>Another feature of this formula is that, as long as <italic>&#x03C1;<sub>XY</sub></italic> is positive, the reliability of RSD cannot be greater than the average of the reliabilities of <italic>X</italic> and <italic>Y</italic> (<xref ref-type="bibr" rid="ref9">Chiou and Spreng, 1996</xref>). This is the primary argument against RSD because, in some cases, reliability of RSD is actually lower than the reliabilities of <italic>X</italic> and <italic>Y</italic>, but reliability of RSD is never higher. However, <xref ref-type="bibr" rid="ref46">Zumbo (1999)</xref> argued that because there are situations where the reliability of difference scores is not an issue, RSD should not be ruled out in every instance. Therefore, despite the potential reliability issues, the RSD was evaluated as part of this study. The RSD is expected to have lower reliability in cases where reliability of <italic>X</italic> and <italic>Y</italic> are lower or <italic>X</italic> and <italic>Y</italic> are highly correlated.</p>
</sec>
<sec id="sec5">
<label>1.2.2</label>
<title>Empirical Bayes (EB) estimate from MLM</title>
<p>In dyadic research, MLM can be used to estimate the average intercept and slope across all dyads as well as the within-dyad intercept and slope. In MLM, parameters are estimated using EB estimation instead of the traditional ordinary least squares (OLS) estimation method. The dyad-level slope is one of the parameters estimated in the model described below. The dyad-level slope is the idiographic discrepancy score, which is referred to as EBD in this study.</p>
<p>As described by <xref ref-type="bibr" rid="ref22">Kim et al. (2013)</xref>, the following MLM was used to generate the EBD:</p>
<disp-formula id="EQ3">
<label>(3a)</label>
<mml:math id="M3">
<mml:mtext>Level</mml:mtext>
<mml:mspace width="0.1em"/>
<mml:mn>1</mml:mn>
<mml:mo>:</mml:mo>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mi mathvariant="italic">ij</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:mtext mathvariant="italic">report</mml:mtext>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mi mathvariant="italic">ij</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B5;</mml:mi>
<mml:mi mathvariant="italic">ij</mml:mi>
</mml:msub>
</mml:math>
</disp-formula>
<disp-formula id="EQ4">
<label>(3b)</label>
<mml:math id="M4">
<mml:mtext>with</mml:mtext>
<mml:mspace width="0.1em"/>
<mml:msub>
<mml:mi>&#x03B5;</mml:mi>
<mml:mi mathvariant="italic">ij</mml:mi>
</mml:msub>
<mml:mo>&#x223C;</mml:mo>
<mml:mi>N</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<disp-formula id="EQ5">
<label>(4a)</label>
<mml:math id="M5">
<mml:mtext>Level</mml:mtext>
<mml:mspace width="0.1em"/>
<mml:mn>2</mml:mn>
<mml:mo>:</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B3;</mml:mi>
<mml:mn>00</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</disp-formula>
<disp-formula id="EQ6">
<label>(4b)</label>
<mml:math id="M6">
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B3;</mml:mi>
<mml:mn>10</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</disp-formula>
<disp-formula id="EQ7">
<label>(4c)</label>
<mml:math id="M7">
<mml:mtext>with</mml:mtext>
<mml:mspace width="0.1em"/>
<mml:mo stretchy="true">[</mml:mo>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo>&#x223C;</mml:mo>
<mml:mi mathvariant="italic">MVN</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mo stretchy="true">[</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo>,</mml:mo>
<mml:mo stretchy="true">[</mml:mo>
<mml:msub>
<mml:mi>&#x03C4;</mml:mi>
<mml:mn>00</mml:mn>
</mml:msub>
<mml:msub>
<mml:mi>&#x03C4;</mml:mi>
<mml:mn>01</mml:mn>
</mml:msub>
<mml:msub>
<mml:mi>&#x03C4;</mml:mi>
<mml:mn>10</mml:mn>
</mml:msub>
<mml:msub>
<mml:mi>&#x03C4;</mml:mi>
<mml:mn>11</mml:mn>
</mml:msub>
<mml:mo stretchy="true">]</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<disp-formula id="EQ8">
<label>(5)</label>
<mml:math id="M8">
<mml:mtext>Combined model</mml:mtext>
<mml:mo>:</mml:mo>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mi mathvariant="italic">ij</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B3;</mml:mi>
<mml:mn>00</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msup>
<mml:msub>
<mml:mi>&#x03B3;</mml:mi>
<mml:mn>10</mml:mn>
</mml:msub>
<mml:mo>&#x2217;</mml:mo>
</mml:msup>
<mml:mtext mathvariant="italic">repor</mml:mtext>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mi mathvariant="italic">ij</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msup>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2217;</mml:mo>
</mml:msup>
<mml:mtext mathvariant="italic">repor</mml:mtext>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mi mathvariant="italic">ij</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B5;</mml:mi>
<mml:mi mathvariant="italic">ij</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<p><italic>Y<sub>ij</sub></italic> represents the score for each individual <italic>i</italic> within the same dyad <italic>j.</italic> &#x201C;Report&#x201D; is a dichotomous indicator with a value of &#x2212;0.5 if the score is reported by dyad member <italic>A</italic>, and 0.5 if reported by dyad member <italic>B</italic>. <italic>&#x03B2;<sub>0j</sub></italic> is the mean score between <italic>X</italic> and <italic>Y</italic> for each dyad <italic>j</italic>, and <italic>&#x03B2;<sub>1j</sub></italic> is the discrepancy score between <italic>X</italic> and <italic>Y</italic> for each dyad <italic>j</italic>. <italic>&#x03B5;<sub>ij</sub></italic> is the unique effect associated with individual <italic>i</italic> nested within dyad <italic>j</italic> (i.e., measurement error). <italic>&#x03B3;</italic><sub>00</sub> is the mean score across all dyads, and <italic>&#x03B3;</italic><sub>10</sub> is the mean discrepancy score across all dyads. <italic>u<sub>0j</sub></italic> is the unique effect of dyad <italic>j</italic> on the mean score, and <italic>u<sub>1j</sub></italic> is the unique effect of dyad <italic>j</italic> on the mean discrepancy score.</p>
<p>This random-coefficient model was fitted using the EB estimation procedure (<xref ref-type="bibr" rid="ref35">Raudenbush and Bryk, 2002</xref>). The EB estimates of <italic>&#x03B2;</italic><sub>1j</sub> (i.e., discrepancy in each dyad, or EBD) of the model were saved.</p>
<p>The model requires input of measurement error for the observed scores from each dyad member in order to sufficiently identify the model (<xref ref-type="bibr" rid="ref7">Cano et al., 2005</xref>). The formula used to calculate measurement error (i.e., <italic>r<sub>ij</sub></italic>) is given in <xref ref-type="disp-formula" rid="EQ9">Equation 6</xref>:</p>
<disp-formula id="EQ9">
<label>(6)</label>
<mml:math id="M9">
<mml:mi mathvariant="italic">ME</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x03B1;</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2217;</mml:mo>
<mml:msup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:math>
</disp-formula>
<p>where <italic>&#x03B1;</italic> is the reliability of the measure, and <italic>&#x03C3;<sup>2</sup></italic> is the variance of all scores within dyads.</p>
<p>The EBD may be a better estimate of discrepancy. EB estimates are also known as &#x201C;shrinkage&#x201D; estimates (<xref ref-type="bibr" rid="ref35">Raudenbush and Bryk, 2002</xref>). The equation for the EB estimate is:</p>
<disp-formula id="EQ10">
<label>(7)</label>
<mml:math id="M10">
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>&#x03B2;</mml:mi>
<mml:mo stretchy="true">&#x0302;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mi mathvariant="italic">EB</mml:mi>
</mml:msubsup>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03BB;</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>&#x03B2;</mml:mi>
<mml:mo stretchy="true">&#x0302;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mi mathvariant="italic">OLS</mml:mi>
</mml:msubsup>
<mml:mo>+</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03BB;</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:msub>
<mml:mi>&#x03B3;</mml:mi>
<mml:mn>10</mml:mn>
</mml:msub>
</mml:math>
</disp-formula>
<p>where <italic>&#x03BB;<sub>j</sub></italic> is the reliability of the OLS estimate, and <italic>&#x03B3;</italic><sub>10</sub> is the overall slope across all dyads. The EB estimate is shrunken based on the reliability of the OLS estimate (<italic>&#x03BB;<sub>j</sub></italic>) which is defined in <xref ref-type="disp-formula" rid="EQ11">Equation 8</xref>:</p>
<disp-formula id="EQ11">
<label>(8)</label>
<mml:math id="M11">
<mml:msub>
<mml:mi>&#x03BB;</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi mathvariant="italic">Var</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>&#x03B2;</mml:mi>
<mml:mo stretchy="true">&#x0302;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mi mathvariant="italic">OLS</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">Var</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>&#x03B2;</mml:mi>
<mml:mo stretchy="true">&#x0302;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mi mathvariant="italic">OLS</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>/</mml:mo>
<mml:msub>
<mml:mi>n</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M12">
<mml:mi mathvariant="italic">Var</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>&#x03B2;</mml:mi>
<mml:mo stretchy="true">&#x0302;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mi mathvariant="italic">OLS</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> represents the variance of the OLS estimates and <italic>n<sub>j</sub></italic>&#x202F;=&#x202F;2 in a dyad. Reliability increases as the variance of the OLS estimates increases, the level-1 residual variance decreases, or <italic>n<sub>j</sub></italic> increases.</p>
<p>The OLS estimate is weighted by reliability, and therefore counts less toward the EB estimate as reliability decreases. Meanwhile, the overall slope (<italic>&#x03B3;</italic><sub>10</sub>) is weighted by one minus the reliability, such that as reliability decreases, the overall slope is weighted more. Including both the OLS estimate and the overall slope, adjusted for reliability, results in an optimal weighted combination of the two (<xref ref-type="bibr" rid="ref35">Raudenbush and Bryk, 2002</xref>). Another way of viewing the EB estimate is as a &#x201C;composite of the sample slope estimate (<italic>&#x03B3;</italic><sub>10</sub>) and the predicted value of individual&#x2019;s slope estimate <inline-formula>
<mml:math id="M13">
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>&#x03B2;</mml:mi>
<mml:mo stretchy="true">&#x0302;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mi mathvariant="italic">OLS</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>&#x201D; (<xref ref-type="bibr" rid="ref40">Stage, 2001</xref>, p. 92).</p>
<p>When reliability estimates are low, as is the case with small cluster sizes such as dyads, the EB &#x201C;borrow strength from all of the information&#x2026;in the entire dataset to improve the estimates for dyad discrepancy scores&#x201D; (<xref ref-type="bibr" rid="ref22">Kim et al., 2013</xref>, p. 905). In addition, variance in the scores is divided into two parts: (a) variance associated with dyads; and (b) variance associated with individual members in the dyads (i.e., measurement error variance) (<xref ref-type="bibr" rid="ref22">Kim et al., 2013</xref>). The discrepancy estimates have measurement error partialed out and may be a more accurate estimate of the discrepancy.</p>
<p>On the other hand, a drawback of EB estimates is that they may &#x201C;over-shrink&#x201D; the estimates of random coefficients when cluster size is very small and lead to under-estimates of the posterior variance of the random coefficients (<xref ref-type="bibr" rid="ref34">Raudenbush, 2008</xref>). As a result, when EB estimates are used as predictors in a regression analysis, their raw regression coefficients and standard error estimates might be inaccurate, especially when the variance of EB estimates differ significantly from that of the true discrepancies.</p>
</sec>
<sec id="sec6">
<label>1.2.3</label>
<title>SEM discrepancy</title>
<p>SEM can be used to estimate discrepancy by fitting the model shown in <xref ref-type="fig" rid="fig1">Figure 1</xref>, which is based on <xref ref-type="bibr" rid="ref33">Newsom (2002)</xref>. In the SEM discrepancy model, the latent intercept and slope predict the individual scores of each dyad member. Paths from the slope to individual scores are fixed to 0.5 and &#x2212;0.5, so that intercept reflects the average score of both dyad members. The paths from intercept to individual scores are fixed to 1. The SEM dyadic discrepancy is indicated by the latent slope in <xref ref-type="fig" rid="fig1">Figure 1</xref>. Fitting this model using SEM would typically result in a single estimate for the latent slope that represents all dyads. However, it is possible to specify options in some software packages (such as PROC SCORE in SAS, or SAVEDATA in Mplus) that would save idiographic estimates of the latent slope. These individual estimates of the latent slope serve as the discrepancy estimates. One primary benefit of using SEM is the model&#x2019;s flexibility, such as the ability to incorporate correlated measurement errors into the model (<xref ref-type="bibr" rid="ref33">Newsom, 2002</xref>).</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>SEM path diagram for predicting an outcome with discrepancy score based on <xref ref-type="bibr" rid="ref33">Newsom (2002)</xref>.</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g001.tif"/>
</fig>
</sec>
<sec id="sec7">
<label>1.2.4</label>
<title>Other discrepancy estimation methods not included in the present study</title>
<p>Two other methods found in discrepancy research were excluded from this study. One was the standardized score difference, notated as difference in z (DIZ). To calculate DIZ, each dyad member&#x2019;s score is converted to a z score, and one member&#x2019;s score is subtracted from the other (<xref ref-type="bibr" rid="ref15">De Los Reyes and Kazdin, 2004</xref>). However, the standardization of scores prior to computing a discrepancy changes the interpretation of the discrepancy (<xref ref-type="bibr" rid="ref17">Guion et al., 2009</xref>). Compared with the RSD method, a DIZ score of 0 does not mean perfect agreement between dyads, but rather that both dyad members have average scores within their respective distributions.</p>
<p>The second method excluded from this study was the OLS residual method (abbreviated as &#x201C;RES&#x201D; to indicate residual). RES involves using one member&#x2019;s rating to predict the other&#x2019;s in a linear regression, and outputting the residual for each dyad to serve as a discrepancy (<xref ref-type="bibr" rid="ref15">De Los Reyes and Kazdin, 2004</xref>). This score is typically standardized into a z score before use. The RES score is affected by the correlation between dyad members&#x2019; scores (<xref ref-type="bibr" rid="ref15">De Los Reyes and Kazdin, 2004</xref>). Say for example dyad member Y&#x2019;s score is predicted by dyad member X&#x2019;s score in a linear regression, and the standardized residual (RES) is output. The correlation between the independent variable X and RES is always 0. Larger correlations between dyad members X and Y mean weaker relationships between the Y and RES, while smaller correlations between X and Y mean stronger relationships between the Y and RES. This is true because, the more variance in Y explained by X, the less variance there is left unexplained (i.e., the variance of residual), and the less Y is related to that residual. When there is not much variance in Y explained by X, there is a lot of Y-related variance leftover.</p>
</sec>
</sec>
<sec id="sec8">
<label>1.3</label>
<title>Possible factors influencing discrepancy estimation</title>
<p>As discussed above, this study includes three methods of estimating dyadic discrepancy. In addition there are several data characteristics (i.e., design factors) which may impact the estimation of dyadic discrepancy. Based on review of applied and methodological research, these include ICC, cluster number (number of dyads), reliability of measurement, and effect size and effect size variance of the discrepancy. Each of these is discussed in more detail in this section.</p>
<sec id="sec9">
<label>1.3.1</label>
<title>Intraclass correlation</title>
<p>Nonindependence is a key consideration in dyadic data. Nonindependence means that the scores from two dyad members may share similarity more than scores from people not within the same dyad. Thus, the scores violate the assumption of independence of observations under the general linear model framework. The degree of nonindependence may impact the estimation of dyadic discrepancy. Ignoring the nonindependence of observations and analyzing data as though they are independent has implications for the accuracy of standard error estimates (<xref ref-type="bibr" rid="ref8">Chen et al., 2010</xref>). The standard errors for predictors at the ignored level may be underestimated, inflating the Type I error rate. Conversely, the standard error of a predictor below the ignored level may be overestimated, reducing the statistical power of the analysis (<xref ref-type="bibr" rid="ref28">Luo and Kwok, 2009</xref>; <xref ref-type="bibr" rid="ref32">Moerbeek, 2004</xref>).</p>
<p>There are several methods for measuring nonindependence. The unconditional ICC can be used to measure nonindependence. The unconditional ICC is computed as shown in <xref ref-type="disp-formula" rid="EQ12">Equation 9</xref> (<xref ref-type="bibr" rid="ref35">Raudenbush and Bryk, 2002</xref>):</p>
<disp-formula id="EQ12">
<label>(9)</label>
<mml:math id="M14">
<mml:mi>&#x03C1;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:msub>
<mml:mi>&#x03C4;</mml:mi>
<mml:mn>00</mml:mn>
</mml:msub>
<mml:mrow>
<mml:msup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03C4;</mml:mi>
<mml:mn>00</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:math>
</disp-formula>
<p>where <italic>&#x03C4;</italic><sub>00</sub> is the variance between dyads (i.e., how much the average of the two scores within the dyad varies among dyads) and <italic>&#x03C3;<sup>2</sup></italic> is the variance within dyads. ICC is interpreted as the proportion of variance in the individual scores that is between dyads. In other words, it is how much of the variance in level-1 scores is explained at the dyad level. Higher values of ICC indicate a stronger clustering effect, or a higher level of nonindependence. In addition to <italic>unconditional ICC</italic>, there is also the <italic>conditional ICC</italic>, which is computed after predictors are included in the HLM model (<xref ref-type="bibr" rid="ref35">Raudenbush and Bryk, 2002</xref>).</p>
<p>The level of nonindependence has shown varying impacts in studies. One study revealed no effect of ICC on parameter estimates in a multilevel model with one predictor at level one and one predictor at level two (<xref ref-type="bibr" rid="ref29">Maas and Hox, 2005</xref>). Low ICC may help overcome small cluster numbers, resulting in more accurate parameter and standard error estimates (<xref ref-type="bibr" rid="ref29">Maas and Hox, 2005</xref>). Another study revealed underestimated standard errors when ICC was higher (<xref ref-type="bibr" rid="ref23">Krull and MacKinnon, 2001</xref>). Low ICC is expected to result in more accurate discrepancy estimation in the current study according to the reliability equation from <xref ref-type="bibr" rid="ref45">Williams and Zimmerman (1977)</xref>.</p>
</sec>
<sec id="sec10">
<label>1.3.2</label>
<title>Cluster number</title>
<p>Cluster number, or the number of dyads, varies widely in applied research and has been shown to impact the accuracy of parameter estimation (<xref ref-type="bibr" rid="ref29">Maas and Hox, 2005</xref>) and the power for detecting statistical significance (<xref ref-type="bibr" rid="ref8">Chen et al., 2010</xref>). While fixed effects are consistently accurate despite cluster number, standard error estimates are typically biased when cluster number is less than 100 (<xref ref-type="bibr" rid="ref10">Clarke and Wheaton, 2007</xref>; <xref ref-type="bibr" rid="ref29">Maas and Hox, 2005</xref>). Standard error estimates typically improve as cluster number increases (<xref ref-type="bibr" rid="ref29">Maas and Hox, 2005</xref>).</p>
</sec>
<sec id="sec11">
<label>1.3.3</label>
<title>Reliability</title>
<p>Reliability, as a design factor, is operationalized in this study as variance of scores among a group of dyad members in a sample, i.e., the variance of all <italic>X</italic> raw scores from dyad member A, compared with the variance of true scores. Increased reliability is expected to result in more accurate parameter estimates.</p>
</sec>
<sec id="sec12">
<label>1.3.4</label>
<title>Effect size and effect size variance of discrepancy</title>
<p>The size of the discrepancy between dyad members, and the variation of effect size among dyads, may also impact its estimation. In a previous study about dyadic discrepancy estimation, accuracy of EBD estimates was better when effect size was lower (<xref ref-type="bibr" rid="ref30">McEnturff et al., 2013</xref>). Furthermore, when using discrepancy as an independent variable in regression, the accuracy of intercept and slope estimates was better when effect size was higher.</p>
</sec>
</sec>
<sec id="sec13">
<label>1.4</label>
<title>Gaps in current literature</title>
<p>Historically, several studies have examined various approaches and design factors for discrepancy estimation. <xref ref-type="bibr" rid="ref15">De Los Reyes and Kazdin (2004)</xref> compared RSD to two other methods, the standardized score and residual score methods, using one empirical dataset. Although De Los Reyes and Kazdin thought for the purposes of their research that the standardized score method was most appropriate, in their conclusion, they stated, &#x201C;However, there may be other instances in which other measures may be conceptually and methodologically optimal&#x201D; (p. 334). They also noted that, &#x201C;Our goal was to convey that an accumulating body of research cannot be expected to produce consistent results because the measures used among the studies are not interchangeable&#x201D; (p. 334). A thorough analysis of existing discrepancy methods would aid in comparability of results produced in discrepancy research. Furthermore, De Los Reyes and Kazdin used empirical data. As explained later, a statistical simulation has some advantages when comparing various methods of estimation.</p>
<p><xref ref-type="bibr" rid="ref19">Kenny et al. (2006a</xref>, <xref ref-type="bibr" rid="ref20">2006b)</xref> have published substantial amounts of literature about dyadic data. However, they focus on nomothetic approaches. The idiographic measurement of dyadic discrepancy still needs investigation, as noted in their book. It is important to study approaches that work for both idiographic and nomothetic research. Nomothetic research may be more useful in moving theory forward, but idiographic scores have immediate clinical use for understanding how a particular dyad fits within a theory and using that knowledge to guide interventions for the dyad.</p>
<p>More recent research has also illustrated gaps and highlighted the need to further methodologically examine various approaches to discrepancy estimation in dyadic analysis. Although the RSD approach has been historically criticized for its low reliability (<xref ref-type="bibr" rid="ref13">Cronbach and Furby, 1970</xref>), recent researchers have continued to debate its use, both highlighting its problems (<xref ref-type="bibr" rid="ref24">Laird, 2020</xref>) and defending its use in certain contexts (<xref ref-type="bibr" rid="ref6">Campione-Barr et al., 2020</xref>). Furthermore, although the EBD estimation approach using MLM has seen recent use in empirical literature (<xref ref-type="bibr" rid="ref3">Bar-Sella et al., 2023</xref>), there has been little-to-no recent methodological research examining this approach. Lastly, although SEM-based discrepancy estimation methods see continued use in both empirical (<xref ref-type="bibr" rid="ref2">Barooj-Kiakalaee et al., 2022</xref>) and methodological (<xref ref-type="bibr" rid="ref37">Sakaluk et al., 2025</xref>) literature, little simulation work has been conducted recently comparing this estimation approach with other competing approaches. Overall, these various gaps demonstrate the need to examine and compare these types of approaches to discrepancy estimation in dyadic analysis.</p>
<p>Finally, the importance of discrepancy estimation stems from the high-stakes topics studied using dyadic data, including topics related to family functioning, adolescent adjustment, and end-of-life-care. Dyads are the building blocks of interpersonal relationships, and better understanding of dyads can lead to stronger theories to support the well-being of individuals and families.</p>
</sec>
<sec id="sec14">
<label>1.5</label>
<title>Purpose of the current study</title>
<p>Given the potential implications of inaccurate discrepancy estimation, and the lack of research comparing the methods, the following questions are addressed with this study. First, of RSD, EBD, and SEM, which method generates the most accurate estimate of discrepancy? Second, of the three methods, which allows the most accurate prediction of an outcome? Finally, what is the impact of the design factors ICC, cluster number, reliability, effect size, and effect size variance on the accuracy of estimates and prediction?</p>
</sec>
</sec>
<sec sec-type="methods" id="sec15">
<label>2</label>
<title>Method</title>
<p>A Monte Carlo simulation study was conducted, in which the true scores are generated first, then error added in order to create observed scores. Once the analysis was conducted on the observed scores, the results could be compared to the true scores to assess the performance of the statistic. This will further the work of De Los Reyes and Kazdin, whose empirical study did not allow the comparison to the true score.</p>
<sec id="sec16">
<label>2.1</label>
<title>Design factors</title>
<p>To enhance the external validity of the simulation study results, findings from a past literature review (<xref ref-type="bibr" rid="ref30">McEnturff et al., 2013</xref>) helped set the levels of design factors that are found in real life research involving dyads. In their review, McEnturff et al. evaluated the following literature: <xref ref-type="bibr" rid="ref4">Baumann et al. (2010)</xref>, <xref ref-type="bibr" rid="ref5">Blood et al. (2013)</xref>, <xref ref-type="bibr" rid="ref12">Costigan and Dokis (2006)</xref>, <xref ref-type="bibr" rid="ref14">Crouter et al. (2006)</xref>, <xref ref-type="bibr" rid="ref18">Gulliford et al. (1999)</xref>, <xref ref-type="bibr" rid="ref21">Kim et al. (2009)</xref>, <xref ref-type="bibr" rid="ref25">Lau et al. (2005)</xref>, <xref ref-type="bibr" rid="ref26">Leidy et al. (2009)</xref>, <xref ref-type="bibr" rid="ref31">McHale et al. (2005)</xref>, <xref ref-type="bibr" rid="ref41">Stander et al. (2001)</xref>, and <xref ref-type="bibr" rid="ref44">Wheeler et al. (2010)</xref>. This review led to the following design factors.</p>
<sec id="sec17">
<label>2.1.1</label>
<title>Conditional ICC</title>
<p>To avoid conflation of the unconditional ICC and the standardized average discrepancy within dyads, we manipulated the conditional ICC when &#x201C;report&#x201D; is included in the data generation model depicted in <xref ref-type="disp-formula" rid="EQ3 EQ4 EQ5 EQ6 EQ7 EQ8">Equations 3a&#x2013;5</xref>. The conditional ICC is independent of the discrepancy within dyads (<italic>&#x03B2;</italic><sub>1<italic>j</italic></sub>). From here onward, ICC all refers to &#x201C;conditional ICC.&#x201D;</p>
<p>Data reflected conditional ICC values of 0.1, 0.3, and 0.5 with &#x201C;report&#x201D; as the only predictor. Studies using MLM in complex survey designs have typical ICC values ranging from 0 to 0.3 (<xref ref-type="bibr" rid="ref18">Gulliford et al., 1999</xref>). Research involving dyads has shown ICC values as high as 0.49 (<xref ref-type="bibr" rid="ref5">Blood et al., 2013</xref>).</p>
</sec>
<sec id="sec18">
<label>2.1.2</label>
<title>Cluster number</title>
<p>Data sets with cluster numbers of 50, 150, 250, and 400 were generated. Cluster numbers found in the review ranged from 68 (<xref ref-type="bibr" rid="ref41">Stander et al., 2001</xref>) to 399 (<xref ref-type="bibr" rid="ref21">Kim et al., 2009</xref>). Cluster numbers were distributed throughout that range.</p>
</sec>
<sec id="sec19">
<label>2.1.3</label>
<title>Reliability</title>
<p>For distinguishable dyads, data were generated with both matching, set at 0.7 and 0.8, and mismatched reliabilities of 0.7 for one dyad member and 0.8 for the other. Commonly found levels of reliability in the literature review were similar to the minimum values accepted as adequate in education, ranging from coefficient alpha of 0.67 (<xref ref-type="bibr" rid="ref44">Wheeler et al., 2010</xref>) to 0.96 (<xref ref-type="bibr" rid="ref4">Baumann et al., 2010</xref>).</p>
</sec>
<sec id="sec20">
<label>2.1.4</label>
<title>Effect size of discrepancy</title>
<p>For this study, Cohen&#x2019;s <italic>d</italic> was 0.2, 0.5, and 0.8 to reflect widely used benchmarks for small, medium, and large effects (<xref ref-type="bibr" rid="ref11">Cohen, 1988</xref>). It should be noted that these benchmarks are simply a rule of thumb and should not be the sole factor for evaluating effect size in any study. Effect sizes must be interpreted within the context of the study topic and methods. Effect sizes varied widely in the literature review, from <italic>d</italic>&#x202F;=&#x202F;0.05 to <italic>d</italic>&#x202F;=&#x202F;1.34.</p>
</sec>
<sec id="sec21">
<label>2.1.5</label>
<title>Effect size variance</title>
<p>Variance of discrepancies among dyads was set to 0.5 and 1. Literature reporting the variance of effect sizes was scant.</p>
</sec>
</sec>
<sec id="sec22">
<label>2.2</label>
<title>Data generation</title>
<p>A program was written and executed in SAS 9.4 to generate simulated data across a set of study conditions to examine bias and reliability of discrepancy estimates and their use in prediction. As described in the literature review, design factors included variations on nonindependence (ICC), cluster number, reliability, effect size, and effect size variance. The design factors are summarized in <xref ref-type="table" rid="tab1">Table 1</xref>. A total of 216 simulation conditions were represented, with 1,000 replications generated for each condition, for a total of 216,000 datasets (<xref ref-type="bibr" rid="ref1">Arend and Sch&#x00E4;fer, 2019</xref>). After the data were generated, discrepancy estimates for all three methods (RSD, EBD, and SEM) were computed and used in subsequent evaluation analyses described below. Discrepancy estimates from the EBD and SEM methods were generated using the full-information maximum likelihood (FIML) estimation method. All analyses were conducted in SAS except the computation of SEM, which was computed using MPlus. The MPlus SAVEDATA option enabled the export of factor scores to use as the SEM discrepancy. The syntax for data generation and analysis in SAS and MPlus can be found in <xref ref-type="supplementary-material" rid="SM1">Appendix 1</xref>.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Study conditions.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" colspan="3">ICC</th>
<th align="center" valign="top" colspan="3">Reliability</th>
<th align="center" valign="top" colspan="2">Effect Size</th>
<th align="center" valign="top">Sample</th>
</tr>
<tr>
<th align="left" valign="top">ICC</th>
<th align="center" valign="top">Between Variance</th>
<th align="center" valign="top">Within Variance</th>
<th align="center" valign="top">Reliability</th>
<th align="center" valign="top">Error Variance 1</th>
<th align="center" valign="top">Error Variance 2</th>
<th align="center" valign="top">Effect Size</th>
<th align="center" valign="top">Effect Size Variance</th>
<th align="center" valign="top">
<italic>n</italic>
</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="bottom">0.1</td>
<td align="center" valign="bottom">0.1</td>
<td align="center" valign="bottom">0.9</td>
<td align="center" valign="bottom">0.7</td>
<td align="center" valign="bottom">0.43</td>
<td align="center" valign="bottom">0.43</td>
<td align="center" valign="bottom">0.2</td>
<td align="center" valign="bottom">0.5</td>
<td align="center" valign="bottom">50</td>
</tr>
<tr>
<td align="left" valign="bottom">0.3</td>
<td align="center" valign="bottom">0.3</td>
<td align="center" valign="bottom">0.7</td>
<td align="center" valign="bottom">0.8</td>
<td align="center" valign="bottom">0.25</td>
<td align="center" valign="bottom">0.25</td>
<td align="center" valign="bottom">0.5</td>
<td align="center" valign="bottom">1</td>
<td align="center" valign="bottom">150</td>
</tr>
<tr>
<td align="left" valign="bottom">0.5</td>
<td align="center" valign="bottom">0.5</td>
<td align="center" valign="bottom">0.5</td>
<td align="center" valign="bottom">0.7 / 0.8</td>
<td align="center" valign="bottom">0.43</td>
<td align="center" valign="bottom">0.25</td>
<td align="center" valign="bottom">0.8</td>
<td/>
<td align="center" valign="bottom">250</td>
</tr>
<tr>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td align="center" valign="bottom">400</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Data were generated for both indistinguishable and distinguishable dyads. However, the regression models appropriate for indistinguishable and distinguishable dyads are not the same. For indistinguishable dyads, the outcome, <italic>Z</italic>, was generated using arbitrary values for the slope (0.8) and intercept (0.5), as shown in the equation below:</p>
<disp-formula id="EQ13">
<label>(10)</label>
<mml:math id="M15">
<mml:mi>Z</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>.5</mml:mn>
<mml:mo>+</mml:mo>
<mml:mn>.8</mml:mn>
<mml:mo>&#x2223;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mtext>true</mml:mtext>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mtext>true</mml:mtext>
</mml:msub>
<mml:mo>&#x2223;</mml:mo>
<mml:mo>+</mml:mo>
<mml:mtext mathvariant="italic">rannor</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<p>where <italic>X</italic><sub>true</sub> and <italic>Y</italic><sub>true</sub> are the true scores for each dyad member and the absolute value of the difference between these true scores is the discrepancy score.</p>
<p>However, for distinguishable dyads, the direction of the discrepancy is lost when using the absolute value of the discrepancy, such as in the indistinguishable dyad case. For example, in the parent&#x2013;child dyad example, it is useful to know not only how different parents and children are, but which dyad member scores higher or lower on the construct of interest. Therefore, a different regression model must be used for distinguishable dyads.</p>
<p>A solution to this problem is shown in <xref ref-type="disp-formula" rid="EQ14">Equation 11</xref>, related to the method used by <xref ref-type="bibr" rid="ref43">Wang and Benner (2013)</xref>:</p>
<disp-formula id="EQ14">
<label>(11)</label>
<mml:math id="M16">
<mml:mi>Z</mml:mi>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>Y</mml:mi>
<mml:mo>&#x2223;</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mi>W</mml:mi>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>Y</mml:mi>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>W</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>e</mml:mi>
</mml:math>
</disp-formula>
<p>Here, |<italic>X &#x2013; Y</italic>| is the absolute value of the discrepancy, W is a dichotomous indicator of the direction of the discrepancy (equal to 0 if <italic>X&#x202F;&#x003C;&#x202F;Y</italic> and 1 if <italic>X&#x202F;&#x003E;&#x202F;= Y</italic>), and the third predictor is the interaction between them. Following this, the outcome for distinguishable dyads in this study was generated as follows:</p>
<disp-formula id="EQ15">
<label>(12)</label>
<mml:math id="M17">
<mml:mi>Z</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>.5</mml:mn>
<mml:mo>+</mml:mo>
<mml:mn>.8</mml:mn>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>Y</mml:mi>
<mml:mo>&#x2223;</mml:mo>
<mml:mo>+</mml:mo>
<mml:mn>.5</mml:mn>
<mml:mi>W</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>.2</mml:mn>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>Y</mml:mi>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>W</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>e</mml:mi>
</mml:math>
</disp-formula>
</sec>
<sec id="sec23">
<label>2.3</label>
<title>Evaluation of methods</title>
<p>The outcome of interest in this study was the bias of parameters estimated and their standard errors. The various values that were used to evaluate the discrepancy estimation methods are described in this section. <xref ref-type="table" rid="tab2">Table 2</xref> includes the equations used to compute the evaluation measures.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Equations for evaluating methods for dyadic discrepancy.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Measure</th>
<th align="center" valign="top">Equation</th>
<th align="left" valign="top">Description</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Absolute bias (AB) for discrepancy estimates and parameter estimates</td>
<td align="center" valign="top">
<inline-formula>
<mml:math id="M18">
<mml:mi mathvariant="italic">AB</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo>&#x2223;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>&#x03B8;</mml:mi>
<mml:mo stretchy="true">&#x0302;</mml:mo>
</mml:mover>
<mml:mi mathvariant="italic">est</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mi mathvariant="italic">pop</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2223;</mml:mo>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top"><inline-formula>
<mml:math id="M19">
<mml:msub>
<mml:mover accent="true">
<mml:mi>&#x03B8;</mml:mi>
<mml:mo stretchy="true">&#x0302;</mml:mo>
</mml:mover>
<mml:mi mathvariant="italic">est</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is the mean of the estimated discrepancy score across the replications and <inline-formula>
<mml:math id="M20">
<mml:msub>
<mml:mi>&#x03B8;</mml:mi>
<mml:mi mathvariant="italic">pop</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is the true parameter value (i.e., true discrepancy score).</td>
</tr>
<tr>
<td align="left" valign="top">Reliability of discrepancy estimates</td>
<td align="center" valign="top">
<inline-formula>
<mml:math id="M21">
<mml:mfrac>
<mml:msubsup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mtext mathvariant="italic">true</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:msubsup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mi mathvariant="italic">est</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mfrac>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top"><inline-formula>
<mml:math id="M22">
<mml:msubsup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mtext mathvariant="italic">true</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:math>
</inline-formula> is the variance of the true discrepancy scores, and <inline-formula>
<mml:math id="M23">
<mml:msubsup>
<mml:mi>&#x03C3;</mml:mi>
<mml:mi mathvariant="italic">est</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:math>
</inline-formula> is the variance of the discrepancy estimates.</td>
</tr>
<tr>
<td align="left" valign="top">AB for standard errors</td>
<td align="center" valign="top">
<inline-formula>
<mml:math id="M24">
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi mathvariant="italic">est</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext mathvariant="italic">Mean</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mi mathvariant="italic">est</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top"><inline-formula>
<mml:math id="M25">
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi mathvariant="italic">est</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is the standard error of the estimate, and <inline-formula>
<mml:math id="M26">
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mi mathvariant="italic">est</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is the standard deviation of the corresponding parameter estimates across the 1,000 iterations of each simulation condition.</td>
</tr>
<tr>
<td align="left" valign="top">Power for the slope estimate in prediction</td>
<td align="left" valign="top">
<inline-formula>
<mml:math id="M27">
<mml:mfrac>
<mml:mrow>
<mml:mtext mathvariant="italic">Number of estimates with</mml:mtext>
<mml:mspace width="0.25em"/>
<mml:mi>p</mml:mi>
<mml:mo>&#x003C;</mml:mo>
<mml:mn>.05</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mtext mathvariant="italic">Total number of estimates</mml:mtext>
<mml:mspace width="0.25em"/>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1000</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top">The proportion of statistically significant estimates out of the total number of estimates per condition</td>
</tr>
<tr>
<td align="left" valign="top">AB for <italic>R<sup>2</sup></italic> estimate</td>
<td align="center" valign="top">
<inline-formula>
<mml:math id="M28">
<mml:msubsup>
<mml:mi>R</mml:mi>
<mml:mi mathvariant="italic">est</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext mathvariant="italic">Mean</mml:mtext>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mi>R</mml:mi>
<mml:mtext mathvariant="italic">true</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>
</td>
<td align="left" valign="top"><inline-formula>
<mml:math id="M29">
<mml:msubsup>
<mml:mi>R</mml:mi>
<mml:mi mathvariant="italic">est</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:math>
</inline-formula> is the proportion of variance explained in the outcome by the discrepancy estimate, and <inline-formula>
<mml:math id="M30">
<mml:msubsup>
<mml:mi>R</mml:mi>
<mml:mtext mathvariant="italic">true</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:math>
</inline-formula> is the proportion of variance explained in the outcome by the true discrepancy scores</td>
</tr>
</tbody>
</table>
</table-wrap>
<sec id="sec24">
<label>2.3.1</label>
<title>Bias of discrepancy estimate</title>
<p>First, estimated discrepancy scores were compared to the true discrepancy score to determine accuracy of the discrepancy estimate. To assess accuracy, the absolute bias (AB) for the estimated discrepancy score was calculated as the difference between the true score and the estimate.</p>
<p>AB equal to zero indicated an unbiased estimate of the parameter. A negative AB indicated an underestimation of the parameter (i.e., the estimated value was smaller than the true parameter value), whereas a positive AB indicated an overestimation of the parameter (i.e., the estimated value was larger than the true parameter value).</p>
</sec>
<sec id="sec25">
<label>2.3.2</label>
<title>Reliability of estimates</title>
<p>Reliability of discrepancy estimates was calculated by dividing the variance of the true discrepancy scores by the variance of the discrepancy estimates, as shown in the reliability equation in <xref ref-type="table" rid="tab2">Table 2</xref>. Reliability is normally thought of as ranging from zero to one because the variance of observed scores is normally greater than the variance of true scores. However, because of the EBD shrinkage effect described in <xref ref-type="disp-formula" rid="EQ10">Equation 7</xref>, the variance of EBD estimates was sometimes less than the variance of true discrepancy scores. This resulted in reliability estimates greater than one. Therefore, in this study, an estimate is most reliable when its reliability is closest to one, indicating that the variance of true scores is equal to variance of estimates. Distance from one, whether in the positive or negative direction, indicated deviance from perfect reliability. Reliability less than one happened when the discrepancy estimate was more variable than the true discrepancy score. Reliability greater than one happened when the discrepancy estimate was less variable than the true discrepancy score.</p>
</sec>
<sec id="sec26">
<label>2.3.3</label>
<title>Predictive power</title>
<p>Although the accuracy of discrepancy estimates is interesting on its own, in practice, it is useful to understand how the estimated discrepancy impacts an outcome. For example, in addition to studying the amount of discrepancy in marital satisfaction, a researcher may also be interested in how the discrepancy predicts an outcome like depression. In this simulation, the discrepancy estimates were used in a regression analysis to predict an outcome. The accuracy of prediction and hypothesis testing was evaluated.</p>
<p>A previously stated, the regression models appropriate for indistinguishable and distinguishable dyads are not the same (see <xref ref-type="disp-formula" rid="EQ13 EQ15">Equations 10, 12</xref>, respectively), and this impacts the calculation of discrepancy values. For indistinguishable dyads, only the amount of discrepancy matters, because the direction of discrepancy is arbitrary depending on which dyad member is assigned as <italic>A</italic> and which is assigned as <italic>B</italic>. In this scenario, the absolute value of the discrepancy score can be used as the independent variable in the regression (see <xref ref-type="disp-formula" rid="EQ13">Equation 10</xref>). Following this, the absolute value of discrepancy estimates (RSD-AV, EBD-AV, and SEM-AV) were each used independently to predict the outcome, and the resulting parameter estimates (i.e., estimated slopes and their standard errors) were assessed for bias.</p>
<p>As previously mentioned regarding distinguishable dyads, the direction of the discrepancy is lost when using the absolute value of the discrepancy as an independent variable, as with the indistinguishable dyad case. Therefore, using the distinguishable dyad equation (<xref ref-type="disp-formula" rid="EQ15">Equation 12</xref>), the absolute value of discrepancy estimates (RSD-AV, EBD-AV, and SEM-AV), together with W which indicated the direction of the discrepancy, were each used independently to predict the outcome, and the parameter estimates were assessed for bias.</p>
</sec>
<sec id="sec27">
<label>2.3.4</label>
<title>Bias, power, and coverage rates for parameter estimates and standard errors</title>
<p>Bias of parameter estimates demonstrated how accurate discrepancy estimates from each of the three methods predicted the simulated outcome. First, the bias for the parameter estimates (intercept and slopes) and their standard errors were computed as described in the bias equations for parameters and standard errors in <xref ref-type="table" rid="tab2">Table 2</xref>. The bias for standard errors equation in <xref ref-type="table" rid="tab2">Table 2</xref> shows that because there is no true score standard error to use in the bias calculation, standard error estimates were compared to the standard deviation of all estimates within each simulation condition.</p>
<p>Additionally, the power for the slope estimates was computed as the proportion of statistically significant estimates out of the total number of estimates (see <xref ref-type="table" rid="tab2">Table 2</xref>). The coverage rate was computed as the proportion of cases where the true value of the slope is found within the confidence interval for the slope. Higher coverage rates indicate better estimates of the regression parameters.</p>
<p>Secondly, the accuracy of the <italic>R<sup>2</sup></italic> estimate was examined by computing the bias, compared with the <italic>R<sup>2</sup></italic> obtained in the true score regression model. The equation is shown in <xref ref-type="table" rid="tab2">Table 2</xref>.</p>
</sec>
<sec id="sec28">
<label>2.3.5</label>
<title>Impact of design factors on outcomes</title>
<p>Finally, analysis of variance (ANOVA) was used to determine which estimates were most influenced by manipulations of design factors. The corresponding effect sizes (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;SS<sub>effect</sub>/SS<sub>total</sub>) were used to determine the contribution of the five design factors (ICC, cluster number, reliability, effect size, and effect size variance) and method (RSD, EBD, and SEM) to the accuracy of the discrepancy estimation. Post-hoc ANOVAs predicting bias of discrepancy estimation with the five design factors were conducted separately for each of the three methods (RSD, EBD, and SEM), rather than using method as an independent variable, which aided in the interpretation of the impact of design factors on bias of estimates from each method.</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="sec29">
<label>3</label>
<title>Results</title>
<p><xref ref-type="table" rid="tab3">Table 3</xref> includes the means and standard deviations of estimates. <xref ref-type="table" rid="tab3">Table 3</xref> shows on average how the three methods compared on all evaluation measures. For example, the first row of <xref ref-type="table" rid="tab3">Table 3</xref> shows that average bias of discrepancy estimates was zero for all three methods. <xref ref-type="table" rid="tab4">Table 4</xref> shows the effect sizes (<italic>&#x03B7;</italic><sup>2</sup>) for all six-way ANOVAs measuring the impact of the design factors (method, reliability, ICC, cluster number, effect size, and effect size variance) and all two-way interactions on the measures of accuracy for the three estimation methods. <xref ref-type="table" rid="tab4">Table 4</xref> is important for understanding which measures were substantially impacted by variation in study conditions. <xref ref-type="table" rid="tab5">Table 5</xref> includes effect sizes (<italic>&#x03B7;</italic><sup>2</sup>) for post-hoc five-way ANOVAs measuring the impact of the design factors (reliability, ICC, cluster number, effect size, and effect size variance) and all two-way interactions on the measures of accuracy for the three estimation methods individually. In <xref ref-type="table" rid="tab4">Tables 4</xref>, <xref ref-type="table" rid="tab5">5</xref>, only effect sizes at least 0.01 are shown in the table, and only medium and large effects of 0.06 or greater (per <xref ref-type="bibr" rid="ref11">Cohen, 1988</xref>) are interpreted and discussed.</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Mean (standard deviation) of bias, reliability, and discrepancy as predictor estimates.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th>Estimate</th>
<th>Estimate property</th>
<th align="center" valign="top">RSD</th>
<th align="center" valign="top">EBD</th>
<th align="center" valign="top">SEM</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Accuracy of discrepancy</td>
<td align="left" valign="top">Absolute bias (AB) of discrepancy</td>
<td align="center" valign="top">0.00 (0.06)</td>
<td align="center" valign="top">0.00 (0.06)</td>
<td align="center" valign="top">0.00 (0.13)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Reliability of discrepancy</td>
<td align="center" valign="top">0.51 (0.06)</td>
<td align="center" valign="top">2.29 (63.70)</td>
<td align="center" valign="top">0.53 (0.06)</td>
</tr>
<tr>
<td align="left" valign="top">Discrepancy as predictor</td>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top">Discrepancy slope</td>
<td align="left" valign="top">AB of estimate</td>
<td align="center" valign="top">&#x2212;0.26 (0.11)</td>
<td align="center" valign="top">0.22 (0.43)</td>
<td align="center" valign="top">&#x2212;0.25 (0.12)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">AB of standard error</td>
<td align="center" valign="top">0.00 (0.02)</td>
<td align="center" valign="top">&#x2212;0.07 (0.28)</td>
<td align="center" valign="top">0.00 (0.02)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Power of estimate</td>
<td align="center" valign="top">0.96 (0.20)</td>
<td align="center" valign="top">0.95 (0.22)</td>
<td align="center" valign="top">0.96 (0.20)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Coverage rate of estimate</td>
<td align="center" valign="top">0.91 (0.29)</td>
<td align="center" valign="top">0.24 (0.43)</td>
<td align="center" valign="top">0.89 (0.31)</td>
</tr>
<tr>
<td align="left" valign="top">Direction slope</td>
<td align="left" valign="top">AB of estimate</td>
<td align="center" valign="top">&#x2212;0.29 (0.32)</td>
<td align="center" valign="top">&#x2212;0.29 (0.38)</td>
<td align="center" valign="top">&#x2212;0.29 (0.35)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">AB of standard error</td>
<td align="center" valign="top">0.00 (0.04)</td>
<td align="center" valign="top">&#x2212;0.03 (0.12)</td>
<td align="center" valign="top">&#x2212;0.02 (0.04)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Power of estimate</td>
<td align="center" valign="top">0.14 (0.35)</td>
<td align="center" valign="top">0.16 (0.36)</td>
<td align="center" valign="top">0.16 (0.37)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Coverage rate of estimate</td>
<td align="center" valign="top">0.77 (0.42)</td>
<td align="center" valign="top">0.75 (0.43)</td>
<td align="center" valign="top">1.00 (0.00)</td>
</tr>
<tr>
<td align="left" valign="top">Discrepancy by direction interaction slope</td>
<td align="left" valign="top">AB of estimate</td>
<td align="center" valign="top">&#x2212;0.13 (0.16)</td>
<td align="center" valign="top">&#x2212;0.08 (0.58)</td>
<td align="center" valign="top">&#x2212;0.13 (0.16)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">AB of standard error</td>
<td align="center" valign="top">0.00 (0.02)</td>
<td align="center" valign="top">&#x2212;0.07 (0.41)</td>
<td align="center" valign="top">0.00 (0.02)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Power of estimate</td>
<td align="center" valign="top">0.09 (0.29)</td>
<td align="center" valign="top">0.09 (0.29)</td>
<td align="center" valign="top">0.10 (0.29)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Coverage rate of estimate</td>
<td align="center" valign="top">0.18 (0.39)</td>
<td align="center" valign="top">0.58 (0.49)</td>
<td align="center" valign="top">0.19 (0.40)</td>
</tr>
<tr>
<td align="left" valign="top">R-squared</td>
<td align="left" valign="top">AB of estimate</td>
<td align="center" valign="top">&#x2212;0.04 (0.03)</td>
<td align="center" valign="top">&#x2212;0.05 (0.04)</td>
<td align="center" valign="top">&#x2212;0.04 (0.03)</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Power of estimate</td>
<td align="center" valign="top">0.99 (0.09)</td>
<td align="center" valign="top">0.98 (0.13)</td>
<td align="center" valign="top">0.99 (0.09)</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Summary of <italic>&#x03B7;</italic><sup>2</sup> for the six-way ANOVA main and first-order interaction effects (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;&#x2265;&#x202F;0.01).</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th align="center" valign="top" colspan="2">Discrepancy</th>
<th align="center" valign="top" colspan="2">Slope&#x2014;discrepancy</th>
<th align="center" valign="top" colspan="2">Slope&#x2014;direction</th>
<th align="center" valign="top" colspan="2">Slope&#x2014;discrepancy &#x002A; direction interaction</th>
<th align="center" valign="top">
<italic>R</italic>
<sup>2</sup>
</th>
</tr>
<tr>
<th/>
<th align="center" valign="top">Estimate bias</th>
<th align="center" valign="top">Reliability of estimate</th>
<th align="center" valign="top">Estimate bias</th>
<th align="center" valign="top">Standard error bias</th>
<th align="center" valign="top">Estimate bias</th>
<th align="center" valign="top">Standard error bias</th>
<th align="center" valign="top">Estimate bias</th>
<th align="center" valign="top">Standard error bias</th>
<th align="center" valign="top">Estimate bias</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Method</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.42</td>
<td align="center" valign="top">0.05</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.04</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">0.69</td>
</tr>
<tr>
<td align="left" valign="top">N</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">ICC</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">Reliability</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">Effect size</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
</tr>
<tr>
<td align="left" valign="top">Effect size variance</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
</tr>
<tr>
<td align="left" valign="top">M&#x002A;N</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.06</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.05</td>
<td align="center" valign="top">0.00</td>
</tr>
<tr>
<td align="left" valign="top">M&#x002A;I</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">0.01</td>
</tr>
<tr>
<td align="left" valign="top">M&#x002A;R</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">M&#x002A;ES</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">M&#x002A;ESV</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">0.01</td>
</tr>
<tr>
<td align="left" valign="top">N&#x002A;I</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">N&#x002A;R</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">N&#x002A;ES</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">N&#x002A;ESV</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">I&#x002A;R</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">I&#x002A;ES</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">I&#x002A;ESV</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">R&#x002A;ES</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">R&#x002A;ESV</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">ES&#x002A;ESV</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Design factors are abbreviated in the table as (a) N&#x202F;=&#x202F;cluster number; (b) M&#x202F;=&#x202F;method; (c) I&#x202F;=&#x202F;ICC; (d) R&#x202F;=&#x202F;reliability; (e) ES&#x202F;=&#x202F;effect size; (f) ESV&#x202F;=&#x202F;effect size variance. Bias refers to the absolute bias (AB) defined in <xref ref-type="table" rid="tab2">Table 2</xref>.</p>
</table-wrap-foot>
</table-wrap>
<table-wrap position="float" id="tab5">
<label>Table 5</label>
<caption>
<p>Summary of <italic>&#x03B7;</italic><sup>2</sup> for the post-hoc five-way ANOVA main and first order interaction effects (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;&#x2265;&#x202F;0.01).</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th align="center" valign="top" colspan="3">Reliability</th>
<th align="center" valign="top" colspan="3">Discrepancy slope bias</th>
<th align="center" valign="top" colspan="3">Discrepancy slope standard error bias</th>
<th align="center" valign="top" colspan="3">Direction slop standard error bias</th>
<th align="center" valign="top" colspan="3">Interaction slope standard error bias</th>
<th align="center" valign="top" colspan="3"><italic>R</italic><sup>2</sup> bias</th>
</tr>
<tr>
<th/>
<th align="center" valign="top">RSD</th>
<th align="center" valign="top">EBD</th>
<th align="center" valign="top">SEM</th>
<th align="center" valign="top">RSD</th>
<th align="center" valign="top">EBD</th>
<th align="center" valign="top">SEM</th>
<th align="center" valign="top">RSD</th>
<th align="center" valign="top">EBD</th>
<th align="center" valign="top">SEM</th>
<th align="center" valign="top">RSD</th>
<th align="center" valign="top">EBD</th>
<th align="center" valign="top">SEM</th>
<th align="center" valign="top">RSD</th>
<th align="center" valign="top">EBD</th>
<th align="center" valign="top">SEM</th>
<th align="center" valign="top">RSD</th>
<th align="center" valign="top">EBD</th>
<th align="center" valign="top">SEM</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">N</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.09</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.05</td>
<td align="center" valign="top">0.06</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.08</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">0.01</td>
</tr>
<tr>
<td align="left" valign="top">ICC</td>
<td align="center" valign="top">0.06</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.04</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.04</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">0.04</td>
<td align="center" valign="top">0.02</td>
</tr>
<tr>
<td align="left" valign="top">Reliability</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">Effect size</td>
<td align="center" valign="top">0.24</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.23</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.05</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">0.04</td>
</tr>
<tr>
<td align="left" valign="top">Effect size variance</td>
<td align="center" valign="top">0.55</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.52</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.11</td>
<td align="center" valign="top">0.05</td>
<td align="center" valign="top">0.07</td>
</tr>
<tr>
<td align="left" valign="top">N&#x002A;I</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.06</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.06</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">N&#x002A;R</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">N&#x002A;ES</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">N&#x002A;ESV</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.03</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">I&#x002A;R</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">I&#x002A;ES</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">I&#x002A;ESV</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.02</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">R&#x002A;ES</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">R&#x002A;ESV</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
<tr>
<td align="left" valign="top">ES&#x002A;ESV</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.01</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Post-hoc ANOVAs were conducted for each method separately to aid in the interpretation of the effects. The dependent variables were discrepancy bias, reliability of discrepancy, three bias slope estimates and their standard errors (discrepancy, direction, and interaction), and R<sup>2</sup> bias. The dependent variables discrepancy bias, direction slope, and interaction slope are excluded from the table because design factors were not substantial predictors (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;&#x2265;&#x202F;0.01) for any of the 3 methods. All other dependent variables are included in columns above. Design factors are abbreviated in the table as (a) N&#x202F;=&#x202F;cluster number; (b) M&#x202F;=&#x202F;method; (c) I&#x202F;=&#x202F;ICC; (d) R&#x202F;=&#x202F;reliability; (e) ES&#x202F;=&#x202F;effect size; (f) ESV&#x202F;=&#x202F;effect size variance.</p>
</table-wrap-foot>
</table-wrap>
<sec id="sec30">
<label>3.1</label>
<title>Bias of discrepancy estimates</title>
<p>The average bias of all three discrepancy estimates was zero. Furthermore, ANOVA results showed no notable effect sizes using method and design factors to explain the bias of discrepancy estimates. In other words, no variations of method or design factors accounted for a significant amount of bias in discrepancy estimates.</p>
</sec>
<sec id="sec31">
<label>3.2</label>
<title>Reliability of discrepancy estimates</title>
<p>As described in the methods, reliability is a measure of the consistency of the discrepancy estimates. Perfect reliability occurred when the variance of discrepancy estimates is equal to the variance of true discrepancy score, resulting in reliability equal to one. Estimates were considered less reliable as reliability values deviated further from one. On average, reliability values of EBD estimates were the furthest from one and therefore the least reliable (reliability&#x202F;=&#x202F;2.29, <italic>&#x03C3;</italic>&#x202F;=&#x202F;63.70). Reliability for RSD (reliability&#x202F;=&#x202F;0.51, <italic>&#x03C3;</italic>&#x202F;=&#x202F;0.06) and SEM (reliability&#x202F;=&#x202F;0.53, <italic>&#x03C3;</italic>&#x202F;=&#x202F;0.06) were better. Furthermore, initial six-way ANOVA results showed no substantial effect sizes using method and design factors to explain the reliability of discrepancy estimates. However, some effects were found using the post-hoc ANOVAs described below.</p>
<p>The six-way ANOVA results showed that reliability was not substantially impacted by method or design factors. Though the means did not substantially differ by method, the box plot in <xref ref-type="fig" rid="fig2">Figure 2</xref> shows the range for EBD is impacted by outliers.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Reliability of discrepancy estimate by method (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;&#x003C;&#x202F;0.001). The minimum and maximum bias are represented by the endpoints of each plot. The upper edge of the box represents the third quartile (75th percentile), and the lower edge of the box represents the first quartile (25th percentile). The median (50th percentile) is represented by the line within the box, and the mean is represented by the diamond within the box.</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g002.tif"/>
</fig>
<sec id="sec32">
<label>3.2.1</label>
<title>Post-hoc ANOVAs by method</title>
<p>Post-hoc ANOVAs were conducted for each method individually. As shown in <xref ref-type="table" rid="tab5">Table 5</xref>, reliability of EBD estimates was not substantially (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;&#x003E;&#x202F;= 0.01) impacted by any design factor. RBD and SEM reliability were each greatly impacted by effect size variance (RSD <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.55 and SEM <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.52) and effect size (RSD <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.24 and SEM <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.23). To a lesser extent, RBD and SEM reliability were impacted by ICC (RSD <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.06 and SEM <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.04). Reliability increased as effect size variance and effect size increased. Reliability decreased as ICC increased. Across all levels of design factors, SEM reliability was greater than RSD. These trends are further illustrated in <xref ref-type="fig" rid="fig3">Figure 3</xref>.</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Reliability of RSD and SEM discrepancy estimate by design factors. Design factors shown are effect size variance (RSD <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.55 and SEM <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.52), effect size (RSD <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.24 and SEM <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.23), and ICC (RSD <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.06 and SEM <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.04). EBD is excluded because <italic>&#x03B7;</italic><sup>2</sup>&#x202F;&#x003C;&#x202F;0.01 for all effects. The minimum and maximum bias are represented by the ends of each plot. The upper edge of the box represents the third quartile (75th percentile), and the lower edge of the box represents the first quartile (25th percentile). The median (50th percentile) is represented by the line within the box, and the mean is represented by the symbol within the box. Outliers are labeled with the O symbol for RSD and the + symbol for SEM.</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g003.tif"/>
</fig>
</sec>
</sec>
<sec id="sec33">
<label>3.3</label>
<title>Predictive power of discrepancy estimates</title>
<p>Simulated regression models were used to evaluate the accuracy of discrepancy estimation methods in predicting an outcome. There were three slope estimates in the regression model: (1) discrepancy slope, which was the slope estimate for the discrepancy; (2) direction slope, which was the slope estimate for the dichotomous indicator of direction of discrepancy (i.e., 0 where the score from dyad member A is greater than the score from dyad member B, and 1 where the score from dyad member A is less than the score from dyad member B), and (3) slope (discrepancy by direction interaction), representing the interaction effect between discrepancy and direction.</p>
<p>Results presented below are for distinguishable dyads. The prediction model for indistinguishable dyads, which only included one discrepancy slope, had similar results as the discrepancy slope for distinguishable dyads, rendering those results redundant. For each of the three slope estimates as well as <italic>R<sup>2</sup></italic> estimates, the results include descriptive statistics for bias, ANOVA results, power, and coverage rate.</p>
<sec id="sec34">
<label>3.3.1</label>
<title>Discrepancy slope estimate and standard error bias</title>
<p>The discrepancy slope estimates, estimating the strength of the relationship between the discrepancy and the outcome, were slightly less biased for EBD (AB&#x202F;=&#x202F;0.22) than RSD (AB&#x202F;=&#x202F;0.26) and SEM (AB&#x202F;=&#x202F;0.25). However, the range of AB for EBD (min AB&#x202F;=&#x202F;&#x2212;27.1, max AB&#x202F;=&#x202F;66.5) was vastly larger that of RSD and SEM, which both ranged about &#x2212;1.4 to &#x2212;0.3. The standard deviation of AB for EBD was 0.43. The large range in conjunction with the relatively reasonable standard deviation indicated that AB of slope estimate (discrepancy) for EBD included extreme outliers (i.e., an outlier exceeding 3&#x002A;interquartile range below the 1st quartile or above the 3rd quartile). The boxplots shown in <xref ref-type="fig" rid="fig4">Figure 4</xref> illustrate the distributions of bias by method. Differences among methods, as shown in <xref ref-type="fig" rid="fig4">Figure 4</xref>, accounted for a substantial amount of variance in bias of discrepancy slope estimate (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.42).</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Absolute bias (AB) of discrepancy slope estimate by method (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.42) and AB of standard error (SE) of discrepancy slope estimate by method (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.05). The minimum and maximum bias are represented by the endpoints of each plot. The upper edge of the box represents the third quartile (75th percentile), and the lower edge of the box represents the first quartile (25th percentile). The median (50th percentile) is represented by the line within the box, and the mean is represented by the diamond within the box.</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g004.tif"/>
</fig>
<p>Similarly, the standard errors of slope estimates in the regression equation were most biased for the EBD method (AB&#x202F;=&#x202F;0.08), and on average, equal to zero for RSD and SEM. This means that the estimates of the relationship between discrepancy and the outcome were less consistent for the EBD method, and quite consistent for RSD and SEM. In the ANOVA, differences among methods accounted for an <italic>&#x03B7;</italic><sup>2</sup> of 0.05.</p>
<p>The ANOVA predicting AB of standard error estimates for discrepancy slope showed one interaction with effect size of at least 0.06: the interaction between method and N-size (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.06). Post-hoc ANOVAs were conducted separately for each method to aid in interpretation of the six-way ANOVAs. <xref ref-type="fig" rid="fig5">Figure 5</xref> includes three plots showing substantial effects of cluster number (N) on standard error of slope estimates for the EBD method. The first plot in <xref ref-type="fig" rid="fig5">Figure 5</xref>, for discrepancy slope standard error bias, shows that standard error bias is stable across cluster number for RSD and SEM methods, but increases as cluster number increases for EBD (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.09). Furthermore, cluster number interacted with ICC for the EBD method (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.06). The interaction effect, plotted in <xref ref-type="fig" rid="fig6">Figure 6</xref>, shows that the effect of cluster number (N) on AB of discrepancy slope standard errors increases as ICC increases.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Standard error bias by N and method for discrepancy slope, direction slope, and interaction slope.</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g005.tif"/>
</fig>
<fig position="float" id="fig6">
<label>Figure 6</label>
<caption>
<p>Absolute bias (AB) of discrepancy slope and interaction slope standard error by cluster number (N) and ICC, for EBD method only (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.06 for each plot).</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g006.tif"/>
</fig>
<p>The coverage rate (i.e., the percentage of models in which the true score discrepancy slope was found in the confidence interval for the discrepancy slope estimates) was larger for the RSD (91%) and SEM (89%) methods, while EBD was 24%. This indicates that the RSD and SEM methods more accurately predicted the strength of the relationship between the discrepancy and the outcome than EBD.</p>
<p>The power (aka proportion of statistically significant estimates) for the discrepancy slope estimate was computed for the three estimation methods. The power for the RSD and SEM was 0.96, and for EBD, 0.95.</p>
</sec>
<sec id="sec35">
<label>3.3.2</label>
<title>Direction slope estimate and standard error bias</title>
<p>The bias of direction slope estimates was the same for all three methods (AB&#x202F;=&#x202F;&#x2212;0.29). That means the direction of the discrepancy for distinguishable dyads&#x2019; relationship with the outcome was estimated with similar levels of bias for all three methods. However, the EBD method suffers from outliers, shown in the boxplots in <xref ref-type="fig" rid="fig7">Figure 7</xref>.</p>
<fig position="float" id="fig7">
<label>Figure 7</label>
<caption>
<p>Absolute bias (AB) of direction slope estimate by method (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.42) and AB of standard error (SE) of direction slope estimate by method (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.05).</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g007.tif"/>
</fig>
<p>The average bias of standard errors was also comparable among all three methods, with RSD being the least biased (AB&#x202F;=&#x202F;0.00), followed by SEM (AB&#x202F;=&#x202F;&#x2212;0.03) and EBD (AB&#x202F;=&#x202F;&#x2212;0.03). The boxplots of these distributions are shown in <xref ref-type="fig" rid="fig5">Figure 5</xref> to illustrate EBD&#x2019;s outliers. Neither the slope estimate nor its standard error were substantially (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;&#x003E;&#x202F;= 0.06) impacted by method and design factors in the original ANOVAs (see <xref ref-type="table" rid="tab4">Table 4</xref>). However, the post-hoc ANOVAs revealed that standard error bias from the SEM and EBD methods was substantially impacted by cluster number, as shown in the upper-right plot in <xref ref-type="fig" rid="fig5">Figure 5</xref>. Standard error bias decreased as cluster number increased for EBD (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.05) and SEM (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.06).</p>
<p>The coverage rate of the direction slope estimate was 100% for SEM and lower for RSD (77%) and EBD (75%). The power for direction slope estimate was quite low among all methods, ranging from 0.14 for RSD to 0.16 for EBD and SEM. Lower power was expected because the outcome variable was generated based on a true slope of 0.5. It makes sense that power is lower for direction slope than discrepancy slope, which was generated based on a true slope of 0.8. A stronger relationship between outcome and predictor results in a greater percentage of statistically significant results.</p>
</sec>
<sec id="sec36">
<label>3.3.3</label>
<title>Discrepancy by direction interaction slope estimate and standard error bias</title>
<p>The AB of the discrepancy by slope interaction effect was the greatest for RSD and SEM, both with AB&#x202F;=&#x202F;&#x2212;0.13. EBD had bias of &#x2212;0.08. Outliers remained prevalent for the EBD method. The distributions are shown in <xref ref-type="fig" rid="fig8">Figure 8</xref>.</p>
<fig position="float" id="fig8">
<label>Figure 8</label>
<caption>
<p>Absolute bias (AB) of interaction slope estimate by method (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.42) and AB of standard error (SE) of interaction slope estimate by method (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.05).</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g008.tif"/>
</fig>
<p>The mean AB of standard errors was 0 for RSD and SEM, and &#x2212;0.07 for EBD. The EBD method produced extreme standard error outliers, with standard error bias ranging from &#x2212;3.46 to 81.63. Neither the slope estimate nor its standard error were substantially (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;&#x003E;&#x202F;= 0.06) impacted by method and design factors in the ANOVAs (see <xref ref-type="table" rid="tab4">Table 4</xref>). According to the post-hoc ANOVAs, however, the RSD and SEM methods were not substantially impacted by design factors, but the EBD method was. As shown in the bottom plot of <xref ref-type="fig" rid="fig5">Figure 5</xref>, bias decreased sharply as cluster number (N) increased. Furthermore, cluster number interacted with ICC for the EBD method. <xref ref-type="fig" rid="fig6">Figure 6</xref> shows that the effect of cluster number on standard error bias increases as ICC increases.</p>
<p>The mean AB of standard errors was 0 for RSD and SEM, and &#x2212;0.07 for EBD. The EBD method produced extreme standard error outliers, with standard error bias ranging from &#x2212;3.46 to 81.63. Neither the slope estimate nor its standard error were substantially (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;&#x003E;&#x202F;= 0.06) impacted by method and design factors in the ANOVAs (see <xref ref-type="table" rid="tab4">Table 4</xref>). According to the post-hoc ANOVAs, however, the RSD and SEM methods were not substantially impacted by design factors, but the EBD method was. As shown in the bottom plot of <xref ref-type="fig" rid="fig5">Figure 5</xref>, bias decreased sharply as cluster number (N) increased. Furthermore, cluster number interacted with ICC for the EBD method. <xref ref-type="fig" rid="fig5">Figure 5</xref> shows that the effect of cluster number on standard error bias increases as ICC increases.</p>
<p>The coverage rate of discrepancy&#x002A;direction interaction slope estimate was highest for EBD (58%). It was substantially lower for SEM (19%) and RSD (18%). Finally, the power of the discrepancy&#x002A;direction interaction estimates was low and comparable among the three methods. Power was highest for SEM (0.10), followed by RSD (0.09) and EBD (0.09).</p>
</sec>
<sec id="sec37">
<label>3.3.4</label>
<title><italic>R<sup>2</sup></italic> bias</title>
<p>RSD and SEM <italic>R<sup>2</sup></italic> bias values were &#x2212;0.04, and EBD was &#x2212;0.05. Estimation method explained a large proportion of the variance in <italic>R</italic><sup>2</sup> bias (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.69). EBD accounted for the differences among methods as shown in <xref ref-type="fig" rid="fig9">Figure 9</xref>. The post-hoc ANOVAs explained that <italic>R<sup>2</sup></italic> bias from each method (RSD, EBD, and SEM) was substantially impacted by effect size variance. Bias by method and effect size variance is plotted in <xref ref-type="fig" rid="fig10">Figure 10</xref>. The plot shows that <italic>R<sup>2</sup></italic> bias increases as effect size variance increases. The power of <italic>R</italic><sup>2</sup> was high, at 0.98 for EBD, and 0.99 for RSD and SEM. The high power of <italic>R</italic><sup>2</sup> values across all three methods indicated that each method produced a statistically significant <italic>R</italic><sup>2</sup>, effectively identifying the existence of a relationship between the outcome and predictors.</p>
<fig position="float" id="fig9">
<label>Figure 9</label>
<caption>
<p>Absolute bias (AB) of <italic>R</italic><sup>2</sup> by method (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.69).</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g009.tif"/>
</fig>
<fig position="float" id="fig10">
<label>Figure 10</label>
<caption>
<p>Absolute bias (AB) of <italic>R</italic><sup>2</sup> by method and effect size variance.</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g010.tif"/>
</fig>
</sec>
</sec>
</sec>
<sec sec-type="discussion" id="sec38">
<label>4</label>
<title>Discussion</title>
<p>These findings suggest that dyadic discrepancy from MLM (i.e., EBD) suffers from poor reliability, especially where ICC was high, effect size variance was high, and cluster number was low, which hinders its accuracy as a predictor. The implications of this finding are that RSD or SEM may be preferred because they are not impacted as greatly by ICC, effect size variance, and cluster number. These findings are discussed more fully below, followed by a discussion of limitations and recommendations for future research.</p>
<sec id="sec39">
<label>4.1</label>
<title>Why did the EBD shrinkage effect result in outliers?</title>
<p>The data were explored further to better understand why EBD produced outliers in prediction. First &#x201C;outlier&#x201D; conditions were defined as those with AB discrepancy slope for EBD fell beyond the range of AB discrepancy slope for RSD and SEM, which was about &#x2212;1.4 to &#x2212;0.8. A total of 8,111 (or 3.8%) of AB of EBD estimates met this condition. Outliers were most prevalent where ICC equaled 0.5 and cluster number equaled 50, as shown in <xref ref-type="fig" rid="fig11">Figure 11</xref>.</p>
<fig position="float" id="fig11">
<label>Figure 11</label>
<caption>
<p>Percentage of outliers by ICC and cluster number.</p>
</caption>
<graphic xlink:href="fpsyg-16-1499076-g011.tif"/>
</fig>
<p>Examining the outlier data showed that variance of EBD within outlier samples was lower than the non-outlier samples. This led to a deeper analysis of the variance components in EBD estimation. According to <xref ref-type="disp-formula" rid="EQ10">Equation 7</xref>, EBD is a weighted combination of the OLS slope and the grand mean of slopes across all dyads (&#x03B3;<sub>10</sub>). It is weighted by the reliability of the OLS estimate. The more concentrated &#x03B2;<sub>1j</sub> values are around &#x03B3;<sub>10</sub>, the more &#x03B3;<sub>10</sub> is weighted in EBD. The more the central tendency is weighted in EBD, the less variable EBD will be. In extreme outlying cases, the variance of EBD was near zero, indicating over shrinkage, which was cautioned against by <xref ref-type="bibr" rid="ref34">Raudenbush (2008)</xref>, particularly when cluster sizes are small. As a result, EBD became ineffective as a predictor in the regression models.</p>
</sec>
<sec id="sec40">
<label>4.2</label>
<title>Which method should researchers use to estimate dyadic discrepancy?</title>
<p>One purpose of this study was to determine the most accurate method for estimating dyadic discrepancy. On average, AB was zero for all three methods evaluated (RSD, EBD, and SEM). Using method and design factors to predict bias in an ANOVA resulted in <italic>&#x03B7;</italic><sup>2</sup> less than 0.0001. Considering average bias alone, one might conclude that all three methods are equally accurate.</p>
<p>However, though the methods do not differ in average bias, they do differ in reliability of bias. The EBD method produced estimates with the poorest reliability. On average, reliability was 2.29; being greater than one indicates that variance of EBD estimates was less than variance of true discrepancy scores. This proved to be problematic for bias of estimates and their standard errors in prediction, as discussed below.</p>
<p>Another purpose of the study was to determine which method&#x2019;s discrepancy estimates most accurately predict an outcome. Prediction was evaluated using slope estimate bias, standard error of slope estimate bias, power, coverage rate, and effect size (<italic>R</italic><sup>2</sup>). The discrepancy estimates from the EBD method produced extreme outliers in the prediction models. This resulted in EBD being the poorest performer by far in slope estimate bias and standard error bias for all three slopes (discrepancy, direction, and discrepancy&#x002A;direction interaction). ANOVA effect size, <italic>&#x03B7;</italic><sup>2</sup>, for method was not large except for when predicting discrepancy slope bias (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.42). Small effects were seen using method to predict bias of slope standard error (slope discrepancy S.E. <italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.05, direction&#x202F;=&#x202F;0.04, and discrepancy&#x002A;direction interaction&#x202F;=&#x202F;0.02), as well as slope (interaction) bias (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.01).</p>
<p>The issues with EBD stem from the &#x201C;over-shrinkage&#x201D; described in the literature review above (<xref ref-type="bibr" rid="ref34">Raudenbush, 2008</xref>; <xref ref-type="bibr" rid="ref35">Raudenbush and Bryk, 2002</xref>; <xref ref-type="bibr" rid="ref40">Stage, 2001</xref>). In the current study, the over-shrinkage primarily impacted samples with small cluster numbers and, more so, high conditional ICC. Cluster number interacts with method (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.06), and the interaction plots (<xref ref-type="fig" rid="fig5">Figure 5</xref>) show that bias was greatest for EBD where cluster size was 50.</p>
<p>An examination of EBD outliers revealed that over 85% of the outlying samples had the high conditional ICC value of 0.5. The variance of EBD in these samples was very low. Because the EBD method partials out the variance from the grand slope (see <xref ref-type="disp-formula" rid="EQ3 EQ4 EQ5 EQ6 EQ7 EQ8">Equations 3a&#x2013;5</xref>), if dyads have a high level of dependence, more of the variance overall is partialed out from the dyad-level discrepancy. This results in EBD estimates with low variance, because the variance accounted for by the grand slope has been removed already. The shrunken variances of EBD relative to the true score discrepancy caused the extreme outliers in bias of parameters and their standard errors in the prediction equations.</p>
<p>Overall, none of the three methods were clearly more accurate than the other, and bias was not substantially impacted by method or design factor. However, the poor reliability of EBD and the resulting impact on accuracy of predicting an outcome suggests RSD and SEM are better estimates of dyadic discrepancy. RSD may be preferred since it is easier to compute. However, SEM has the advantages of model flexibility, such as predicting the outcome directly in the same model or including other relationships and variables in the model.</p>
</sec>
<sec id="sec41">
<label>4.3</label>
<title>Was raw-score difference impacted by reliability?</title>
<p>According to the reliability formula in <xref ref-type="disp-formula" rid="EQ1">Equation 1</xref> from <xref ref-type="bibr" rid="ref45">Williams and Zimmerman (1977)</xref>, RSD reliability would be higher when the reliability of scores from individual dyad members was higher and when ICC was smaller. According to <xref ref-type="table" rid="tab5">Table 5</xref> and <xref ref-type="fig" rid="fig3">Figure 3</xref>, the ANOVA predicting RSD reliability with design factors confirmed that reliability for RSD was higher when ICC was lower (<italic>&#x03B7;</italic><sup>2</sup>&#x202F;=&#x202F;0.06). Reliability of scores for dyad members <italic>A</italic> and <italic>B</italic> was expected to have an impact on reliability of discrepancy estimates. However, in the ANOVA predicting reliability of estimates, <italic>&#x03B7;</italic><sup>2</sup> was 0 for reliability, indicating that RSD reliability did not depend on the reliability of individual dyad member scores. The reliability values simulated in this study were set high at 0.7, 0.8, and mixed 0.7 and 0.8, per values commonly found in applied research. Future research should include lower levels of reliability as a design factor to test the limits of how low reliability of scores from dyad member <italic>A</italic> and <italic>B</italic> can go without impacting the reliability of discrepancy.</p>
</sec>
<sec id="sec42">
<label>4.4</label>
<title>Limitations and recommendations for future research</title>
<p>As explained in the methods and results, reliability is typically thought of as ranging from zero to one, but the EBD shrinkage effect often resulted in reliability values greater than one. We did not identify an alternate method of computing reliability for EBD other than the traditional true score variance divided by observed score variance. Future research should consider whether there is a better way to compute or interpret the reliability of EBD.</p>
<p>Furthermore, one of the benefits of the EBD shrinkage effect is the ability to include dyads with missing or unreliable data, which then &#x201C;borrow&#x201D; strength from the rest of the sample (<xref ref-type="bibr" rid="ref22">Kim et al., 2013</xref>). However, missing data was not considered in this simulation. Varying degrees of missingness could be simulated in future research to generate understanding of whether and how each method overcomes the limitations of missing data.</p>
<p>The findings suggest that even though RSD and SEM had poor reliability, these estimates still do a good job predicting an outcome as evidenced by high levels of power. This suggests that RSD is suitable for many practical, real-life applications of dyadic discrepancy research, despite historical concerns that it is unreliable. Statistically, the reliability of the discrepancy score is impacted by the reliability of each dyad member&#x2019;s scores, but the conditions prevalent in dyadic data literature may overcome these concerns by having high reliabilities of dyad member&#x2019;s scores and low to moderate dependence. However, future research should further push the upper and lower limits of the design factors in the current study, specifically reliability of dyad member&#x2019;s scores and cluster number, in an effort to determine under what conditions the RSD would become unacceptable.</p>
<p>A simple regression model was used to evaluate accuracy of prediction, but in reality, more complicated models are needed to adequately address dyadic discrepancy research questions. While RSD is the most straightforward computational approach, the ability to generate an accurate dyadic discrepancy in SEM is promising for researchers seeking to use the discrepancy in more complicated models, such as the second-order factor model from <xref ref-type="bibr" rid="ref33">Newsom (2002)</xref>. The discrepancy can be generated in the same model as the prediction model, and the measurement model could be included. Though it is possible to output the idiographic discrepancy using SEM, in practice, RSD is easier to compute for purposes of idiographic research. But SEM offers the flexibility of using discrepancy in a nomothetic model while maintaining the ability to output it ideographically as well. Future research should ensure the good performance of the SEM discrepancy in this study is maintained in more complicated models, including those with the measurement model included. It would also be useful to understand the impacts of measurement invariance on dyadic discrepancy and its use in prediction (<xref ref-type="bibr" rid="ref36">Russell et al., 2016</xref>).</p>
<p>EBD and SEM discrepancy estimates were generated using full-information maximum likelihood (FIML) estimation method. Restricted maximum likelihood (REML) is an alternative estimation method that may result in less biased estimates, particularly when cluster number is small (<xref ref-type="bibr" rid="ref35">Raudenbush and Bryk, 2002</xref>). Future research should investigate in more detail whether the estimation method matters in the current context.</p>
<p>Finally, the findings here cannot be generalized to conditions not included in the simulation. Furthermore, future research should apply the techniques to real data, as opposed to simulated data, to see if the estimates compare to those found in this study.</p>
</sec>
<sec id="sec43">
<label>4.5</label>
<title>Practical implications</title>
<p>Researchers seeking to make an informed decision about which method to use to study dyadic discrepancy would hope for a clear answer about which method is best. Notwithstanding the limitations and directions for future research in the preceding section, the findings suggest that RSD or SEM perform quite similarly, and better than EBD on average. Though the estimates themselves did not have great reliability for any method, the RSD and SEM methods produced estimates with high coverage rates and power when predicting an outcome with the discrepancy. This suggests that for the purpose of predicting an outcome, either of these methods would be suitable, and neither were greatly impacted by the design factors, indicating that they work well in the full range of research conditions simulated. Researchers studying more complicated models may opt for the SEM discrepancy estimate, while researchers interested in simpler models predicting an outcome with a discrepancy score should find that the easy-to-compute RSD works as well as SEM to predict an outcome. Further research, described in the preceding section, is necessary before concluding whether EBD provides a more accurate and useful estimate than RSD or SEM in other conditions, such as with missing data.</p>
</sec>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec44">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec sec-type="author-contributions" id="sec45">
<title>Author contributions</title>
<p>AM: Conceptualization, Investigation, Methodology, Project administration, Resources, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing, Data curation, Formal analysis, Visualization. QC: Conceptualization, Funding acquisition, Investigation, Methodology, Resources, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing, Project administration. RH: Supervision, Writing &#x2013; review &#x0026; editing. RG: Writing &#x2013; review &#x0026; editing. WL: Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="funding-information" id="sec46">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This study was partially supported by the 2012 Junior Faculty Summer Research Fellowship, University of North Texas, Denton.</p>
</sec>
<ack>
<p>We would like to acknowledge Dr. Su Yeong Kim from the University of Texas at Austin for her insights on an earlier version of the manuscript related to the scope of the study.</p>
</ack>
<sec sec-type="COI-statement" id="sec47">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="sec48">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec49">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fpsyg.2025.1499076/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fpsyg.2025.1499076/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Supplementary_file_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Arend</surname> <given-names>M. G.</given-names></name> <name><surname>Sch&#x00E4;fer</surname> <given-names>T.</given-names></name></person-group> (<year>2019</year>). <article-title>Statistical power in two-level models: a tutorial based on Monte Carlo simulation</article-title>. <source>Psychol. Methods</source> <volume>24</volume>, <fpage>1</fpage>&#x2013;<lpage>19</lpage>. doi: <pub-id pub-id-type="doi">10.1037/met0000195</pub-id>, PMID: <pub-id pub-id-type="pmid">30265048</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barooj-Kiakalaee</surname> <given-names>O.</given-names></name> <name><surname>Hosseini</surname> <given-names>S.</given-names></name> <name><surname>Mohammadpour-Tahmtan</surname> <given-names>R.</given-names></name> <name><surname>Hosseini-Tabaghdehi</surname> <given-names>M.</given-names></name> <name><surname>Jahanfar</surname> <given-names>S.</given-names></name> <name><surname>Esmaeili-Douki</surname> <given-names>Z.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Paternal postpartum depression&#x2019;s relationship to maternal pre and postpartum depression, and father-mother dyads marital satisfaction: a structural equation model analysis of a longitudinal study</article-title>. <source>J. Affect. Disord.</source> <volume>297</volume>, <fpage>375</fpage>&#x2013;<lpage>380</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jad.2021.10.110</pub-id>, PMID: <pub-id pub-id-type="pmid">34715195</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bar-Sella</surname> <given-names>A.</given-names></name> <name><surname>Nof</surname> <given-names>A.</given-names></name> <name><surname>Baucom</surname> <given-names>B. R.</given-names></name> <name><surname>Goldstein</surname> <given-names>P.</given-names></name> <name><surname>Romanov</surname> <given-names>S.</given-names></name> <name><surname>Shpakouskaya</surname> <given-names>I.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>The prognostic role of emotion regulation dynamics in the treatment of major depressive disorder</article-title>. <source>J. Couns. Clin. Psychol.</source> <volume>91</volume>, <fpage>744</fpage>&#x2013;<lpage>749</lpage>. doi: <pub-id pub-id-type="doi">10.1037/ccp0000835</pub-id>, PMID: <pub-id pub-id-type="pmid">37616125</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baumann</surname> <given-names>A. A.</given-names></name> <name><surname>Kuhlberg</surname> <given-names>J. A.</given-names></name> <name><surname>Zayas</surname> <given-names>L. H.</given-names></name></person-group> (<year>2010</year>). <article-title>Familism, mother-daughter mutuality, and suicide attempts of adolescent Latinas</article-title>. <source>J. Fam. Psychol.</source> <volume>24</volume>, <fpage>616</fpage>&#x2013;<lpage>624</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0020584</pub-id>, PMID: <pub-id pub-id-type="pmid">20954772</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Blood</surname> <given-names>E. A.</given-names></name> <name><surname>Kalish</surname> <given-names>L. A.</given-names></name> <name><surname>Shrier</surname> <given-names>L. A.</given-names></name></person-group> (<year>2013</year>). <article-title>Estimating heterogeneous intra-class correlation coefficients in dyadic ecological momentary assessment</article-title>. <source>J. Mod. Appl. Stat. Methods</source> <volume>12</volume>, <fpage>207</fpage>&#x2013;<lpage>219</lpage>. doi: <pub-id pub-id-type="doi">10.22237/jmasm/1367382120</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Campione-Barr</surname> <given-names>N.</given-names></name> <name><surname>Lindell</surname> <given-names>A. K.</given-names></name> <name><surname>Giron</surname> <given-names>S. E.</given-names></name></person-group> (<year>2020</year>). <article-title>More data, more problems: analytical complications of studying differential family experiences over time: reply to Laird</article-title>. <source>Dev. Psychol.</source> <volume>56</volume>, <fpage>978</fpage>&#x2013;<lpage>981</lpage>. doi: <pub-id pub-id-type="doi">10.1037/dev0000912</pub-id>, PMID: <pub-id pub-id-type="pmid">32271077</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cano</surname> <given-names>A.</given-names></name> <name><surname>Johansen</surname> <given-names>A. B.</given-names></name> <name><surname>Franz</surname> <given-names>A.</given-names></name></person-group> (<year>2005</year>). <article-title>Multilevel analysis of couple congruence on pain, interference, and disability</article-title>. <source>Pain</source> <volume>118</volume>, <fpage>369</fpage>&#x2013;<lpage>379</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.pain.2005.09.003</pub-id>, PMID: <pub-id pub-id-type="pmid">16289795</pub-id></citation></ref>
<ref id="ref001"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carr</surname> <given-names>D.</given-names></name> <name><surname>Boerner</surname> <given-names>K.</given-names></name></person-group> (<year>2009</year>). <article-title>Do spousal discrepancies in marital quality assessments affect psychological adjustment to widowhood?</article-title> <source>J. Marr. Fam.</source> <volume>71</volume>, <fpage>495</fpage>&#x2013;<lpage>509</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1741-3737.2009.00615.x</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>Q.</given-names></name> <name><surname>Kwok</surname> <given-names>O.</given-names></name> <name><surname>Luo</surname> <given-names>W.</given-names></name> <name><surname>Willson</surname> <given-names>V. L.</given-names></name></person-group> (<year>2010</year>). <article-title>The impact of ignoring a level of nesting structure in multilevel growth mixture models: a Monte Carlo study</article-title>. <source>Struct. Equ. Model.</source> <volume>17</volume>, <fpage>570</fpage>&#x2013;<lpage>589</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10705511.2010.510046</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chiou</surname> <given-names>J.</given-names></name> <name><surname>Spreng</surname> <given-names>R. A.</given-names></name></person-group> (<year>1996</year>). <article-title>The reliability of difference scores: a re-examination</article-title>. <source>J. Consum. Satisf. Dissatisfaction Complain. Behav.</source> <volume>9</volume>, <fpage>158</fpage>&#x2013;<lpage>167</lpage>.</citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Clarke</surname> <given-names>P.</given-names></name> <name><surname>Wheaton</surname> <given-names>B.</given-names></name></person-group> (<year>2007</year>). <article-title>Addressing data sparseness in contextual population research: using cluster analysis to create synthetic neighborhoods</article-title>. <source>Sociol. Methods Res.</source> <volume>35</volume>, <fpage>311</fpage>&#x2013;<lpage>351</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0049124106292362</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Cohen</surname> <given-names>J.</given-names></name></person-group> (<year>1988</year>). <source>Statistical power analysis for the behavioral sciences</source>. <edition>2nd</edition> Edn. <publisher-loc>Mahwah, NJ</publisher-loc>: <publisher-name>Erlbaum.</publisher-name></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Costigan</surname> <given-names>C. L.</given-names></name> <name><surname>Dokis</surname> <given-names>D. P.</given-names></name></person-group> (<year>2006</year>). <article-title>Similarities and differences in acculturation among mothers, fathers, and children in immigrant Chinese families</article-title>. <source>J. Cross-Cult. Psychol.</source> <volume>37</volume>, <fpage>723</fpage>&#x2013;<lpage>741</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0022022106292080</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cronbach</surname> <given-names>L. J.</given-names></name> <name><surname>Furby</surname> <given-names>L.</given-names></name></person-group> (<year>1970</year>). <article-title>How we should measure "change": or should we?</article-title> <source>Psychol. Bull.</source> <volume>74</volume>, <fpage>68</fpage>&#x2013;<lpage>80</lpage>. doi: <pub-id pub-id-type="doi">10.1037/h0029382</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Crouter</surname> <given-names>A. C.</given-names></name> <name><surname>Davis</surname> <given-names>K. D.</given-names></name> <name><surname>Updegraff</surname> <given-names>K.</given-names></name> <name><surname>Delgado</surname> <given-names>M.</given-names></name> <name><surname>Fortner</surname> <given-names>M.</given-names></name></person-group> (<year>2006</year>). <article-title>Mexican American fathers' occupational conditions: links to family members' psychological adjustment</article-title>. <source>J. Marriage Fam.</source> <volume>68</volume>, <fpage>843</fpage>&#x2013;<lpage>858</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1741-3737.2006.00299.x</pub-id>, PMID: <pub-id pub-id-type="pmid">18414596</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>De Los Reyes</surname> <given-names>A.</given-names></name> <name><surname>Kazdin</surname> <given-names>A. E.</given-names></name></person-group> (<year>2004</year>). <article-title>Measuring informant discrepancies in clinical child research</article-title>. <source>Psychol. Assess.</source> <volume>16</volume>, <fpage>330</fpage>&#x2013;<lpage>334</lpage>. doi: <pub-id pub-id-type="doi">10.1037/1040-3590.16.3.330</pub-id>, PMID: <pub-id pub-id-type="pmid">15456389</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>DeVellis</surname> <given-names>R. F.</given-names></name></person-group> (<year>2006</year>). <article-title>Classical test theory</article-title>. <source>Med. Care</source> <volume>44</volume>, <fpage>S50</fpage>&#x2013;<lpage>S59</lpage>. doi: <pub-id pub-id-type="doi">10.1097/01.mlr.0000245426.10853.30</pub-id>, PMID: <pub-id pub-id-type="pmid">17060836</pub-id></citation></ref>
<ref id="ref002"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gonzalez</surname> <given-names>R.</given-names></name> <name><surname>Griffin</surname> <given-names>D.</given-names></name></person-group> (<year>1997</year>). &#x201C;<article-title>On the statistics of interdependence: Treating dyadic data with respect</article-title>,&#x201D; in <source>Handbook of personal relationships: Theory, research and interventions (2nd ed.)</source>. ed. <person-group person-group-type="editor"><name><surname>Duck</surname> <given-names>S.</given-names></name></person-group> (<publisher-name>John Wiley &#x0026; Sons, Inc.</publisher-name>), p. <fpage>271</fpage>&#x2013;<lpage>302</lpage>.</citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guion</surname> <given-names>K.</given-names></name> <name><surname>Mrug</surname> <given-names>S.</given-names></name> <name><surname>Windle</surname> <given-names>M.</given-names></name></person-group> (<year>2009</year>). <article-title>Predictive value of informant discrepancies in reports of parenting: relations to early adolescents' adjustment</article-title>. <source>J. Abnorm. Child Psychol.</source> <volume>37</volume>, <fpage>17</fpage>&#x2013;<lpage>30</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10802-008-9253-5</pub-id>, PMID: <pub-id pub-id-type="pmid">18584134</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gulliford</surname> <given-names>M. C.</given-names></name> <name><surname>Ukoumunne</surname> <given-names>O. C.</given-names></name> <name><surname>Chinn</surname> <given-names>S.</given-names></name></person-group> (<year>1999</year>). <article-title>Components of variance and intraclass correlations for the design of community-based surveys and intervention studies: data from the health survey for England 1994</article-title>. <source>Am. J. Epidemiol.</source> <volume>149</volume>, <fpage>876</fpage>&#x2013;<lpage>883</lpage>. doi: <pub-id pub-id-type="doi">10.1093/oxfordjournals.aje.a009904</pub-id>, PMID: <pub-id pub-id-type="pmid">10221325</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Kenny</surname> <given-names>D. A.</given-names></name> <name><surname>Kashy</surname> <given-names>D. A.</given-names></name> <name><surname>Cook</surname> <given-names>W. L.</given-names></name></person-group> (<year>2006a</year>). &#x201C;<article-title>Dyadic indexes</article-title>&#x201D; in <source>Dyadic data analysis</source>. eds. <person-group person-group-type="editor"><name><surname>Kenny</surname> <given-names>D.</given-names></name> <name><surname>Kashy</surname> <given-names>D.</given-names></name> <name><surname>Cook</surname> <given-names>W.</given-names></name></person-group> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Guilford Press</publisher-name>), <fpage>317</fpage>&#x2013;<lpage>341</lpage>.</citation></ref>
<ref id="ref20"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Kenny</surname> <given-names>D. A.</given-names></name> <name><surname>Kashy</surname> <given-names>D. A.</given-names></name> <name><surname>Cook</surname> <given-names>W. L.</given-names></name></person-group> (<year>2006b</year>). &#x201C;<article-title>The measurement of nonindependence</article-title>&#x201D; in <source>Dyadic data analysis</source>. eds. <person-group person-group-type="editor"><name><surname>Kenny</surname> <given-names>D.</given-names></name> <name><surname>Kashy</surname> <given-names>D.</given-names></name> <name><surname>Cook</surname> <given-names>W.</given-names></name></person-group> (<publisher-loc>New York</publisher-loc>: <publisher-name>Guilford Press</publisher-name>), <fpage>25</fpage>&#x2013;<lpage>52</lpage>.</citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>S. Y.</given-names></name> <name><surname>Chen</surname> <given-names>Q.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Huang</surname> <given-names>X.</given-names></name> <name><surname>Moon</surname> <given-names>U. J.</given-names></name></person-group> (<year>2009</year>). <article-title>Parent&#x2013;child acculturation, parenting, and adolescent depressive symptoms in Chinese immigrant families</article-title>. <source>J. Fam. Psychol.</source> <volume>23</volume>, <fpage>426</fpage>&#x2013;<lpage>437</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0016019</pub-id>, PMID: <pub-id pub-id-type="pmid">19586205</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>S. Y.</given-names></name> <name><surname>Chen</surname> <given-names>Q.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Shen</surname> <given-names>Y.</given-names></name> <name><surname>Orozco-Lapray</surname> <given-names>D.</given-names></name></person-group> (<year>2013</year>). <article-title>Longitudinal linkages among parent&#x2013;child acculturation discrepancy, parenting, parent&#x2013;child sense of alienation, and adolescent adjustment in Chinese immigrant families</article-title>. <source>Dev. Psychol.</source> <volume>49</volume>, <fpage>900</fpage>&#x2013;<lpage>912</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0029169</pub-id>, PMID: <pub-id pub-id-type="pmid">22799587</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krull</surname> <given-names>J. L.</given-names></name> <name><surname>MacKinnon</surname> <given-names>D. P.</given-names></name></person-group> (<year>2001</year>). <article-title>Multilevel modeling of individual and group level mediated effects</article-title>. <source>Multivar. Behav. Res.</source> <volume>36</volume>, <fpage>249</fpage>&#x2013;<lpage>277</lpage>. doi: <pub-id pub-id-type="doi">10.1207/S15327906MBR3602_06</pub-id>, PMID: <pub-id pub-id-type="pmid">26822111</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Laird</surname> <given-names>R. D.</given-names></name></person-group> (<year>2020</year>). <article-title>Analytical challenges of testing hypotheses of agreement and discrepancy: comment on Campione-Barr, Lindell, and Giron (2020)</article-title>. <source>Dev. Psychol.</source> <volume>56</volume>, <fpage>970</fpage>&#x2013;<lpage>977</lpage>. doi: <pub-id pub-id-type="doi">10.1037/dev0000763</pub-id>, PMID: <pub-id pub-id-type="pmid">32271076</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lau</surname> <given-names>A. S.</given-names></name> <name><surname>McCabe</surname> <given-names>K. M.</given-names></name> <name><surname>Yeh</surname> <given-names>M.</given-names></name> <name><surname>Garland</surname> <given-names>A. F.</given-names></name> <name><surname>Wood</surname> <given-names>P. A.</given-names></name> <name><surname>Hough</surname> <given-names>R. L.</given-names></name></person-group> (<year>2005</year>). <article-title>The acculturation gap-distress hypothesis among high-risk Mexican American families</article-title>. <source>J. Fam. Psychol.</source> <volume>19</volume>, <fpage>367</fpage>&#x2013;<lpage>375</lpage>. doi: <pub-id pub-id-type="doi">10.1037/0893-3200.19.3.367</pub-id>, PMID: <pub-id pub-id-type="pmid">16221017</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leidy</surname> <given-names>M. S.</given-names></name> <name><surname>Parke</surname> <given-names>R. D.</given-names></name> <name><surname>Cladis</surname> <given-names>M.</given-names></name> <name><surname>Coltrane</surname> <given-names>S.</given-names></name> <name><surname>Duffy</surname> <given-names>S.</given-names></name></person-group> (<year>2009</year>). <article-title>Positive marital quality, acculturative stress, and child outcomes among Mexican Americans</article-title>. <source>J. Marriage Fam.</source> <volume>71</volume>, <fpage>833</fpage>&#x2013;<lpage>847</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1741-3737.2009.00638.x</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Lord</surname> <given-names>F. M.</given-names></name></person-group> (<year>1963</year>). &#x201C;<article-title>Elementary models for measuring change</article-title>&#x201D; in <source>Problems in measuring change</source>. ed. <person-group person-group-type="editor"><name><surname>Harris</surname> <given-names>C. W.</given-names></name></person-group> (<publisher-loc>Madison, WI</publisher-loc>: <publisher-name>University of Wisconsin Press</publisher-name>), <fpage>21</fpage>&#x2013;<lpage>38</lpage>.</citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname> <given-names>W.</given-names></name> <name><surname>Kwok</surname> <given-names>O.</given-names></name></person-group> (<year>2009</year>). <article-title>The impacts of ignoring a crossed factor in analyzing cross-classified data</article-title>. <source>Multivar. Behav. Res.</source> <volume>44</volume>, <fpage>182</fpage>&#x2013;<lpage>212</lpage>. doi: <pub-id pub-id-type="doi">10.1080/00273170902794214</pub-id>, PMID: <pub-id pub-id-type="pmid">26754266</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maas</surname> <given-names>C. J.</given-names></name> <name><surname>Hox</surname> <given-names>J. J.</given-names></name></person-group> (<year>2005</year>). <article-title>Sufficient sample sizes for multilevel modeling</article-title>. <source>Methodol. Eur. J. Res. Methods Behav. Soc. Sci.</source> <volume>1</volume>, <fpage>86</fpage>&#x2013;<lpage>92</lpage>. doi: <pub-id pub-id-type="doi">10.1027/1614-2241.1.3.86</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="other"><person-group person-group-type="author"><name><surname>McEnturff</surname> <given-names>A.</given-names></name> <name><surname>Chen</surname> <given-names>Q.</given-names></name> <name><surname>Turner</surname> <given-names>H.</given-names></name> <name><surname>Luo</surname> <given-names>W.</given-names></name></person-group> (<year>2013</year>) <italic>Evaluating MLM and SEM approaches of estimating acculturation discrepancy: a simulation study.</italic> Paper presented at the 121st annual meeting of the American Psychological Association, Honolulu, Hawaii.</citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McHale</surname> <given-names>S. M.</given-names></name> <name><surname>Updegraff</surname> <given-names>K. A.</given-names></name> <name><surname>Shanahan</surname> <given-names>L.</given-names></name> <name><surname>Crouter</surname> <given-names>A. C.</given-names></name> <name><surname>Killoren</surname> <given-names>S. E.</given-names></name></person-group> (<year>2005</year>). <article-title>Siblings&#x2019; differential treatment in Mexican American families</article-title>. <source>J. Marriage Fam.</source> <volume>67</volume>, <fpage>1259</fpage>&#x2013;<lpage>1274</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1741-3737.2005.00215.x</pub-id>, PMID: <pub-id pub-id-type="pmid">18414595</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moerbeek</surname> <given-names>M.</given-names></name></person-group> (<year>2004</year>). <article-title>The consequence of ignoring a level of nesting in multilevel analysis</article-title>. <source>Multivar. Behav. Res.</source> <volume>39</volume>, <fpage>129</fpage>&#x2013;<lpage>149</lpage>. doi: <pub-id pub-id-type="doi">10.1207/s15327906mbr3901_5</pub-id>, PMID: <pub-id pub-id-type="pmid">26759936</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Newsom</surname> <given-names>J. T.</given-names></name></person-group> (<year>2002</year>). <article-title>A multilevel structural equation model for dyadic data</article-title>. <source>Struct. Equ. Model.</source> <volume>9</volume>, <fpage>431</fpage>&#x2013;<lpage>447</lpage>. doi: <pub-id pub-id-type="doi">10.1207/S15328007SEM0903_7</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Raudenbush</surname> <given-names>S. W.</given-names></name></person-group> (<year>2008</year>). &#x201C;<article-title>Many small groups</article-title>,&#x201D; in <source>Handbook of multilevel analysis</source>. eds. <person-group person-group-type="editor"><name><surname>de Leeuw</surname> <given-names>J.</given-names></name> <name><surname>Meijer</surname> <given-names>E.</given-names></name></person-group> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>).</citation></ref>
<ref id="ref35"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Raudenbush</surname> <given-names>S. W.</given-names></name> <name><surname>Bryk</surname> <given-names>A. S.</given-names></name></person-group> (<year>2002</year>). <source>Hierarchical linear models: Applications and data analysis methods</source>. <edition>2nd</edition> Edn. <publisher-loc>Thousand Oaks, CA</publisher-loc>: <publisher-name>Sage Publications, Inc</publisher-name>.</citation></ref>
<ref id="ref36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Russell</surname> <given-names>J. D.</given-names></name> <name><surname>Graham</surname> <given-names>R. A.</given-names></name> <name><surname>Neill</surname> <given-names>E. L.</given-names></name> <name><surname>Weems</surname> <given-names>C. F.</given-names></name></person-group> (<year>2016</year>). <article-title>Agreement in youth-parent perceptions of parenting behaviors: a case for testing measurement invariance in reporter discrepancy research</article-title>. <source>J. Youth Adolesc.</source> <volume>45</volume>, <fpage>2094</fpage>&#x2013;<lpage>2107</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10964-016-0495-1</pub-id>, PMID: <pub-id pub-id-type="pmid">27289553</pub-id></citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sakaluk</surname> <given-names>J. K.</given-names></name> <name><surname>Joel</surname> <given-names>S.</given-names></name> <name><surname>Quinn-Nilas</surname> <given-names>C.</given-names></name> <name><surname>Camanto</surname> <given-names>O. J.</given-names></name> <name><surname>Pevie</surname> <given-names>N. W.</given-names></name> <name><surname>Tu</surname> <given-names>E.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>A renewal of dyadic structural equation modeling with latent variables: clarifications, methodological advantages, and new directions</article-title>. <source>Soc. Personal. Psychol. Compass</source> <volume>19</volume>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>. doi: <pub-id pub-id-type="doi">10.1111/spc3.70045</pub-id>, PMID: <pub-id pub-id-type="pmid">40415499</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Sayer</surname> <given-names>A. G.</given-names></name> <name><surname>Klute</surname> <given-names>M. M.</given-names></name></person-group> (<year>2005</year>). &#x201C;<article-title>Analyzing couples and families: multilevel methods</article-title>&#x201D; in <source>Sourcebook of family theory and research</source>. eds. <person-group person-group-type="editor"><name><surname>Bengston</surname> <given-names>V. L.</given-names></name> <name><surname>Acock</surname> <given-names>A. C.</given-names></name> <name><surname>Allen</surname> <given-names>K. R.</given-names></name> <name><surname>Dilworth-Anderson</surname> <given-names>P.</given-names></name> <name><surname>Klein</surname> <given-names>D. M.</given-names></name></person-group> (<publisher-loc>Thousand Oaks, CA</publisher-loc>: <publisher-name>Sage Publications, Inc</publisher-name>), <fpage>289</fpage>&#x2013;<lpage>313</lpage>.</citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schmid</surname> <given-names>B.</given-names></name> <name><surname>Allen</surname> <given-names>R. S.</given-names></name> <name><surname>Haley</surname> <given-names>P. P.</given-names></name> <name><surname>DeCoster</surname> <given-names>J.</given-names></name></person-group> (<year>2010</year>). <article-title>Family matters: dyadic agreement in end-of-life medical decision making</article-title>. <source>The Gerontologist</source> <volume>50</volume>, <fpage>226</fpage>&#x2013;<lpage>237</lpage>. doi: <pub-id pub-id-type="doi">10.1093/geront/gnp166</pub-id>, PMID: <pub-id pub-id-type="pmid">20038541</pub-id></citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stage</surname> <given-names>S. A.</given-names></name></person-group> (<year>2001</year>). <article-title>Program evaluation using hierarchical linear modeling with curriculum-based measurement reading probes</article-title>. <source>Sch. Psychol. Q.</source> <volume>16</volume>, <fpage>91</fpage>&#x2013;<lpage>112</lpage>. doi: <pub-id pub-id-type="doi">10.1521/scpq.16.1.91.19159</pub-id></citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stander</surname> <given-names>V. A.</given-names></name> <name><surname>Hsiung</surname> <given-names>P.</given-names></name> <name><surname>MacDermid</surname> <given-names>S.</given-names></name></person-group> (<year>2001</year>). <article-title>The relationship of attributions to marital distress: a comparison of mainland Chinese and U.S. couples</article-title>. <source>J. Fam. Psychol.</source> <volume>15</volume>, <fpage>124</fpage>&#x2013;<lpage>134</lpage>. doi: <pub-id pub-id-type="doi">10.1037/0893-3200.15.1.124</pub-id>, PMID: <pub-id pub-id-type="pmid">11322080</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Steele</surname> <given-names>J. S.</given-names></name> <name><surname>Ferrer</surname> <given-names>E.</given-names></name> <name><surname>Nesselroade</surname> <given-names>J. R.</given-names></name></person-group> (<year>2013</year>). <article-title>An idiographic approach to estimating models of dyadic interactions with differential equations</article-title>. <source>Psychometrika</source> <volume>79</volume>, <fpage>675</fpage>&#x2013;<lpage>700</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11336-013-9366-9</pub-id>, PMID: <pub-id pub-id-type="pmid">24352513</pub-id></citation></ref>
<ref id="ref43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Benner</surname> <given-names>A. D.</given-names></name></person-group> (<year>2013</year>). <article-title>Parent-child discrepancies in educational expectations: differential effects of actual versus perceived discrepancies</article-title>. <source>Child Dev.</source> <volume>85</volume>, <fpage>891</fpage>&#x2013;<lpage>900</lpage>. doi: <pub-id pub-id-type="doi">10.1111/cdev.12171</pub-id>, PMID: <pub-id pub-id-type="pmid">24116710</pub-id></citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wheeler</surname> <given-names>L. A.</given-names></name> <name><surname>Updegraff</surname> <given-names>K. A.</given-names></name> <name><surname>Thayer</surname> <given-names>S. M.</given-names></name></person-group> (<year>2010</year>). <article-title>Conflict resolution in Mexican-origin couples: culture, gender, and marital quality</article-title>. <source>J. Marriage Fam.</source> <volume>72</volume>, <fpage>991</fpage>&#x2013;<lpage>1005</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1741-3737.2010.00744.x</pub-id>, PMID: <pub-id pub-id-type="pmid">21278807</pub-id></citation></ref>
<ref id="ref45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Williams</surname> <given-names>R. H.</given-names></name> <name><surname>Zimmerman</surname> <given-names>D. W.</given-names></name></person-group> (<year>1977</year>). <article-title>The reliability of difference scores when errors are correlated</article-title>. <source>Educ. Psychol. Meas.</source> <volume>37</volume>, <fpage>679</fpage>&#x2013;<lpage>689</lpage>. doi: <pub-id pub-id-type="doi">10.1177/001316447703700310</pub-id></citation></ref>
<ref id="ref46"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Zumbo</surname> <given-names>B. D.</given-names></name></person-group> (<year>1999</year>). &#x201C;<article-title>The simple difference score as an inherently poor measure of change: some reality, much mythology</article-title>&#x201D; in <source>Advances in social science methodology, vol 5</source>. ed. <person-group person-group-type="editor"><name><surname>Thompson</surname> <given-names>B.</given-names></name></person-group> (<publisher-loc>Leeds, England</publisher-loc>: <publisher-name>Emerald Group Publishing Limited</publisher-name>), <fpage>269</fpage>&#x2013;<lpage>304</lpage>.</citation></ref>
</ref-list>
</back>
</article>