<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Pharmacol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Pharmacology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Pharmacol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1663-9812</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1380586</article-id>
<article-id pub-id-type="doi">10.3389/fphar.2026.1380586</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Estimating real-world treatment effects in the presence of measurement error and sparse outcome data using propensity score methods</article-title>
<alt-title alt-title-type="left-running-head">Burnell et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fphar.2026.1380586">10.3389/fphar.2026.1380586</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Burnell</surname>
<given-names>Jane</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal Analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing &#x2013; review and editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Banerjee</surname>
<given-names>Amitava</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing &#x2013; review and editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Prescott</surname>
<given-names>Gordon</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing &#x2013; review and editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sutton</surname>
<given-names>Chris</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing &#x2013; review and editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Tishkovskaya</surname>
<given-names>Svetlana</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2395079"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing &#x2013; review and editing</role>
</contrib>
</contrib-group>
<aff id="aff1">
<label>1</label>
<institution>Lancashire Clinical Trials Unit, Applied Health Research Hub, University of Lancashire</institution>, <city>Preston</city>, <country country="GB">United Kingdom</country>
</aff>
<aff id="aff2">
<label>2</label>
<institution>Institute of Health Informatics, University College London</institution>, <city>London</city>, <country country="GB">United Kingdom</country>
</aff>
<author-notes>
<corresp id="c001">
<label>&#x2a;</label>Correspondence: Svetlana Tishkovskaya, <email xlink:href="mailto:stishkovskaya@lancashire.ac.uk">stishkovskaya@lancashire.ac.uk</email>
</corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-09">
<day>09</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>17</volume>
<elocation-id>1380586</elocation-id>
<history>
<date date-type="received">
<day>01</day>
<month>02</month>
<year>2024</year>
</date>
<date date-type="rev-recd">
<day>28</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>13</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Burnell, Banerjee, Prescott, Sutton and Tishkovskaya.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Burnell, Banerjee, Prescott, Sutton and Tishkovskaya</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-09">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>The real-world treatment effect of a novel treatment can be estimated by analysing routinely collected patient data, in the form of Electronic Health Records (EHR). Any treatment allocation in EHR is not randomised and there may be systematic differences between the treatment groups. Propensity Score (PS) methods are commonly used to correct for these differences and reduce the bias in the treatment effect estimate. The aims of the study were to compare the performance of the most popular PS methods in the estimation of the treatment effect in the presence of two common issues in EHRs: covariate measurement error and sparse data.</p>
</sec>
<sec>
<title>Methods</title>
<p>The motivational example for this study was the assessment of the treatment effect of the novel oral anti-coagulant Rivaroxaban compared with the previous standard treatment Warfarin for the prevention of future stroke in patients with atrial fibrillation. Using simulation experiments based on a dataset comparing Rivaroxaban with Warfarin, we evaluated the performance of four PS methods.</p>
</sec>
<sec>
<title>Results</title>
<p>In the simulations with characteristics of the original dataset, using 3:1&#xa0;PS matching generated a largest bias of &#x2b;0.0428 (corresponding ratio of HRs (rHR) 1.0437), whereas for the other PS methods it was smaller and in negative direction: IPTW for ATE -0.0181 (rHR &#x3d; 0.9821); IPTW for ATT -0.0110 (rHR &#x3d; 0.9891); PS stratification &#x2212;0.0099 (rHR &#x3d; 0.9901), with relative differences between rHRs being small to negligible. Fifty percent under-recording of a covariate (stroke) in the PS model, increased the MSE between 6% and 11% compared to the MSE with no introduced measurement error. While 50% over-recording reduced the MSE by around 35%. The difference in the bias of the low prevalence outcome (0.5%) and the high prevalence outcome (10%) was: IPTW for ATE 0.1514 (rHRs &#x3d; 1.1635); IPTW for ATT 0.0160 (rHRs &#x3d; 1.0161); 3:1&#xa0;PS matching 0.0758 (rHRs &#x3d; 1.0787); PS Stratification 0.0177 (rHRs &#x3d; 1.0179). A similar pattern for outcome prevalence was seen for all the simulation scenarios.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>This study showed that PS methods proposed in the literature may not all perform well for individual datasets. The findings produced recommendations for using PS methods in the estimation of real-world treatment effect when the covariate measurement error and sparse outcome data are present.</p>
</sec>
</abstract>
<kwd-group>
<kwd>electronic health records</kwd>
<kwd>measurement error</kwd>
<kwd>oral anti-coagulant</kwd>
<kwd>propensity score methods</kwd>
<kwd>real-world treatment effect</kwd>
<kwd>sparse outcome data</kwd>
<kwd>stroke</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This research was supported by funding from University of Lancashire and partly funded by the National Institute for Health and Care Research Applied Research Collaboration North West Coast (NIHR ARC NWC). The research was also supported by funding from the European Research Council under the European Union&#x2019;s Seventh Framework Programme (FP/2007-2013)/ERC Grant Agreement no. 339239 (data acquisition).</funding-statement>
</funding-group>
<counts>
<fig-count count="8"/>
<table-count count="4"/>
<equation-count count="1"/>
<ref-count count="60"/>
<page-count count="16"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Drugs Outcomes Research and Policies</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>Although a Randomised Controlled Trial (RCT) is seen as the gold standard for estimating the effect of a novel treatment (<xref ref-type="bibr" rid="B52">Sibbald and Roland, 1998</xref>), the treatment effect in a real-world setting when it is prescribed to a more general population is likely to be different. Electronic Health Records (EHR) data offers the opportunity for the estimation of the real-world treatment effect from observational studies. However, the treatment allocation is not randomised so there are likely be systematic differences between the treatment groups, and, if this is not accounted for, the treatment effect estimate will be biased. Propensity Score (PS) methods (<xref ref-type="bibr" rid="B48">Rosenbaum and Rubin, 1983</xref>) are popular in applied medical research for adjusting for this treatment allocation bias.</p>
<p>PS analysis works within the Potential Outcomes Framework (or Counterfactual Framework) where every participant can have two potential outcomes. For participant <italic>i</italic> these are <italic>Y</italic>
<sub>
<italic>i</italic>
</sub>(0) if the control treatment were received and <italic>Y</italic>
<sub>
<italic>i</italic>
</sub>(1) if the novel treatment were received. The treatment effect for participant <italic>i</italic> would be <italic>Y</italic>
<sub>
<italic>i</italic>
</sub>(1) &#x2212; <italic>Y</italic>
<sub>
<italic>i</italic>
</sub>(0). Each participant will only receive one of the treatments (the other is counterfactual) so this cannot be calculated. The observed outcome is <italic>Y</italic>
<sub>
<italic>i</italic>
</sub> &#x3d; <italic>Z</italic>
<sub>
<italic>i</italic>
</sub>
<italic>Y</italic>
<sub>
<italic>i</italic>
</sub>(1) &#x2b; (1 &#x2212; <italic>Z</italic>
<sub>
<italic>i</italic>
</sub>)<italic>Y</italic>
<sub>
<italic>i</italic>
</sub>(0) where <italic>Z</italic> &#x3d; 0 for the control treatment and <italic>Z</italic> &#x3d; 1 for the novel treatment. Using all participants in the study population <italic>E</italic>[<italic>Y</italic>(1) &#x2212; <italic>Y</italic>(0)] will give the Average Treatment Effect (ATE) (<xref ref-type="bibr" rid="B36">Imbens, 2004</xref>), that is the average effect of moving all those in the population from untreated to treated. The Average Treatment Effect of the Treated (ATT) is given by <italic>E</italic>[<italic>Y</italic>(1)&#x2013; <italic>Y</italic>(0) &#x7c;<italic>Z</italic> &#x3d; 1 ] (<xref ref-type="bibr" rid="B36">Imbens, 2004</xref>), that is the average effect of moving those who actually received the active treatment from untreated to treated.</p>
<p>PS methods comprise of a range of approaches to balancing treatment groups, thus reducing the treatment allocation bias and hence obtaining a less biased estimate for the treatment effect estimate. The PS is the probability of receiving the novel treatment calculated from covariates thought to affect the treatment allocation and/or the outcome. This is regarded as a two-step approach; firstly the PS analysis is applied to adjust for treatment allocation bias and secondly the outcome analysis is performed. Propensity score methods provide a robust way to include the confounders (and competing treatments if necessary) in the outcome model and is rapidly becoming the &#x2018;gold standard&#x2019; means to condition for confounders.</p>
<p>If the value of an observation does not match the true value of the quantity (or characteristic) being measured, this is known as &#x2018;measurement error&#x2019; (<xref ref-type="bibr" rid="B55">Wallace, 2020</xref>). There has been a lack of application of measurement error methods within applied research (<xref ref-type="bibr" rid="B24">De Gil et al., 2015</xref>; <xref ref-type="bibr" rid="B43">Millimet, 2011</xref>). The types of measurement error which may occur in EHR are covariate measurement error, outcome measurement error and treatment allocation measurement error. The measurement error investigated in this study is non-differential measurement error, that is the measurement error is assumed to be the same for each treatment group, in a covariate in the treatment allocation model, the PS model. If covariate measurement error exists, the treatment groups will be balanced on the observed rather than the true covariates, so differences between the treatment groups will still exist, leading to a source of bias in the outcome analysis (<xref ref-type="bibr" rid="B44">Nguyen and Stuart, 2020</xref>). Its impact when using PS conditioning was demonstrated by <xref ref-type="bibr" rid="B21">Conover et al. (2021)</xref>, <xref ref-type="bibr" rid="B24">De Gil et al. (2015)</xref> and <xref ref-type="bibr" rid="B35">Hong, Aaby, Siddique and Stuart (2019)</xref>.</p>
<p>Measurement error adjustment methods which could be applied to similar data can be categorised as: generic methods, where the measurement error adjustment is applied to the data then the standard PS analysis is carried out; and specific to PS analysis, where the measurement error adjustment is combined with the PS analysis. Generic methods to address measurement error include: Multiple Over-imputation (MO) (<xref ref-type="bibr" rid="B10">Blackwell et al., 2017</xref>); Simulation Extrapolation (SIMEX) (<xref ref-type="bibr" rid="B22">Cook and Stefanski, 1994</xref>); Minimal Assumption Bounds (<xref ref-type="bibr" rid="B9">Black et al., 2000</xref>); Regression Calibration (<xref ref-type="bibr" rid="B17">Carroll and Stefanski, 1990</xref>). Methods which perform measurement adjustment specifically in PS analysis include: (<xref ref-type="bibr" rid="B12">Braun et al., 2017</xref>; <xref ref-type="bibr" rid="B25">Dong and Millimet, 2020</xref>; <xref ref-type="bibr" rid="B34">Hong et al., 2017</xref>; <xref ref-type="bibr" rid="B46">Raykov, 2012</xref>; <xref ref-type="bibr" rid="B51">Rudolph and Stuart, 2018</xref>; <xref ref-type="bibr" rid="B56">Webb-Vargas, Rudolph, Lenis, Murakami &#x26; Stuart, 2017</xref>). These methods were not used as the focus of this study is to investigate the effect of measurement error when using PS methods.</p>
<p>Another typical problem of EHR datasets is sparseness in data and it can be caused by any of the following: small sample size (<xref ref-type="bibr" rid="B53">Siino et al., 2018</xref>); rare exposure (treatment) (<xref ref-type="bibr" rid="B30">Hajage, Tubach, Steg, Bhatt &#x26; De Rycke, 2016</xref>); rare outcome events (<xref ref-type="bibr" rid="B53">Siino et al., 2018</xref>) which lead to a low number of events per variable (EPV) (<xref ref-type="bibr" rid="B29">Greenland et al., 2016</xref>); unbalanced or highly predictive risk factor variables (<xref ref-type="bibr" rid="B53">Siino et al., 2018</xref>) with narrow distributions or categories which are uncommon; variables which almost perfectly predict the outcome (<xref ref-type="bibr" rid="B29">Greenland et al., 2016</xref>); variables that together almost perfectly predict the exposure (treatment) (<xref ref-type="bibr" rid="B29">Greenland et al., 2016</xref>). Sparse outcome data are the focus of this study.</p>
<p>Sparse data bias produces treatment effect estimates away from the null, so inflated treatment effect estimates are produced. PS methods, Penalised Likelihood Estimation (PLE), Data Augmentation and Bayesian methods are some of the methods to avoid or reduce bias due to sparse data. The current study is limited to the use of PS methods. PS methods reduce sparse data bias by combining the information from several variables into one, making the number of EPV higher in the outcome model.</p>
<p>This study compares the performance of four commonly used PS methods when using EHRs to estimate the real-world treatment effect of a novel product in the presence of other real-world problems associated with EHR data: covariate measurement error and sparse outcome data. Generally the literature only considers one of these problems when comparing the performance of PS methods. The analysis was performed on an extract from The Health Improvement Network (THIN), UK primary care data, containing data from patients with atrial fibrillation (AF) prescribed the Novel Oral Anti-Coagulant (NOAC), Rivaroxaban, compared to the control, Warfarin an Oral Anti-Coagulant (OAC), in the prevention of future stroke. The outcome data were in time-to-event format with future stroke or TIA being an event of interest. The dataset represented typical real-world problems associated with EHR data: covariate measurement error and sparse outcome data.</p>
</sec>
<sec sec-type="methods" id="s2">
<title>Methods</title>
<sec id="s2-1">
<title>Study dataset</title>
<p>This study used a data extract from THIN, one of the UK primary care datasets, supplied to the Performance-Based Innovation Rewards study (REWARD) (<xref ref-type="bibr" rid="B7">Banerjee et al., 2020</xref>), containing data for 21,259 patients with AF. The study dataset was selected using: the first NOAC/OAC prescription was for Rivaroxaban or Warfarin; the first NOAC/OAC prescription date was after the National Institute for Health and Care Excellence (NICE) approval date for the Rivaroxaban (May 2012); the patients were NOAC/OAC-na&#xef;ve, meaning that this was the first NOAC/OAC prescription this patient was recorded as being prescribed. The analysis was to estimate the treatment effect of Rivaroxaban compared to Warfarin in the prevention of future stroke.</p>
</sec>
<sec id="s2-2">
<title>Propensity score conditioning</title>
<p>The literature suggests the steps to run a PS analysis are: generate the PS model; check for common They implement measurement error in different ways is there is sufficient overlap of the PS distributions of the two treatment groups; apply the PS method; check for balance, that checks how well the PS model has been defined, and is implemented by checking that the PS method used has balanced the distribution of each covariate in the PS model between the treatment groups; estimate treatment effect (<xref ref-type="bibr" rid="B1">Austin, 2009a</xref>; <xref ref-type="bibr" rid="B4">Austin, 2011b</xref>; <xref ref-type="bibr" rid="B27">Garrido et al., 2014</xref>; <xref ref-type="bibr" rid="B40">Li, 2013</xref>). If any of the tests fail, then the PS model should be redefined and the process started again. This can be an iterative process.</p>
<p>Conditional on the true PS, treatment allocation is independent of the measured covariates. This means treated and untreated cases with the same true PS will have the same covariate distribution (<xref ref-type="bibr" rid="B48">Rosenbaum and Rubin, 1983</xref>). If the distribution of the covariates is similar for the cases with the same PS, then the PS is sufficiently well defined (<xref ref-type="bibr" rid="B33">Ho, Imai, King &#x26; Stuart, 2007</xref>). As the estimated PS is being generated, tests on the difference of the covariate distributions will indicate if the estimated PS is sufficiently close to the true PS (<xref ref-type="bibr" rid="B1">Austin, 2009a</xref>).</p>
<p>Logistic Regression was selected for the PS model in this study, as part of Generalized Linear Models family which are a traditional approach of directly adjusting for confounding. The literature presents different options for the selection of the covariates to include in the PS model. In this study, variables which influenced the prescribing (treatment allocation), were included in the PS model (although they may have affected the outcome).</p>
<p>Clinically relevant variables for the PS model were selected from advice by clinicians and supported by the literature: stroke (<xref ref-type="bibr" rid="B31">Hankey et al., 2012</xref>; <xref ref-type="bibr" rid="B58">Toso, 2014</xref>), alcohol misuse (<xref ref-type="bibr" rid="B6">Baczek et al., 2012</xref>), chronic kidney disease (<xref ref-type="bibr" rid="B11">Boriani et al., 2016</xref>), liver disease (<xref ref-type="bibr" rid="B37">Lai et al., 2016</xref>), CHA2DS2-VASc score the stroke risk score for patients with Atrial Fibrillation (<xref ref-type="bibr" rid="B28">Giralt-Steinhauer et al., 2013</xref>; <xref ref-type="bibr" rid="B38">Lee, Monz, Clemens, Brueckmann &#x26; Lip, 2012</xref>), HAS-BLED score the risk of major bleeding for patients on anticoagulation for AF (<xref ref-type="bibr" rid="B59">O&#x27;Caoimh et al., 2017</xref>), ischaemic heart disease used to indicate previous myocardial infarction (<xref ref-type="bibr" rid="B8">Bhatia and Lip, 2004</xref>), and age (<xref ref-type="bibr" rid="B60">Wolff et al., 2015</xref>). All clinically relevant variables were kept in the PS model, regardless of their statistical significance during the model selection process. Other non-clinically relevant variables which were seen to affect prescribing (identified from the data) were retained in the model if were statistically significant (p &#x3c; 0.05). The &#x2018;best&#x2019; model was selected, using the Bayesian Information Criterion (BIC) and further refined to give the PS model as shown in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>The refined treatment allocation model for the RI-WA dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Covariate</th>
<th align="left">Coefficient</th>
<th align="left">SE of coefficient</th>
<th align="left">p</th>
<th align="left">[95% CI]</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Previous stroke</td>
<td align="right">0.123</td>
<td align="right">0.061</td>
<td align="right">0.04</td>
<td align="right">(0.004, 0.242)</td>
</tr>
<tr>
<td align="left">Alcohol misuse</td>
<td align="right">0.098</td>
<td align="right">0.128</td>
<td align="right">0.45</td>
<td align="right">(-0.153, 0.348)</td>
</tr>
<tr>
<td align="left">Chronic kidney disease</td>
<td align="right">0.008</td>
<td align="right">0.051</td>
<td align="right">0.87</td>
<td align="right">(-0.093, 0.109)</td>
</tr>
<tr>
<td align="left">Liver disease</td>
<td align="right">0.033</td>
<td align="right">0.437</td>
<td align="right">0.94</td>
<td align="right">(-0.825, 0.890)</td>
</tr>
<tr>
<td align="left">Ischemic heart disease</td>
<td align="right">&#x2212;0.082</td>
<td align="right">0.051</td>
<td align="right">0.11</td>
<td align="right">(-0.181, 0.018)</td>
</tr>
<tr>
<td align="left">First NOAC/OAC prescription was &#x2264;28 days of first AF diagnosis?</td>
<td align="right">&#x2212;0.192</td>
<td align="right">0.042</td>
<td align="right">&#x3c;0.001</td>
<td align="right">(-0.275, &#x2212;0.110)</td>
</tr>
<tr>
<td align="left">&#x3d; 86 if age&#x2264;86, else &#x3d; age</td>
<td align="right">0.077</td>
<td align="right">0.013</td>
<td align="right">&#x3c;0.001</td>
<td align="right">(0.053, 0.102)</td>
</tr>
<tr>
<td align="left">Licence1&#x2a;</td>
<td align="right">0.153</td>
<td align="right">0.011</td>
<td align="right">&#x3c;0.001</td>
<td align="right">(0.131, 0.175)</td>
</tr>
<tr>
<td align="left">Licence1<sup>2</sup>&#x2a;</td>
<td align="right">&#x2212;0.001</td>
<td align="right">&#x3c;0.001</td>
<td align="right">&#x3c;0.001</td>
<td align="right">(-0.002, &#x2212;0.001)</td>
</tr>
<tr>
<td align="left">Constant term</td>
<td align="right">&#x2212;10.830</td>
<td align="right">1.096</td>
<td align="right">&#x3c;0.001</td>
<td align="right">(-12.979, &#x2212;8.682)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>&#x2a;Licence1 is the Rivaroxaban licence date to date of first NOAC/OAC, prescription, in months.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>
<xref ref-type="fig" rid="F1">Figure 1</xref> shows that there was good common support in this dataset when using this model.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Histogram of Propensity Score, using Stata&#x2019;s -psgraph-, for Rivaroxaban (Treated) and Warfarin (Untreated) for the RI-WA dataset.</p>
</caption>
<graphic xlink:href="fphar-17-1380586-g001.tif">
<alt-text content-type="machine-generated">Bar chart comparing distributions of untreated (blue) and treated (red) groups across propensity score intervals. Untreated bars are shown below and treated bars above reference line, with greater frequencies at lower scores for untreated.</alt-text>
</graphic>
</fig>
<p>There are four general categories of methods for using PS to remove the effect of confounding, that is potential differences in characteristics between the treatment groups: PS matching, stratification on the PS, inverse probability treatment weighting (IPTW) on the PS and covariate adjustment on the PS (<xref ref-type="bibr" rid="B3">Austin, 2011a</xref>). In this study, PS matching, IPTW for ATE, IPTW for ATT and PS stratification were used. PS matching creates matched pairs, or groups, by matching each treated participant to one or more untreated participant with a similar PS. The estimate of treatment effect is generated from the matched sample or dataset, retaining only cases for whom a match is made, meaning that it is smaller than the full dataset used by other PS conditioning methods. Several PS matching methods were considered, (the details are presented in (<xref ref-type="bibr" rid="B14">Burnell, 2022</xref>) Appendix B-6.2, and 3:1 nearest neighbour matching with replacement was chosen for use as it generated a larger matched dataset with more outcome events than the 1:1 matching methods. The original dataset had considerably more Warfarin patients (18,348) than Rivaroxaban patients (2,911) which provided a pool of Warfarin controls for matching to the active Rivaroxaban cases. The Stata community-written command -psmatch2- (<xref ref-type="bibr" rid="B39">Leuven and Sianesi, 2003</xref>) was used to apply and implement this. The balancing checks which were applied to the matched dataset were: comparison of the PS distribution between the treatment groups, standardised differences of the variables and the number of matched pairs/groups generated, ((<xref ref-type="bibr" rid="B14">Burnell, 2022</xref>), Appendix B-6.3). These all confirmed that the PS matching had balanced the data sufficiently well.</p>
<p>IPTW on the PS (<xref ref-type="bibr" rid="B47">Rosenbaum, 1987</xref>) uses weights, based on the PS, to generate a synthetic dataset or sample. The weight is defined as the inverse probability of receiving the treatment the participant actually received. In this study, IPTW, implemented using the Stata community-written command -propwt- (<xref ref-type="bibr" rid="B42">Lunt &#x26; Linden, 2023</xref>), was used to estimate the ATE and ATT with a different formula used for the calculation of weights for the ATE and ATT. Balance checking was performed on a single run on the original dataset, with no measurement error added. The standardised means were compared between the treatment groups and the continuous variables plotted to compare their distributions between the treatment groups, (<xref ref-type="bibr" rid="B14">Burnell, 2022</xref>), Appendix B-6.4. These showed the weights applied for IPTW for ATT and IPTW for ATE balanced the standardised means of each variable in the PS model between the treatment groups.</p>
<p>Stratification on the PS (<xref ref-type="bibr" rid="B49">Rosenbaun and Rubin, 1984</xref>) is a form of subclassification, used to reduce bias. By stratifying on the PS, rather than the individual covariates, less strata are needed. The records of all participants are ordered by PS, then grouped into strata. The treatment effect is estimated within each stratum and then these stratum-specific results pooled, or similar, to generate the ATE and the SE of the estimate. Balance checking visually compared standardised differences of the variables between treatment groups following PS stratification with those in the original data, further details are provided in <xref ref-type="sec" rid="s12">Supplementary Table S1</xref> and also in (<xref ref-type="bibr" rid="B14">Burnell, 2022</xref>), Appendix B-6.5. PS stratification using 5, 10 and 50 strata all reduced the standardized differences. 10 strata were chosen for use in this study because it reduced the standardised differences more than 5 strata and each stratum was less sparse than when 50 strata were used.</p>
</sec>
<sec id="s2-3">
<title>Outcome modelling</title>
<p>The primary outcome in the dataset was future stroke. The outcome analysis was performed on time-to-event data, that is time to first stroke following the first NOAC/OAC prescription, using survival analysis methods. Different implementations of Cox regression, which estimated treatment effect, were used to take account of the matched or weighted nature of the data. When using PS matching and PS stratification, Cox regression with stratification was used where each stratum was a matched pair or group in which the baseline hazard was assumed to be constant. When using IPTW, for both the ATE and ATT, the weights generated by IPTW were used directly as an option in the Cox regression. This weight was then used as Stata&#x2019;s <italic>pweight</italic> (probability weights which represent the probability of the case being used in the sample and is proportional to the probability of the case being sampled) in the outcome analysis.</p>
<p>The outcome model was fitted to the analysis dataset used following PS matching. However, these same variables were used for the other PS methods, PS stratification, IPTW for ATE and IPTW for ATT, without refitting the model to the full dataset. This was done for consistency between the PS methods. The chosen model was the four clinically relevant variables identified as significant from the univariate modelling (prescribed blood pressure lowering medication, prescribed statins, prescribed antiplatelets and hypercholesterolemia), the CHA2DS2-VASc score (<xref ref-type="bibr" rid="B41">Lip et al, 2010</xref>) and treatment (<xref ref-type="table" rid="T2">Table 2</xref>). The estimated treatment effect is conditional on the variables in the outcome model. For use in the simulations a baseline hazard function was required. A Weibull distribution was fitted to the data because of the flexibility it offers, by varying its shape parameter, &#x3b3;, the distribution of the function changes.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>The outcome model selected for use. The model includes treatment, the 4 most significant univariate variables and the CHA2DS2-VASc score.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Covariate</th>
<th align="center">HR</th>
<th align="left">SE of HR</th>
<th align="center">95% CI of HR</th>
<th align="left">Coeffi- cient&#x2a;</th>
<th align="center">SE of coeffi- cient</th>
<th align="left">95% CI of coefficient</th>
<th align="left">p- value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Treatment</td>
<td align="center">1.534</td>
<td align="right">0.383</td>
<td align="center">(0.940, 2.504)</td>
<td align="right">0.428</td>
<td align="right">0.250</td>
<td align="right">(-0.062, 0.918)</td>
<td align="center">0.087</td>
</tr>
<tr>
<td align="left">Prescribed blood pressure lowering medication</td>
<td align="center">0.339</td>
<td align="right">0.110</td>
<td align="center">(0.180, 0.639)</td>
<td align="right">&#x2212;1.081</td>
<td align="right">0.323</td>
<td align="right">(-1.714, &#x2212;0.448)</td>
<td align="center">0.001</td>
</tr>
<tr>
<td align="left">Prescribed statins</td>
<td align="center">0.677</td>
<td align="right">0.245</td>
<td align="center">(0.333, 1.378)</td>
<td align="right">&#x2212;0.390</td>
<td align="right">0.362</td>
<td align="right">(-1.100, 0.321)</td>
<td align="center">0.282</td>
</tr>
<tr>
<td align="left">Prescribed antiplatelets</td>
<td align="center">0.646</td>
<td align="right">0.225</td>
<td align="center">(0.326, 1.279)</td>
<td align="right">&#x2212;0.437</td>
<td align="right">0.349</td>
<td align="right">(-1.121, 0.246)</td>
<td align="center">0.210</td>
</tr>
<tr>
<td align="left">Hypercholesterolemia</td>
<td align="center">0.729</td>
<td align="right">0.269</td>
<td align="center">(0.354, 1.502)</td>
<td align="right">&#x2212;0.316</td>
<td align="right">0.369</td>
<td align="right">(-1.039, 0.407)</td>
<td align="center">0.391</td>
</tr>
<tr>
<td align="left">CHA2DS2-VASc score</td>
<td align="center">1.360</td>
<td align="right">0.165</td>
<td align="center">(1.073, 1.725)</td>
<td align="right">0.308</td>
<td align="right">0.121</td>
<td align="right">(0.070, 0.545)</td>
<td align="center">0.011</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>&#x2a;Coefficient is the log(hazard ratio) - presented as it was used in the simulation process.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s2-4">
<title>Simulation method</title>
<p>The simulated datasets were generated using a <italic>plasmode</italic> simulation method (<xref ref-type="bibr" rid="B54">Vaughan et al., 2009</xref>) which is a resampling method where the draws of cases, that is &#x2018;individual patient records&#x2019;, are made from the original data and the resulting cases copied to the generated dataset. This preserves the relationship between the baseline variables for each case and hence accounts for and reflects the characteristics and specific features of the original real-world dataset. Once a dataset had been created, measurement error was introduced into the variable for previous stroke, to represent under- or over-recording of that variable, and an amended value generated for the PS value and CHA2DS2- VASc score. Variables for the simulated treatment allocation, simulated survival time and simulated survival outcome were created using the baseline variables, the chosen values for the effect size in the PS model of the variable with measurement error and the outcome prevalence. Under-recording was implemented as negative measurement error of previous stroke and over-recording of a was implemented as positive measurement error of previous stroke. The treatment effect was estimated from the dataset (using the simulated variables) and recorded. Performance measures of the PS methods, mean, SD, bias, mean squared error (MSE), percentage change MSE and mean Model SE, were calculated from the treatment effect estimates from all the generated datasets. The calculation for all simulation runs used an assumed true mean obtained from a single simulation run using the original dataset. It was generated as a plausible value to use in all simulations for estimations of both the ATE and the ATT. The implementation of the simulation experiment implies that the performance measures are relative to the assumed true mean estimated as 0.3674.</p>
<p>The number of simulations required for each PS method at each prevalence was chosen via a precision-based sample size calculation using an acceptable width of a 95%CI for the mean treatment effect estimate. The 95%CI was determined by calculating CI widths of the mean treatment effect estimate from simulations using 1,000 datasets, and determining an acceptable CI width. This was then used to calculate the number of simulations required. A rationale for choosing the acceptable CI width was based on the magnitude of the true value of the treatment effect, 0.3674, calculated using the dataset with the original characteristics. The CI width of no more than 10% of this effect parameter, 0.0367, was deemed as acceptable. This was supported by visual inspection of plots of the mean of the treatment effect estimate, from which a CI of 0.04 was thought to be too high and CI between 0.02 and 0.03 was thought to be acceptable. Combining this information, an acceptable CI width of 0.035 was decided upon. It is acknowledged that the selection of an acceptable CI is subjective.</p>
<p>The simulation process is shown as a flow diagram in <xref ref-type="fig" rid="F2">Figure 2</xref>. A dataset was generated using plasmode simulation, measurement error for previous stroke was introduced and additional variables generated using the previous stroke with measurement error and its effect size in the PS model. For the generated dataset, PS conditioning was applied and the outcome analysis performed using Cox PH regression and the treatment effect estimate recorded. This process was repeated for the required number of datasets and the performance measures calculated for the whole simulation run.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Flow diagram of the simulations process (CV_score is CHA2DS2-VASc score).</p>
</caption>
<graphic xlink:href="fphar-17-1380586-g002.tif">
<alt-text content-type="machine-generated">Flowchart titled &#x22;Simulations Process&#x22; outlines steps in a simulation, including model definitions, dataset creation with bootstrapping, measurement error amendments, case-specific data generation, dataset stratification or matching, Cox regression analysis, and calculation of estimates and errors. Blue rectangular boxes and arrows show the sequence and options.</alt-text>
</graphic>
</fig>
<p>Primary care data may under-record events such as stroke, which are treated in secondary care, by 25%&#x2013;35% (<xref ref-type="bibr" rid="B13">Burnell, 2015</xref>, <xref ref-type="bibr" rid="B32">Herrett et al., 2013</xref>). It is possible that there is over-recording of stroke so, to provide the complete picture, the current study looks at measurement error in both directions, that is both under-recording and over-recording. The chosen range of the measurement error was expanded to - 50% to &#x2b;50%, which included the provisional estimate of 25%&#x2013;35% under-recording.</p>
<p>Coefficients to represent high, medium and low effect size for previous stroke were generated using the following method.</p>
<p>The Odds Ratio (OR) of interest is<disp-formula id="equ1">
<mml:math id="m1">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>R</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>o</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>s</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>o</mml:mi>
<mml:mi>f</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>v</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>g</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>R</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>v</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>x</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>b</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>i</mml:mi>
<mml:mi>f</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>h</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>d</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>v</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>s</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>k</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>o</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>s</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>o</mml:mi>
<mml:mi>f</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>v</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>g</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>R</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>v</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>x</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>b</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>i</mml:mi>
<mml:mi>f</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>n</mml:mi>
<mml:mi>o</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>v</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>s</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>k</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>If <inline-formula id="inf1">
<mml:math id="m2">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b2;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the coefficient for previous stroke in the PS model, then <inline-formula id="inf2">
<mml:math id="m3">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>R</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>exp</mml:mi>
<mml:mo>&#x2061;</mml:mo>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b2;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> Cohen&#x2019;s <italic>d</italic> is the standardised mean difference between two group means, the effect size underlying power calculations for the two-sample t-test (<xref ref-type="bibr" rid="B20">Cohen, 1988</xref>). Cohen&#x2019;s <italic>d</italic> &#x3d; 0.2, 0.5, and 0.8 are often used to indicate a low, medium, and high effect size (<xref ref-type="bibr" rid="B19">Chen, Cohen and Chen, 2010</xref>). <xref ref-type="bibr" rid="B19">Chen, Cohen and Chen (2010)</xref> calculated the Odds Ratios (OR) equivalent to Cohen&#x2019;s <italic>d</italic>, for low, medium and large effect size and presented the OR for different disease rates in the non-exposed group.</p>
<p>The calculated values of ORs, which were relevant to this study, are given in <xref ref-type="table" rid="T3">Table 3</xref> and informed the values of the coefficient used to represent the low, medium and large effect size based on Cohen&#x2019;s <italic>d</italic>. The coefficient of previous stroke in the PS model was generated as <inline-formula id="inf3">
<mml:math id="m4">
<mml:mrow>
<mml:mi>ln</mml:mi>
<mml:mo>&#x2061;</mml:mo>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. This value was supplied as a parameter to the simulations and used in the PS model.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Effect sizes for prevalence of RI is generated treatment of 1% and 10%.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left">Prevalence&#x2a;&#x2a;</th>
<th colspan="3" align="center">Low effect<break/>Cohen&#x2019;s d &#x3d; 0.2</th>
<th colspan="3" align="center">Medium effect<break/>Cohen&#x2019;s d &#x3d; 0.5</th>
<th colspan="3" align="center">Large effect<break/>Cohen&#x2019;s d &#x3d; 0.8</th>
</tr>
<tr>
<th align="center">OR</th>
<th align="center">Coefficient</th>
<th align="center">Xorig&#x2a;</th>
<th align="center">OR</th>
<th align="center">Coefficient</th>
<th align="center">Xorig&#x2a;</th>
<th align="center">OR</th>
<th align="center">Coefficient</th>
<th align="center">Xorig&#x2a;</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="right">0.01 (1%)</td>
<td align="right">1.6814</td>
<td align="right">0.519627</td>
<td align="right">4.2</td>
<td align="right">3.4739</td>
<td align="right">1.24528</td>
<td align="right">10.1</td>
<td align="right">6.7128</td>
<td align="right">1.90402</td>
<td align="right">15.5</td>
</tr>
<tr>
<td align="right">0.1 (10%)</td>
<td align="right">1.4615</td>
<td align="right">0.379463</td>
<td align="right">3.1</td>
<td align="right">2.4972</td>
<td align="right">0.91517</td>
<td align="right">7.4</td>
<td align="right">4.1387</td>
<td align="right">1.42038</td>
<td align="right">11.6</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>&#x2a; The multiple of the original coefficient, 0.1229108.</p>
</fn>
<fn>
<p>&#x2a;&#x2a;Prevalence of RI (novel treatment) is generated treatment.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>This change of effect size related to the PS modelling which was used to correct for treatment allocation bias. The &#x2018;outcome&#x2019; in this case was the generated treatment, which was created using the participant&#x2019;s PS value. The &#x2018;untreated&#x2019; group was those with no previous stroke, those with a generated treatment of Rivaroxaban (the NOAC) contributed to the &#x2018;outcome prevalence&#x2019;. In the study data the outcome prevalence took values between 13% and 14.2%, so the values quoted for the 10% prevalence in <xref ref-type="table" rid="T3">Table 3</xref> were used to change the effect size of previous stroke in the PS model. Rounding these parameters for use in the simulation runs, the coefficient of previous stroke in the PS model took the values of 0.5 for low effect size, 1.0 for medium effect size and 1.5 for large effect size. When the PS model was fitted to the original data, the effect size of previous stroke was 0.123. This was &#x2018;very low&#x2019; compared with Cohen&#x2019;s classification. Simulations using this very low (or original) effect size are also presented.</p>
<p>For the outcome prevalence the values chosen for the simulation experiment were approximately 1% prevalence, which is similar to the original dataset, approximately 0.5% prevalence to investigate the effect of a lower prevalence, and approximately 10% prevalence to investigate the effect of data which does not suffer from substantial sparseness of outcomes. This was implemented in the Weibull baseline hazard function by varying &#x3bb; (the scale parameter) and keeping &#x3b3; (the shape parameter) constant.</p>
<p>In summary the parameters used in the simulations are given in <xref ref-type="table" rid="T4">Table 4</xref>.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Parameters and their values used in the simulation runs.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Parameter</th>
<th align="center">Values</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Measurement error in previous stroke in the<break/>PS model</td>
<td align="left">&#x2212;50%, &#x2212;30%, &#x2212;10%, 0%, &#x2b;10%, &#x2b;30%, &#x2b;50%</td>
</tr>
<tr>
<td align="left">Effect size of variable with measurement error</td>
<td align="left">0.123 (original), 0.5 (low), 1.0 (medium) and 1.5 (high)</td>
</tr>
<tr>
<td align="left">Outcome prevalence of future stroke</td>
<td align="left">0.5%, 1%&#x2a;, 10%</td>
</tr>
<tr>
<td align="left">Sample size, N, the number of simulated datasets</td>
<td align="left">Specific to each PS method for each outcome prevalence</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>&#x2a;Outcome prevalence in the original study dataset.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>A separate heatplot is displayed for each performance measure, using the same layout. On the y-axis, each PS method reports the results from the effect sizes of the covariate in the PS model with measurement error, Original, Low, Medium and High. On the x-axis within each outcome prevalence, 0.5%, 1% and 10%, results are reported for the measurement error, &#x2212;50% to &#x2b;50%. Each cell therefore reports the value of the performance measure for the given PS method, effect size of the covariate in the PS model with measurement error, outcome prevalence and measurement error of the covariate in the PS model.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<p>The performance measures of the treatment effect estimate generated presented as mean, SD, bias, absolute MSE, percentage change MSE and model SE are displayed in the heat plots, <xref ref-type="fig" rid="F3">Figures 3</xref>&#x2013;<xref ref-type="fig" rid="F8">8</xref>. The results display the estimate of the treatment effect (of Rivaroxaban over Warfarin) presented as the log(HR).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Heat plot for Mean treatment effect estimate. The x-axis shows the outcome prevalence and the measurement error. The y-axis shows the PS method and the &#x2018;effect size&#x2019; used. The horizontal line in the key indicates the true mean.</p>
</caption>
<graphic xlink:href="fphar-17-1380586-g003.tif">
<alt-text content-type="machine-generated">Heatmap showing mean treatment effect estimates across four propensity score methods (PS Stratification, IPTW for ATT, IPTW for ATE, 3:1 PS Matching) at varying adjustment levels, different percentage measurement errors, and three prevalence rates. Blue to yellow gradient bar at right indicates mean estimate range from point 0.3 to point 0.46, with a horizontal line marking the true mean at point close to 0.37.</alt-text>
</graphic>
</fig>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Heat plot for the Bias of the treatment effect estimate. The x-axis shows the outcome prevalence and the introduced measurement error. The y-axis shows the PS method and the &#x2018;effect size&#x2019;.</p>
</caption>
<graphic xlink:href="fphar-17-1380586-g004.tif">
<alt-text content-type="machine-generated">Heatmap illustrating bias of treatment effect estimates across four methods (PS Stratification, IPTW for ATT, IPTW for ATE, 3:1 PS Matching) and measurement error percentages, with three prevalence rates. Bias is indicated by a color scale ranging from green (positive bias) to purple (negative bias).</alt-text>
</graphic>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Heat plot of the SD of the treatment effect estimate. The x-axis shows the outcome prevalence and the introduced measurement error. The y-axis shows the PS method and the &#x2018;effect size&#x2019; used.</p>
</caption>
<graphic xlink:href="fphar-17-1380586-g005.tif">
<alt-text content-type="machine-generated">Heatmap depicting the standard deviation of treatment effect estimates by propensity score method and measurement error, with darker blue indicating higher SD and yellow lower SD, across different error percentages and prevalence rates.</alt-text>
</graphic>
</fig>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Heat plot of the MSE of the treatment effect estimate. The x-axis shows the outcome prevalence and the introduced measurement error. The y-axis shows the PS method and the &#x2018;effect size&#x2019; used.</p>
</caption>
<graphic xlink:href="fphar-17-1380586-g006.tif">
<alt-text content-type="machine-generated">Heatmap graphic showing mean squared error (MSE) of treatment effect estimates by analysis method, measurement error, and prevalence. Methods include PS Stratification, IPTW for ATT, IPTW for ATE, and 3:1 PS Matching at different adjustment levels. Columns separate results by measurement error (from negative to positive percentages) and prevalence (0.5, 1, 10 percent). Color scale ranges from blue (higher MSE) to yellow (zero MSE), with values detailed in the legend.</alt-text>
</graphic>
</fig>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Heat plot of the MSE percentage change of the treatment effect estimate. The x-axis shows the outcome prevalence and the introduced measurement error. The y-axis shows the PS method and the &#x2018;effect size&#x2019; used.</p>
</caption>
<graphic xlink:href="fphar-17-1380586-g007.tif">
<alt-text content-type="machine-generated">Heatmap visualizing MSE percent change in treatment effect estimate by analysis method and measurement error, with shading from purple (negative percentage) to green (positive percentage), stratified by prevalence and analysis method, including PS stratification, IPTW for ATT, IPTW for ATE, and 3:1 PS matching, with a legend indicating MSE percent scale from negative sixty to positive sixty.</alt-text>
</graphic>
</fig>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Heat plot of the Model SE of the treatment effect estimate. The x-axis shows the outcome prevalence and the introduced measurement error. The y-axis shows the PS method and the &#x2018;effect size&#x2019; used.</p>
</caption>
<graphic xlink:href="fphar-17-1380586-g008.tif">
<alt-text content-type="machine-generated">Heatmap visualizing model standard error for treatment effect estimates across four methods (PS Stratification, IPTW for ATT, IPTW for ATE, 3:1 PS Matching) and measurement error levels, with color from blue (higher error) to yellow (lower error), stratified by prevalence.</alt-text>
</graphic>
</fig>
<p>Comparing all four PS methods using simulations was firstly based on the original characteristics of the data&#x2013;no measurement error, the original effect size of previous stroke in the treatment allocation model and an outcome prevalence of 1%. 3:1&#xa0;PS matching (using nearest neighbour matching with replacement) appeared to perform the least well of the PS methods. It had larger bias and the bias was positive, 0.0428, as opposed to negative for the other PS methods, IPTW for ATE (&#x2212;0.0181), IPTW for ATT (&#x2212;0.0110) and PS stratification (&#x2212;0.0099).</p>
<p>For illustration and to aid clinical interpretability of the results, the bias figures above, based on the original characteristics of the data, were transformed to a HR scale. The biases would correspond to the following rHRs (ratio of HR for given method to the &#x201c;true&#x201d; HR &#x3d; 1.4440 corresponding to the true value of the treatment effect 0.3674, HRs of future stroke with Warfarin vs. Rivaroxaban): 1.0437 for 3:1&#xa0;PS matching, 0.9821 for IPTW for ATE, 0.9891 for IPTW for ATT and 0.9901 for PS stratification. These would correspond to the following HRs accordingly: 1.5071, 1.4181, 1.4282 and 1.4298, with differences between numbers being small to negligible. 3:1&#xa0;PS matching was retained for use in the later simulations to assess its performance with varying measurement error, effect size and outcome prevalence.</p>
<p>Under-recording of a variable in the treatment allocation model was implemented as negative measurement error of previous stroke [-50%, 0%). Previous stroke had a very small effect on treatment allocation. All PS methods used in this study showed there was little change in the bias of the treatment effect estimate and there was slightly lower precision and a small increase in the MSE for increasing the magnitude of negative measurement error. The increase in the MSE from 0% to &#x2212;50% measurement error in the treatment allocation model was, IPTW for ATE 0.0075, IPTW for ATT 0.0025, 3:1&#xa0;PS matching 0.0088 and PS Stratification 0.0028.</p>
<p>Over-recording of a variable in the treatment allocation model was implemented as positive measurement error of previous stroke (0%, &#x2b;50%]. In common with under-recording all PS methods used in this study showed there was little change in the bias of the treatment effect estimate. Over the measurement error range, as the size of the over-recording increased, the precision in the estimation increased as did the MSE. The increase in the MSE from &#x2b;50% to 0% measurement error in the treatment allocation model was, IPTW for ATE 0.0261, IPTW for ATT 0.0149, 3:1&#xa0;PS matching 0.0297, PS Stratification 0.0145. Higher over-recording of previous stroke generates a higher prevalence of stroke, generating more outcomes of future stroke, which in turn increases the precision of the treatment effect estimate, hence a lower MSE.</p>
<p>The impact that the variable with under- or over-recording has on determining the treatment allocation (the effect size) was varied using values representing Low, Medium and High for comparison with the Original (very low) effect size. There was still little variation in the mean, and bias, over the measurement error range for all the effect sizes. When the variable with measurement error had greater impact on the treatment allocation model, (the PS model), the treatment effect estimate had lower bias and higher precision. For example, using the characteristics of the original dataset the reduction in bias from small effect size to high effect size is IPTW for ATE 0.0029, IPTW for ATT 0.0037, 3:1&#xa0;PS matching 0.0062, PS Stratification 0.0041. It does seem counterintuitive and could be due to the Data Generation Mechanism (DGM) used. In particular, when the variable with measurement error (previous stroke) had a high effect size in the PS model, for those with a previous stroke, their PS value will be higher than if the effect size were low. A higher PS value increases the probability of the generated treatment being Rivaroxaban. This in turn generates more outcome events in the simulations, making the outcome modelling more stable and the treatment effect estimate having lower bias and higher precision.</p>
<p>To investigate the impact of sparse outcome data, the outcome prevalence was varied by generating data with different numbers of participants with future strokes (the primary outcome). The lower prevalence (&#x2264;1%) data gave treatment effect estimates with a higher bias and lower precision and using the higher prevalence data, with lower bias and higher precision. These results were to be expected, as higher EPV in the outcome model generates more stable models. For example, with no added measurement error, the difference in the bias of the low prevalence data (0.5%) and the high prevalence data (10%) is IPTW for ATE 0.1514, IPTW for ATT 0.0160, 3:1&#xa0;PS matching 0.0758, PS Stratification 0.0177. At lower prevalences, there was more variation in the performance measures of the treatment effect estimate over the measurement error range of a variable in the treatment allocation model.</p>
<p>The differences in the performance measures of the treatment effect due to different effect sizes are greater when the data has lower outcome prevalence. The treatment effect estimates with the highest bias, lowest precision and highest MSE were obtained with low prevalence outcome data and when the variable with measurement error had a low (or very low) impact in the PS model.</p>
<p>PS stratification and IPTW for ATE were the PS methods used which estimate the ATE. Both methods gave treatment effect estimates which followed the patterns described above in all the simulation scenarios. There was only a little difference in the bias from both methods, but the bias was slightly closer to 0 for PS stratification. PS stratification had a higher precision and lower MSE, than those for IPTW for ATE over the measurement error range.</p>
<p>3:1&#xa0;PS Matching and IPTW for ATT were the PS methods used which estimate the ATT. Both methods gave treatment effect estimates which followed the patterns described above in all the simulation scenarios. In all scenarios IPTW for ATT had lower bias and higher precision than 3:1&#xa0;PS Matching.</p>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>The real-world treatment effect can be estimated from EHR by forming an observational study, in which the treatment allocation is not randomised and PS methods are used to adjust for treatment allocation bias, prior to fitting a statistical model to the outcome data. The aims of this study were to investigate the effect of under- or over-recording of a dichotomous covariate in the treatment allocation model with sparse outcome data when estimating the real-world treatment effect via PS methods, and to compare the performance of different PS methods in these scenarios. The simulation experiments were rigorously designed and implemented to account for and reflect the characteristics and specific features of the real-world dataset used.</p>
<p>When using PS methods to correct for treatment allocation bias, the bias of the treatment effect estimate appears to be robust to measurement error/misclassification of a variable with very low impact in the treatment allocation model. When there is more under-recording of this variable, there is lower precision in this estimate. When there is more over-recording of this variable, the method produces an estimate with higher precision. Under-recording or over-recording in a covariate which affects the treatment allocation does not affect the relative performance of the PS methods used in this study. Although there are a small number of studies which report on the effect of varying measurement error and compare PS methods their study designs are different to the current one. They implement measurement error in different ways and use different performance measures, making a direct comparison with the current study difficult. In <xref ref-type="bibr" rid="B24">De Gil et al. (2015)</xref> covariate measurement error affected bias but not the root mean squared error (RMSE), which is different to the current study. <xref ref-type="bibr" rid="B21">Conover et al. (2021)</xref> reported that scenarios with only false positive misclassifications (over-recording) produced higher bias than scenarios with only false negative misclassifications (under-recording). In the current study there was little variation in the bias and any change was in the opposite direction, with slightly lower bias for over-recording (positive measurement error). <xref ref-type="bibr" rid="B35">Hong et al. (2019)</xref> showed that the bias and MSE reduced as the reliability of mismeasured confounders approached one (i.e. as measurement error approached zero). These results are different to the current study, as positive measurement error behaved in a different manner than negative measurement error. This could be due to the small changes to the number of outcomes that the measurement error produced, which is noticeable when the outcome prevalence is low, close to 1%. Varying the effect size of the covariate in the treatment allocation model with measurement error made little difference to the simulation results. The simulations in this study were run to investigate the effect of under-recording or over-recording of a single covariate. Also, there is likely to be measurement error in several covariates and the primary outcome variable (future stroke). These were not considered in this study and further research is required to explore effect of errors in multiple co-variates.</p>
<p>The study dataset had rare (sparse) outcomes (prevalence approx. 1%) which could lead to a low EPV in the outcome models, hence bias in the outcome modelling. This type of sparse data, a large dataset with rare outcomes, is not uncommon (<xref ref-type="bibr" rid="B18">Chao, 1994</xref>; <xref ref-type="bibr" rid="B26">Franklin et al., 2017</xref>; <xref ref-type="bibr" rid="B45">Paul and Deng, 2000</xref>). Even though the outcome may be rare, it can be serious such as Serious Adverse Events in drug studies (<xref ref-type="bibr" rid="B50">Ross et al., 2015</xref>) and neonatal trials (<xref ref-type="bibr" rid="B23">Das et al., 2016</xref>). Few papers compare PS methods in the presence of sparse data, the exceptions being <xref ref-type="bibr" rid="B26">Franklin et al. (2017)</xref> for rare outcomes; and <xref ref-type="bibr" rid="B30">Hajage et al. (2016)</xref> for a rare exposure.</p>
<p>When varying the degree of under- or over-recording of a dichotomous variable in the treatment allocation model in addition to varying the outcome prevalence, the lower prevalence (&#x2264;1%) data gave treatment effect estimates with a higher bias and lower precision, whereas using the higher prevalence data gave a treatment effect estimate with lower bias and higher precision. The difference in the bias of the low prevalence outcome (0.5%) and the high prevalence outcome (10%) is: IPTW for ATE 0.1514; IPTW for ATT 0.0160; 3:1&#xa0;PS matching 0.0758; PS Stratification 0.0177. At lower prevalences, there was more variation in the performance measures of the treatment effect estimate over the measurement error range of a variable in the treatment allocation model. Studies using EHR with lower prevalence outcomes should take account of covariate measurement error.</p>
<p>The recommendation for the PS methods to use remained the same in all simulation scenarios (no introduced measurement error, introduced measurement error, introduced measurement error and varied effect size, introduced measurement error and varied outcome prevalence and introduced measurement error, varied effect size and varied outcome prevalence). Studies which compare the performance of PS methods seldom include both the effect of covariate measurement error and sparse outcome data, nor do they use time-to-event data. PS matching and IPTW are generally recommended for binary outcome data (<xref ref-type="bibr" rid="B2">Austin, 2009b</xref>; <xref ref-type="bibr" rid="B3">Austin, 2011a</xref>; <xref ref-type="bibr" rid="B4">Austin, 2011b</xref>) and also for time-to event outcomes (<xref ref-type="bibr" rid="B5">Austin, 2013</xref>). However, the properties of the dataset may guide the choice of PS conditioning (<xref ref-type="bibr" rid="B15">Busso et al., 2014</xref>).</p>
<p>Based on this study&#x2019;s data, for estimation of the ATE, PS stratification performed slightly better than IPTW for ATE. Its bias was similar to IPTW for ATE but its precision was higher (with a lower MSE), but the difference in performance was small. In the literature there were some reservations about the balance produced by PS stratification. The literature generally recommends IPTW for ATE as it provides the best balance (<xref ref-type="bibr" rid="B2">Austin, 2009b</xref>). However, <xref ref-type="bibr" rid="B26">Franklin et al. (2017)</xref>&#x2019;s averaged results from simulations varying outcome prevalence recommended PS stratification (using 10 strata) over IPTW for ATE in terms of absolute bias and MSE.</p>
<p>Based on this study&#x2019;s data, the recommendation was to use IPTW for ATT for estimating the ATT, which showed superior performance over 3:1&#xa0;PS matching using nearest neighbour matching with replacement. In all scenarios IPTW for ATT had lower bias and higher precision. PS matching and IPTW are reported to remove systematic differences to a similar extent (<xref ref-type="bibr" rid="B2">Austin, 2009b</xref>; <xref ref-type="bibr" rid="B3">Austin, 2011a</xref>; <xref ref-type="bibr" rid="B4">Austin, 2011b</xref>) and in some cases, PS matching is recommended over IPTW for ATT (<xref ref-type="bibr" rid="B21">Conover et al., 2021</xref>). <xref ref-type="bibr" rid="B30">Hajage et al. (2016)</xref> found IPTW for ATT performed better than PS matching using time-to-event data with sparseness in the exposure data (rare treatment).</p>
<p>This study has shown that PS methods recommended in the literature may not perform well for individual datasets and specific scenarios such as for time-to-event data. Although <xref ref-type="bibr" rid="B16">Caliendo and Kopeinig (2008)</xref> and <xref ref-type="bibr" rid="B27">Garrido et al. (2014)</xref> recommended applying several PS methods and selecting the one which produces the best balance for the outcome analysis, this study showed that PS methods which give relatively poor balance can produce a treatment effect estimate with lower bias and higher precision.</p>
<p>While most studies use binary outcomes, potentially time-to-event data might be used when there are few events (as it gives the small improvement in power), though it is also commonplace to consider these events simply as binary outcomes. For data characterised by sparse outcomes, the influence of both measurement error and effect size is amplified; consequently, their impact may be more pronounced in time-to-event analyses. When the outcome data are &#x2018;time-to-event&#x2019; data, guidance on the implementation of PS methods, particularly PS matching, and comparison of PS methods should be considered for future work. Further exploration of the modelling options to account more rigorously for the matched nature following PS matching of the data when Cox regression is performed could be undertaken.</p>
<p>The variables in the outcome model were selected by fitting the model to the analysis dataset used following PS matching. The same variables were used for the other PS methods without refitting the model to the full dataset. This may be regarded as a limitation of this study that the outcome model may be regarded as misspecified. Another limitation of this work is that in the estimation of treatment effect variance no account was taken of the uncertainty in estimating the PS. This means the CIs of the treatment effect produced were too wide. For PS stratification, using the analogous marginal variance method, which accounts for the uncertainty from estimating the PS model from the data, can reduce the variance by up to 12% depending on the data characteristics, compared to the commonly used variance estimation (<xref ref-type="bibr" rid="B57">Williamson et al., 2012</xref>). For IPTW the variance reduction can be 18% using the analogous marginal variance method compared to the commonly used variance estimation. Such changes are particularly noticeable for larger samples, n &#x3e; 1000 (<xref ref-type="bibr" rid="B57">Williamson et al., 2012</xref>). Use of the analogous marginal variance method may affect the performance of the different PS methods compared in this paper and requires further investigation.</p>
<p>This study used four PS methods (each with one outcome option) which is a limitation, as there are many variations of these basic categories of PS methods. It would be reasonable to assume that other PS methods may behave in a similar way, that is for lower outcome prevalences, more variation in the performance measures of the treatment effect estimate over the measurement error range of a variable in the treatment allocation model. To identify the most effective PS methods for estimating the ATT and ATE, a thorough comparative simulation is required similar to that conducted in this study. Also, it is currently not clear if the changes to the treatment effect estimate are due to changes in the effect size or the DGM used. The parameters varied in the simulations only took a limited range of values (see above for suggested extensions of the simulations). The results using additional PS methods or expanded parameter ranges could be compared with those of this study.</p>
<p>Both the US Food and Drug Administration draft guidance on real-world evidence (RWE) and Guidance on Non-Interventional Studies (ICH M14) of the European Medicines Agency incorporate principles of causal inference and recommend using rigorous study design and analytical methods, such as those within the causal inference framework, to minimise bias and generate reliable evidence from observational data. They emphasise that studies using RWE often aim to evaluate a causal association and that approaches to address bias and confounding are critical. The results of this study provide guidance for researchers in selecting appropriate PS methods and designing effective and robust analysis strategies to mitigate bias when inferring causality from observational data.</p>
</sec>
<sec id="s5">
<title>Summary/conclusion</title>
<p>Studies which use EHR to conduct observational studies should consider the impact of sparse outcome data, not just on the bias and precision of the treatment effect estimate, but also on the effect that covariate measurement error on the treatment allocation will have. For data with outcomes in the form of time-to-event, not all outcome events will be recorded in the dataset as some will be censored, making the data more sparse, which compounds these problems.</p>
<p>The findings of this study contribute to the body of knowledge, particularly when using PS methods and varying covariate measurement error, the covariate&#x2019;s effect size in the treatment allocation model and the outcome prevalence. Systematically varying a combination of these parameters constitutes novel approach. These simulations were applied to time-to-event data, which are generally not widely reported on. The majority of studies which compare PS methods, investigate the effect of measurement error or sparseness of data use data with binary outcomes. This study did make recommendations for the PS methods to use, but the recommendations have been guided by the characteristics of the study dataset, which may mean that they are limited to datasets with similar characteristics rather than being more widely generalisable.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The data analyzed in this study is subject to the following licenses/restrictions: The data were held by the University of Birmingham, approval for access to the data was granted for this study. Requests to access these datasets should be directed to ST, <email>stishkovskaya@lancashire.ac.uk</email>, for clarification of further enquires.</p>
</sec>
<sec sec-type="ethics-statement" id="s7">
<title>Ethics statement</title>
<p>The studies involving humans were approved by UCLan STEMH Ethics Committee (Reference Number STEMH 650). Also, Scientific Review Committee (SRC) approval was extended for use of the data extract from THIN already given for use in REWARD, to include the use of the data for this project. The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation was not required from the participants or the participants&#x2019; legal guardians/next of kin in accordance with the national legislation and institutional requirements.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>JB: Conceptualization, Data curation, Formal Analysis, Investigation, Methodology, Resources, Software, Visualization, Writing &#x2013; original draft, Writing &#x2013; review and editing. AB: Conceptualization, Investigation, Methodology, Supervision, Writing &#x2013; review and editing, Data curation. GP: Methodology, Project administration, Supervision, Writing &#x2013; review and editing. CS: Conceptualization, Funding acquisition, Methodology, Project administration, Resources, Supervision, Writing &#x2013; review and editing. ST: Methodology, Project administration, Supervision, Validation, Writing &#x2013; review and editing</p>
</sec>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="s12">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fphar.2026.1380586/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fphar.2026.1380586/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table1.docx" id="SM1" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Austin</surname>
<given-names>P. C.</given-names>
</name>
</person-group> (<year>2009a</year>). <article-title>Balance diagnostics for comparing the distribution of baseline covariates between treatment groups in propensity-score matched samples</article-title>. <source>Statistics Med.</source> <volume>28</volume> (<issue>25</issue>), <fpage>3083</fpage>&#x2013;<lpage>3107</lpage>. <pub-id pub-id-type="doi">10.1002/sim.3697</pub-id>
<pub-id pub-id-type="pmid">19757444</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Austin</surname>
<given-names>P. C.</given-names>
</name>
</person-group> (<year>2009b</year>). <article-title>The relative ability of different propensity score methods to balance measured covariates between treated and untreated subjects in observational studies</article-title>. <source>Med. Decis. Mak.</source> <volume>29</volume> (<issue>6</issue>), <fpage>661</fpage>&#x2013;<lpage>677</lpage>. <pub-id pub-id-type="doi">10.1177/0272989x09341755</pub-id>
<pub-id pub-id-type="pmid">19684288</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Austin</surname>
<given-names>P. C.</given-names>
</name>
</person-group> (<year>2011a</year>). <article-title>An introduction to propensity score methods for reducing the effects of confounding in observational studies</article-title>. <source>Multivar. Behav. Res.</source> <volume>46</volume> (<issue>3</issue>), <fpage>399</fpage>&#x2013;<lpage>424</lpage>. <pub-id pub-id-type="doi">10.1080/00273171.2011.568786</pub-id>
<pub-id pub-id-type="pmid">21818162</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Austin</surname>
<given-names>P. C.</given-names>
</name>
</person-group> (<year>2011b</year>). <article-title>A tutorial and case study in propensity score analysis: an application to estimating the effect of In-Hospital smoking cessation counseling on mortality</article-title>. <source>Multivar. Behav. Res.</source> <volume>46</volume> (<issue>1</issue>), <fpage>119</fpage>&#x2013;<lpage>151</lpage>. <pub-id pub-id-type="doi">10.1080/00273171.2011.540480</pub-id>
<pub-id pub-id-type="pmid">22287812</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Austin</surname>
<given-names>P. C.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>The performance of different propensity score methods for estimating marginal hazard ratios</article-title>. <source>Statistics Med.</source> <volume>32</volume> (<issue>16</issue>), <fpage>2837</fpage>&#x2013;<lpage>2849</lpage>. <pub-id pub-id-type="doi">10.1002/sim.5705</pub-id>
<pub-id pub-id-type="pmid">23239115</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baczek</surname>
<given-names>V. L.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W. T.</given-names>
</name>
<name>
<surname>Kluger</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Coleman</surname>
<given-names>C. I.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Predictors of warfarin use in atrial fibrillation in the United States: a systematic review and meta-analysis</article-title>. <source>Bmc Fam. Pract.</source> <volume>13</volume>, <fpage>5</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2296-13-5</pub-id>
<pub-id pub-id-type="pmid">22304704</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Banerjee</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Benedetto</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Gichuru</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Burnell</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Antoniou</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Schilling</surname>
<given-names>R. J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Adherence and persistence to direct oral anticoagulants in atrial fibrillation: a population-based study</article-title>. <source>Heart</source> <volume>106</volume> (<issue>2</issue>), <fpage>119</fpage>&#x2013;<lpage>&#x2b;</lpage>. <pub-id pub-id-type="doi">10.1136/heartjnl-2019-315307</pub-id>
<pub-id pub-id-type="pmid">31601729</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhatia</surname>
<given-names>G. S.</given-names>
</name>
<name>
<surname>Lip</surname>
<given-names>G. Y.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Atrial fibrillation post-myocardial infarction: frequency, consequences, and management</article-title>. <source>Curr. Heart Failure Reports</source> <volume>1</volume> (<issue>4</issue>), <fpage>149</fpage>&#x2013;<lpage>155</lpage>. <pub-id pub-id-type="doi">10.1007/s11897-004-0002-y</pub-id>
<pub-id pub-id-type="pmid">16036038</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Black</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Berger</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Scott</surname>
<given-names>F. A.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Bounding parameter estimates with nonclassical measurement error</article-title>. <source>J. Am. Stat. Assoc.</source> <volume>95</volume> (<issue>451</issue>), <fpage>739</fpage>&#x2013;<lpage>748</lpage>. <pub-id pub-id-type="doi">10.2307/2669454</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Blackwell</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Honaker</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>A unified approach to measurement error and missing data: overview and applications</article-title>. <source>Sociol. Methods and Res.</source> <volume>46</volume> (<issue>3</issue>), <fpage>303</fpage>&#x2013;<lpage>341</lpage>. <pub-id pub-id-type="doi">10.1177/0049124115585360</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boriani</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Laroche</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Diemberger</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Popescu</surname>
<given-names>M. I.</given-names>
</name>
<name>
<surname>Rasmussen</surname>
<given-names>L. H.</given-names>
</name>
<name>
<surname>Petrescu</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Glomerular filtration rate in patients with atrial fibrillation and 1-year outcomes</article-title>. <source>Sci. Rep.</source> <volume>6</volume>, <fpage>30271</fpage>. <pub-id pub-id-type="doi">10.1038/srep30271</pub-id>
<pub-id pub-id-type="pmid">27466080</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Braun</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Gorfine</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Parmigiani</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Arvold</surname>
<given-names>N. D.</given-names>
</name>
<name>
<surname>Dominici</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Zigler</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Propensity scores with misclassified treatment assignment: a likelihood-based adjustment</article-title>. <source>Biostatistics</source> <volume>18</volume> (<issue>4</issue>), <fpage>695</fpage>&#x2013;<lpage>710</lpage>. <pub-id pub-id-type="doi">10.1093/biostatistics/kxx014</pub-id>
<pub-id pub-id-type="pmid">28419189</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Burnell</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2015</year>). <source>Sensitivity analysis for HES vs HES and THIN</source>. <publisher-name>University of Central Lancashire</publisher-name>. <comment>Technical Report (unpublished)</comment>.</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Burnell</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2022</year>). <source>Using propensity score methods for estimating real-world treatment effects in the presence of measurement error and sparse outcome data</source>. <publisher-name>MPhil thesis. Preston: University of Lancashire</publisher-name>. <pub-id pub-id-type="doi">10.17030/uclan.thesis.00057525</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Busso</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>DiNardo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>McCrary</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>New evidence on the finite sample properties of propensity score reweighting and matching estimators</article-title>. <source>Rev. Econ. Statistics</source> <volume>96</volume> (<issue>5</issue>), <fpage>885</fpage>&#x2013;<lpage>897</lpage>. <pub-id pub-id-type="doi">10.1162/REST_a_00431</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Caliendo</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kopeinig</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Some practical guidance for the implementation of propensity score matching</article-title>. <source>J. Econ. Surv.</source> <volume>22</volume> (<issue>1</issue>), <fpage>31</fpage>&#x2013;<lpage>72</lpage>. <pub-id pub-id-type="doi">10.1111/j.1467-6419.2007.00527.x</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carroll</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Stefanski</surname>
<given-names>L. A.</given-names>
</name>
</person-group> (<year>1990</year>). <article-title>Approximate quasi-likelihood estimation in models with surrogate predictors</article-title>. <source>J. Am. Stat. Assoc.</source> <volume>85</volume> (<issue>411</issue>), <fpage>652</fpage>&#x2013;<lpage>663</lpage>. <pub-id pub-id-type="doi">10.2307/2290000</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chao</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Population-size estimation for sparse data - reply</article-title>. <source>Biometrics</source> <volume>50</volume> (<issue>1</issue>), <fpage>303</fpage>.</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>H. N.</given-names>
</name>
<name>
<surname>Cohen</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>How big is a big odds ratio? Interpreting the magnitudes of odds ratios in epidemiological studies</article-title>. <source>Commun. Statistics- Simul. Comput.</source> <volume>39</volume> (<issue>4</issue>), <fpage>860</fpage>&#x2013;<lpage>864</lpage>. <pub-id pub-id-type="doi">10.1080/03610911003650383</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>1988</year>). <source>Statistical power analysis for the behavioral sciences</source>. <edition>2nd ed.</edition> <publisher-loc>Hillsdale, N.J</publisher-loc>: <publisher-name>L. Erlbaum Associates</publisher-name>.</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Conover</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Rothman</surname>
<given-names>K. J.</given-names>
</name>
<name>
<surname>Sturmer</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ellis</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Poole</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Funk</surname>
<given-names>M. J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Propensity score trimming mitigates bias due to covariate measurement error in inverse probability of treatment weighted analyses: a plasmode simulation</article-title>. <source>Statistics Med.</source> <volume>40</volume> (<issue>9</issue>), <fpage>2101</fpage>&#x2013;<lpage>2112</lpage>. <pub-id pub-id-type="doi">10.1002/sim.8887</pub-id>
<pub-id pub-id-type="pmid">33622016</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cook</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Stefanski</surname>
<given-names>L. A.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Simulation-extrapolation estimation in parametric measurement error models</article-title>. <source>J. Am. Stat. Assoc.</source> <volume>89</volume> (<issue>428</issue>), <fpage>1314</fpage>&#x2013;<lpage>1328</lpage>. <pub-id pub-id-type="doi">10.2307/2290994</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Das</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Tyson</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Pedroza</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Gantz</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wallace</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Methodological issues in the design and analyses of neonatal research studies: experience of the NICHD neonatal research network</article-title>. <source>Seminars Perinatology</source> <volume>40</volume> (<issue>6</issue>), <fpage>374</fpage>&#x2013;<lpage>384</lpage>. <pub-id pub-id-type="doi">10.1053/j.semperi.2016.05.005</pub-id>
<pub-id pub-id-type="pmid">27344192</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>De Gil</surname>
<given-names>P. R.</given-names>
</name>
<name>
<surname>Bellara</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Lanehart</surname>
<given-names>R. E.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>E. S.</given-names>
</name>
<name>
<surname>Kromrey</surname>
<given-names>J. D.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>How do propensity score methods measure up in the presence of measurement error? A monte carlo study</article-title>. <source>Multivar. Behav. Res.</source> <volume>50</volume> (<issue>5</issue>), <fpage>520</fpage>&#x2013;<lpage>532</lpage>. <pub-id pub-id-type="doi">10.1080/00273171.2015.1022643</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Millimet</surname>
<given-names>D. L.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Propensity score weighting with mismeasured covariates: an application to two financial literacy interventions</article-title>. <source>J. Risk Financial Manag.</source> <volume>13</volume> (<issue>11</issue>), <fpage>290</fpage>. <pub-id pub-id-type="doi">10.3390/jrfm13110290</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Franklin</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Eddings</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Austin</surname>
<given-names>P. C.</given-names>
</name>
<name>
<surname>Stuart</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Schneeweiss</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Comparing the performance of propensity score methods in healthcare database studies with rare outcomes</article-title>. <source>Statistics Medicine</source> <volume>36</volume> (<issue>12</issue>), <fpage>1946</fpage>&#x2013;<lpage>1963</lpage>. <pub-id pub-id-type="doi">10.1002/sim.7250</pub-id>
<pub-id pub-id-type="pmid">28208229</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garrido</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Kelley</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Paris</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Roza</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Meier</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Morrison</surname>
<given-names>R. S.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Methods for constructing and assessing propensity scores</article-title>. <source>Health Serv. Res.</source> <volume>49</volume> (<issue>5</issue>), <fpage>1701</fpage>&#x2013;<lpage>1720</lpage>. <pub-id pub-id-type="doi">10.1111/1475-6773.12182</pub-id>
<pub-id pub-id-type="pmid">24779867</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Giralt&#x2010;Steinhauer</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Cuadrado&#x2010;Godia</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ois</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Jim&#xe9;nez&#x2010;Conde</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Rodr&#xed;guez&#x2010;Campello</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Soriano</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Comparison between CHADS 2 and CHA 2 DS 2&#x2010;VAS c score in a stroke cohort with atrial fibrillation</article-title>. <source>Eur. Journal Neurology</source> <volume>20</volume> (<issue>4</issue>), <fpage>623</fpage>&#x2013;<lpage>628</lpage>. <pub-id pub-id-type="doi">10.1111/j.1468-1331.2012.03807.x</pub-id>
<pub-id pub-id-type="pmid">22834861</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Greenland</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mansournia</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Altman</surname>
<given-names>D. G.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Sparse data bias: a problem hiding in plain sight</article-title>. <source>Bmj-British Med. J.</source> <volume>353</volume>, <fpage>i1981</fpage>. <pub-id pub-id-type="doi">10.1136/bmj.i1981</pub-id>
<pub-id pub-id-type="pmid">27121591</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hajage</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Tubach</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Steg</surname>
<given-names>P. G.</given-names>
</name>
<name>
<surname>Bhatt</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>De Rycke</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>On the use of propensity scores in case of rare exposure</article-title>. <source>Bmc Med. Res. Methodol.</source> <volume>16</volume>, <fpage>38</fpage>. <pub-id pub-id-type="doi">10.1186/s12874-016-0135-1</pub-id>
<pub-id pub-id-type="pmid">27036963</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hankey</surname>
<given-names>G. J.</given-names>
</name>
<name>
<surname>Patel</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Stevens</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Becker</surname>
<given-names>R. C.</given-names>
</name>
<name>
<surname>Breithardt</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Carolei</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Rivaroxaban compared with warfarin in patients with atrial fibrillation and previous stroke or transient ischaemic attack: a subgroup analysis of ROCKET AF</article-title>. <source>Lancet Neurol.</source> <volume>11</volume> (<issue>4</issue>), <fpage>315</fpage>&#x2013;<lpage>322</lpage>. <pub-id pub-id-type="doi">10.1016/s1474-4422(12)70042-x</pub-id>
<pub-id pub-id-type="pmid">22402056</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Herrett</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Shah</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Boggon</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Denaxas</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Smeeth</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>van Staa</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Completeness and diagnostic validity of recording acute myocardial infarction events in primary care, hospital care, disease registry, and national mortality records: cohort study</article-title>. <source>Bmj-British Med. J.</source> <volume>346</volume>, <fpage>f2350</fpage>. <pub-id pub-id-type="doi">10.1136/bmj.f2350</pub-id>
<pub-id pub-id-type="pmid">23692896</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ho</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Imai</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Stuart</surname>
<given-names>E. A.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Matching as nonparametric preprocessing for reducing model dependence in parametric causal inference</article-title>. <source>Polit. Anal.</source> <volume>15</volume> (<issue>3</issue>), <fpage>199</fpage>&#x2013;<lpage>236</lpage>. <pub-id pub-id-type="doi">10.1093/pan/mpl013</pub-id>
</mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Rudolph</surname>
<given-names>K. E.</given-names>
</name>
<name>
<surname>Stuart</surname>
<given-names>E. A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Bayesian approach for addressing differential covariate measurement error in propensity score methods</article-title>. <source>Psychometrika</source> <volume>82</volume> (<issue>4</issue>), <fpage>1078</fpage>&#x2013;<lpage>1096</lpage>. <pub-id pub-id-type="doi">10.1007/s11336-016-9533-x</pub-id>
<pub-id pub-id-type="pmid">27738956</pub-id>
</mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Aaby</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Siddique</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Stuart</surname>
<given-names>E. A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Propensity score-based estimators with multiple error-prone covariates</article-title>. <source>Am. J. Epidemiol.</source> <volume>188</volume> (<issue>1</issue>), <fpage>222</fpage>&#x2013;<lpage>230</lpage>. <pub-id pub-id-type="doi">10.1093/aje/kwy210</pub-id>
<pub-id pub-id-type="pmid">30358801</pub-id>
</mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Imbens</surname>
<given-names>G. W.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Nonparametric estimation of average treatment effects under exogeneity: a review</article-title>. <source>Rev. Econ. Statistics</source> <volume>86</volume> (<issue>1</issue>), <fpage>4</fpage>&#x2013;<lpage>29</lpage>. <pub-id pub-id-type="doi">10.1162/003465304323023651</pub-id>
</mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lai</surname>
<given-names>H. C.</given-names>
</name>
<name>
<surname>Chien</surname>
<given-names>W. C.</given-names>
</name>
<name>
<surname>Chung</surname>
<given-names>C. H.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>W. L.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>K. Y.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Atrial fibrillation, liver disease, antithrombotics and risk of cerebrovascular events: a population-based cohort study</article-title>. <source>Int. J. Cardiol.</source> <volume>223</volume>, <fpage>829</fpage>&#x2013;<lpage>837</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijcard.2016.08.297</pub-id>
<pub-id pub-id-type="pmid">27580216</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Monz</surname>
<given-names>B. U.</given-names>
</name>
<name>
<surname>Clemens</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Brueckmann</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lip</surname>
<given-names>G. Y. H.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Representativeness of the dabigatran, apixaban and rivaroxaban clinical trial populations to real-world atrial fibrillation patients in the United Kingdom: a cross-sectional analysis using the general practice research database</article-title>. <source>Bmj Open</source> <volume>2</volume> (<issue>6</issue>). <pub-id pub-id-type="doi">10.1136/bmjopen-2012-001768</pub-id>
<pub-id pub-id-type="pmid">23242482</pub-id>
</mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Leuven</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Sianesi</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>PSMATCH2: stata module to perform full mahalanobis and propensity score matching, common support graphing, and covariate imbalance testing</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="http://ideas.repec.org/c/boc/bocode/s432001.html">http://ideas.repec.org/c/boc/bocode/s432001.html</ext-link>.</comment>
</mixed-citation>
</ref>
<ref id="B40">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>M. X.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Using the propensity score method to estimate causal effects: a review and practical guide</article-title>. <source>Organ. Res. Methods</source> <volume>16</volume> (<issue>2</issue>), <fpage>188</fpage>&#x2013;<lpage>226</lpage>. <pub-id pub-id-type="doi">10.1177/1094428112447816</pub-id>
</mixed-citation>
</ref>
<ref id="B41">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lip</surname>
<given-names>G. Y. H.</given-names>
</name>
<name>
<surname>Nieuwlaat</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Pisters</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lane</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Crijns</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Refining clinical risk stratification for predicting stroke and thromboembolism in atrial fibrillation using a novel risk factor-based approach the euro heart survey on atrial fibrillation</article-title>. <source>Chest</source> <volume>137</volume> (<issue>2</issue>), <fpage>263</fpage>&#x2013;<lpage>272</lpage>. <pub-id pub-id-type="doi">10.1378/chest.09-1584</pub-id>
<pub-id pub-id-type="pmid">19762550</pub-id>
</mixed-citation>
</ref>
<ref id="B42">
<mixed-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Lunt</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Linden</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Propwt: generating weights for propensity analysis</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="http://personalpages.manchester.ac.uk/staff/mark.lunt">http://personalpages.manchester.ac.uk/staff/mark.lunt</ext-link>.</comment>
</mixed-citation>
</ref>
<ref id="B43">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Millimet</surname>
<given-names>D. L.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The elephant in the corner: a cautionary tale about measurement error in treatment effects models</article-title>. <source>Adv. Econ.</source> <volume>27</volume>, <fpage>1</fpage>&#x2013;<lpage>39</lpage>. <pub-id pub-id-type="doi">10.1108/S0731-9053</pub-id>
</mixed-citation>
</ref>
<ref id="B44">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nguyen</surname>
<given-names>T. Q.</given-names>
</name>
<name>
<surname>Stuart</surname>
<given-names>E. A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Propensity score analysis with latent covariates: measurement error bias correction using the covariate&#x27;s posterior mean, aka the inclusive factor score</article-title>. <source>J. Educ. Behav. Statistics</source> <volume>45</volume> (<issue>5</issue>), <fpage>598</fpage>&#x2013;<lpage>636</lpage>. <pub-id pub-id-type="doi">10.3102/1076998620911920</pub-id>
</mixed-citation>
</ref>
<ref id="B59">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>O&#x2019;Caoimh</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Igras</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ramesh</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Power</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>O&#x2019;Connor</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Liston</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Assessing the appropriateness of oral anticoagulation for atrial fibrillation in advanced frailty: use of stroke and bleeding risk-prediction models</article-title>. <source>J. Frailty Aging</source> <volume>6</volume> (<volume>1</volume>), <fpage>46</fpage>&#x2013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.14283/jfa.2016.118</pub-id>
</mixed-citation>
</ref>
<ref id="B45">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paul</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>D. L.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Goodness of fit of generalized linear models to sparse data</article-title>. <source>J. R. Stat. Soc. Ser. B-Statistical Methodol.</source> <volume>62</volume>, <fpage>323</fpage>&#x2013;<lpage>333</lpage>. <pub-id pub-id-type="doi">10.1111/1467-9868.00234</pub-id>
</mixed-citation>
</ref>
<ref id="B46">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raykov</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Propensity score analysis with fallible covariates: a note on a latent variable modeling approach</article-title>. <source>Educ. Psychol. Meas.</source> <volume>72</volume> (<issue>5</issue>), <fpage>715</fpage>&#x2013;<lpage>733</lpage>. <pub-id pub-id-type="doi">10.1177/0013164412440999</pub-id>
</mixed-citation>
</ref>
<ref id="B47">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rosenbaum</surname>
<given-names>P. R.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>Model-based direct adjustment</article-title>. <source>J. Am. Stat. Assoc.</source> <volume>82</volume> (<issue>398</issue>), <fpage>387</fpage>&#x2013;<lpage>394</lpage>. <pub-id pub-id-type="doi">10.2307/2289440</pub-id>
</mixed-citation>
</ref>
<ref id="B48">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rosenbaum</surname>
<given-names>P. R.</given-names>
</name>
<name>
<surname>Rubin</surname>
<given-names>D. B.</given-names>
</name>
</person-group> (<year>1983</year>). <article-title>The central role of the propensity score in observational studies for causal effects</article-title>. <source>Biometrika</source> <volume>70</volume> (<issue>1</issue>), <fpage>41</fpage>&#x2013;<lpage>55</lpage>. <pub-id pub-id-type="doi">10.1093/biomet/70.1.41</pub-id>
</mixed-citation>
</ref>
<ref id="B49">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rosenbaum</surname>
<given-names>P. R.</given-names>
</name>
<name>
<surname>Rubin</surname>
<given-names>D. B.</given-names>
</name>
</person-group> (<year>1984</year>). <article-title>Reducing bias in observational studies using subclassification on the propensity score</article-title>. <source>J. Am. Stat. Assoc.</source> <volume>79</volume> (<issue>387</issue>), <fpage>516</fpage>&#x2013;<lpage>524</lpage>. <pub-id pub-id-type="doi">10.2307/2288398</pub-id>
</mixed-citation>
</ref>
<ref id="B50">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ross</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Kreider</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.-S.</given-names>
</name>
<name>
<surname>Matone</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Rubin</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Localio</surname>
<given-names>A. R.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Propensity score methods for analyzing observational data like randomized experiments: challenges and solutions for rare outcomes and exposures</article-title>. <source>Am. J. Epidemiol.</source> <volume>181</volume> (<issue>12</issue>), <fpage>989</fpage>&#x2013;<lpage>995</lpage>. <pub-id pub-id-type="doi">10.1093/aje/kwu469</pub-id>
<pub-id pub-id-type="pmid">25995287</pub-id>
</mixed-citation>
</ref>
<ref id="B51">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rudolph</surname>
<given-names>K. E.</given-names>
</name>
<name>
<surname>Stuart</surname>
<given-names>E. A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Using sensitivity analyses for unobserved confounding to address covariate measurement error in propensity score methods</article-title>. <source>Am. J. Epidemiol.</source> <volume>187</volume> (<issue>3</issue>), <fpage>604</fpage>&#x2013;<lpage>613</lpage>. <pub-id pub-id-type="doi">10.1093/aje/kwx248</pub-id>
<pub-id pub-id-type="pmid">28992211</pub-id>
</mixed-citation>
</ref>
<ref id="B52">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sibbald</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Roland</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Understanding controlled trials - why are randomised controlled trials important?</article-title> <source>Br. Med. J.</source> <volume>316</volume> (<issue>7126</issue>), <fpage>201</fpage>. <pub-id pub-id-type="doi">10.1136/bmj.316.7126.201</pub-id>
<pub-id pub-id-type="pmid">9468688</pub-id>
</mixed-citation>
</ref>
<ref id="B53">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Siino</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fasola</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Muggeo</surname>
<given-names>V. M. R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Inferential tools in penalized logistic regression for small and sparse data: a comparative study</article-title>. <source>Stat. Methods Medical Research</source> <volume>27</volume> (<issue>5</issue>), <fpage>1365</fpage>&#x2013;<lpage>1375</lpage>. <pub-id pub-id-type="doi">10.1177/0962280216661213</pub-id>
<pub-id pub-id-type="pmid">27510370</pub-id>
</mixed-citation>
</ref>
<ref id="B58">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Toso</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Recommendations for the use of new oral anticoagulants (NOACs) after TIA or stroke caused by atrial fibrillation (AF), after a consensus conference among Italian neurologists (the Venice group)</article-title>. <source>Neurol. Sci.</source> <volume>35</volume> (<volume>5</volume>), <fpage>723</fpage>&#x2013;<lpage>727</lpage>. <pub-id pub-id-type="doi">10.1007/s10072-013-1590-7</pub-id>
<pub-id pub-id-type="pmid">24322948</pub-id>
</mixed-citation>
</ref>
<ref id="B54">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vaughan</surname>
<given-names>L. K.</given-names>
</name>
<name>
<surname>Divers</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Padilla</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Redden</surname>
<given-names>D. T.</given-names>
</name>
<name>
<surname>Tiwari</surname>
<given-names>H. K.</given-names>
</name>
<name>
<surname>Pomp</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>The use of plasmodes as a supplement to simulations: a simple example evaluating individual admixture estimation methodologies</article-title>. <source>Comput. Statistics and Data Analysis</source> <volume>53</volume> (<issue>5</issue>), <fpage>1755</fpage>&#x2013;<lpage>1766</lpage>. <pub-id pub-id-type="doi">10.1016/j.csda.2008.02.032</pub-id>
<pub-id pub-id-type="pmid">20161321</pub-id>
</mixed-citation>
</ref>
<ref id="B55">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wallace</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Analysis in an imperfect world</article-title>. <source>Significance</source> <volume>17</volume> (<issue>1</issue>), <fpage>14</fpage>&#x2013;<lpage>19</lpage>. <pub-id pub-id-type="doi">10.1111/j.1740-9713.2020.01353.x</pub-id>
</mixed-citation>
</ref>
<ref id="B56">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Webb-Vargas</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Rudolph</surname>
<given-names>K. E.</given-names>
</name>
<name>
<surname>Lenis</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Murakami</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Stuart</surname>
<given-names>E. A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>An imputation-based solution to using mismeasured covariates in propensity score analysis</article-title>. <source>Stat. Methods Med. Res.</source> <volume>26</volume> (<issue>4</issue>), <fpage>1824</fpage>&#x2013;<lpage>1837</lpage>. <pub-id pub-id-type="doi">10.1177/0962280215588771</pub-id>
<pub-id pub-id-type="pmid">26037527</pub-id>
</mixed-citation>
</ref>
<ref id="B57">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Williamson</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Morley</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lucas</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Carpenter</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Variance estimation for stratified propensity score estimators</article-title>. <source>Statistics Med.</source> <volume>31</volume> (<issue>15</issue>), <fpage>1617</fpage>&#x2013;<lpage>1632</lpage>. <pub-id pub-id-type="doi">10.1002/sim.450</pub-id>
<pub-id pub-id-type="pmid">22362427</pub-id>
</mixed-citation>
</ref>
<ref id="B60">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wolff</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Shantsila</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Lip</surname>
<given-names>G. Y. H.</given-names>
</name>
<name>
<surname>Lane</surname>
<given-names>D. A.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Impact of advanced age on management and prognosis in atrial fibrillation: insights from a population-based study in general practice</article-title>. <source>Age Ageing</source> <volume>44</volume> (<issue>5</issue>), <fpage>874</fpage>&#x2013;<lpage>878</lpage>. <pub-id pub-id-type="doi">10.1093/ageing/afv071</pub-id>
<pub-id pub-id-type="pmid">26082176</pub-id>
</mixed-citation>
</ref>
</ref-list>
<sec id="s13">
<title>Glossary</title>
<def-list>
<def-item>
<term id="G1-fphar.2026.1380586">
<bold>AF</bold>
</term>
<def>
<p>Atrial Fibrillation</p>
</def>
</def-item>
<def-item>
<term id="G2-fphar.2026.1380586">
<bold>ATE</bold>
</term>
<def>
<p>Average Treatment Effect</p>
</def>
</def-item>
<def-item>
<term id="G3-fphar.2026.1380586">
<bold>ATT</bold>
</term>
<def>
<p>Average Treatment Effect on the Treated</p>
</def>
</def-item>
<def-item>
<term id="G4-fphar.2026.1380586">
<bold>BIC</bold>
</term>
<def>
<p>Bayesian Information Criteria</p>
</def>
</def-item>
<def-item>
<term id="G5-fphar.2026.1380586">
<bold>CHA2DS2-VASc</bold>
</term>
<def>
<p>Stroke risk score for patients with Atrial Fibrillation</p>
</def>
</def-item>
<def-item>
<term id="G6-fphar.2026.1380586">
<bold>CI</bold>
</term>
<def>
<p>Confidence Interval</p>
</def>
</def-item>
<def-item>
<term id="G7-fphar.2026.1380586">
<bold>DGM</bold>
</term>
<def>
<p>Data Generation Mechanism</p>
</def>
</def-item>
<def-item>
<term id="G8-fphar.2026.1380586">
<bold>EHR</bold>
</term>
<def>
<p>Electronic Health Record</p>
</def>
</def-item>
<def-item>
<term id="G9-fphar.2026.1380586">
<bold>EPV</bold>
</term>
<def>
<p>Events Per Variable</p>
</def>
</def-item>
<def-item>
<term id="G10-fphar.2026.1380586">
<bold>HAS-BLED</bold>
</term>
<def>
<p>Risk score for bleeding in patients with Atrial Fibrillation</p>
</def>
</def-item>
<def-item>
<term id="G11-fphar.2026.1380586">
<bold>HR</bold>
</term>
<def>
<p>Hazard ratio</p>
</def>
</def-item>
<def-item>
<term id="G12-fphar.2026.1380586">
<bold>IPTW</bold>
</term>
<def>
<p>Inverse Probability of Treatment Weighting</p>
</def>
</def-item>
<def-item>
<term id="G13-fphar.2026.1380586">
<bold>MO</bold>
</term>
<def>
<p>Multiple Overimputation</p>
</def>
</def-item>
<def-item>
<term id="G14-fphar.2026.1380586">
<bold>MSE</bold>
</term>
<def>
<p>Mean Squared Error</p>
</def>
</def-item>
<def-item>
<term id="G15-fphar.2026.1380586">
<bold>NICE</bold>
</term>
<def>
<p>National Institute for Health and Care Excellence</p>
</def>
</def-item>
<def-item>
<term id="G16-fphar.2026.1380586">
<bold>NOAC</bold>
</term>
<def>
<p>Novel Oral Anti-Coagulant</p>
</def>
</def-item>
<def-item>
<term id="G17-fphar.2026.1380586">
<bold>OAC</bold>
</term>
<def>
<p>Oral Anti-Coagulant</p>
</def>
</def-item>
<def-item>
<term id="G18-fphar.2026.1380586">
<bold>OR</bold>
</term>
<def>
<p>Odds Ratio</p>
</def>
</def-item>
<def-item>
<term id="G19-fphar.2026.1380586">
<bold>PH</bold>
</term>
<def>
<p>Proportional Hazards</p>
</def>
</def-item>
<def-item>
<term id="G20-fphar.2026.1380586">
<bold>PLE</bold>
</term>
<def>
<p>Penalized Maximum Likelihood</p>
</def>
</def-item>
<def-item>
<term id="G21-fphar.2026.1380586">
<bold>PS</bold>
</term>
<def>
<p>Propensity Score</p>
</def>
</def-item>
<def-item>
<term id="G22-fphar.2026.1380586">
<bold>RCT</bold>
</term>
<def>
<p>Randomised Control Trial</p>
</def>
</def-item>
<def-item>
<term id="G23-fphar.2026.1380586">
<bold>rHR</bold>
</term>
<def>
<p>Relative hazard ratio/ratio of hazard ratios</p>
</def>
</def-item>
<def-item>
<term id="G24-fphar.2026.1380586">
<bold>RI</bold>
</term>
<def>
<p>Rivaroxaban</p>
</def>
</def-item>
<def-item>
<term id="G25-fphar.2026.1380586">
<bold>RMSE</bold>
</term>
<def>
<p>Root Mean Squared Error</p>
</def>
</def-item>
<def-item>
<term id="G26-fphar.2026.1380586">
<bold>SD</bold>
</term>
<def>
<p>Standard Deviation</p>
</def>
</def-item>
<def-item>
<term id="G27-fphar.2026.1380586">
<bold>SE</bold>
</term>
<def>
<p>Standard Error</p>
</def>
</def-item>
<def-item>
<term id="G28-fphar.2026.1380586">
<bold>SIMEX</bold>
</term>
<def>
<p>Simulation Extrapolation</p>
</def>
</def-item>
<def-item>
<term id="G29-fphar.2026.1380586">
<bold>THIN</bold>
</term>
<def>
<p>The Health Improvement Network</p>
</def>
</def-item>
<def-item>
<term id="G30-fphar.2026.1380586">
<bold>WA</bold>
</term>
<def>
<p>Warfarin</p>
</def>
</def-item>
</def-list>
</sec>
<fn-group>
<fn fn-type="custom" custom-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/42464/overview">Bernd Rosenkranz</ext-link>, Fundisa African Academy of Medicines Development, South Africa</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2657831/overview">Samer Mouksassi</ext-link>, Certara, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2709317/overview">Nouran Omar El Said</ext-link>, Future University in Egypt, Egypt</p>
</fn>
</fn-group>
</back>
</article>