<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="brief-report" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Public Health</journal-id>
<journal-title-group>
<journal-title>Frontiers in Public Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Public Health</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-2565</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpubh.2025.1729822</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Perspective</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Addressing the need for economic modelling when designing and reporting a diagnostic testing accuracy study</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Xie</surname>
<given-names>Xuanqian</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3251681"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Guo</surname>
<given-names>Jennifer</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Holodinsky</surname>
<given-names>Jessalyn K.</given-names>
</name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/594976"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Fu</surname>
<given-names>Rui</given-names>
</name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
<xref ref-type="aff" rid="aff9"><sup>9</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3000711"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Acute and Hospital-Based Care, Ontario Health</institution>, <city>Toronto</city>, <state>ON</state>, <country country="ca">Canada</country></aff>
<aff id="aff2"><label>2</label><institution>Institute of Health Policy, Management and Evaluation, University of Toronto</institution>, <city>Toronto</city>, <state>ON</state>, <country country="ca">Canada</country></aff>
<aff id="aff3"><label>3</label><institution>Departments of Emergency Medicine, Community Health Sciences and Clinical Neurosciences, Cumming School of Medicine, University of Calgary</institution>, <city>Calgary</city>, <state>AB</state>, <country country="ca">Canada</country></aff>
<aff id="aff4"><label>4</label><institution>Centre for Health Informatics, Cumming School of Medicine, University of Calgary</institution>, <city>Calgary</city>, <state>AB</state>, <country country="ca">Canada</country></aff>
<aff id="aff5"><label>5</label><institution>O&#x2019;Brien Institute for Public Health, Cumming School of Medicine, University of Calgary</institution>, <city>Calgary</city>, <state>AB</state>, <country country="ca">Canada</country></aff>
<aff id="aff6"><label>6</label><institution>Alberta Children&#x2019;s Hospital Research Institute, Cumming School of Medicine, University of Calgary</institution>, <city>Calgary</city>, <state>AB</state>, <country country="ca">Canada</country></aff>
<aff id="aff7"><label>7</label><institution>Hotchkiss Brain Institute, Cumming School of Medicine, University of Calgary</institution>, <city>Calgary</city>, <state>AB</state>, <country country="ca">Canada</country></aff>
<aff id="aff8"><label>8</label><institution>Departments of Community Health Sciences, Surgery and Oncology, University of Calgary, Cumming School of Medicine</institution>, <city>Calgary</city>, <state>AB</state>, <country country="ca">Canada</country></aff>
<aff id="aff9"><label>9</label><institution>The Ohlson Research Initiative, Arnie Charbonneau Cancer Institute, University of Calgary</institution>, <city>Calgary</city>, <state>AB</state>, <country country="ca">Canada</country></aff>
<author-notes>
<corresp id="c001"><label>&#x002A;</label>Correspondence: Rui Fu, <email xlink:href="mailto:rui.fu@ucalgary.ca">rui.fu@ucalgary.ca</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-01-07">
<day>07</day>
<month>01</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1729822</elocation-id>
<history>
<date date-type="received">
<day>21</day>
<month>10</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>28</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>15</day>
<month>12</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2026 Xie, Guo, Holodinsky and Fu.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Xie, Guo, Holodinsky and Fu</copyright-holder>
<license>
<ali:license_ref start_date="2026-01-07">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Model-based economic evaluations rely on results of diagnostic test accuracy (DTA) studies to assess the value-for-money of a new diagnostic or prognostic test. The 30-item Standards for Reporting of Diagnostic Accuracy Studies (STARD) 2015 guidelines are the gold-standard guidelines for DTA studies. In this Perspective paper, we conducted a rapid review of publicly available economic evaluations of a new diagnostic test between 2012 and 2025 to formulate eight elements that we believe could be added to STARD 2015 to help enhance the credibility of DTA-based economic evaluations. Examples from the rapid review and practical recommendations were provided.</p>
</abstract>
<kwd-group>
<kwd>diagnostic test</kwd>
<kwd>economic evaluations</kwd>
<kwd>false negative</kwd>
<kwd>false positive</kwd>
<kwd>health technology assessment</kwd>
<kwd>test accuracy</kwd>
<kwd>true prevalence</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. RF is supported by the Alberta Cancer Foundation and the Arthur J.E. Child Foundation through an innovation catalyst grant.</funding-statement>
</funding-group>
<counts>
<fig-count count="0"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="24"/>
<page-count count="6"/>
<word-count count="4965"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Health Economics</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Model-based economic evaluations are essential tools in health technology assessment (HTA) to inform funding recommendations for new interventions, including new diagnostic or prognostic tests (termed an index test henceforth) (<xref ref-type="bibr" rid="ref1">1</xref>). To populate an economic model, data on test performance are derived from diagnostic test accuracy (DTA) studies, which present standard test accuracy measures (e.g., sensitivity and specificity). However, to model the long-term cost and effectiveness of an index test, further information, that is often beyond the scope of a traditional DTA study, may be required. The Standards for Reporting Diagnostic Accuracy (STARD) 2015 statement is one of the gold-standard guidelines for reporting DTA studies (<xref ref-type="bibr" rid="ref2">2</xref>). However, STARD 2015 has been largely developed for ensuring reporting completeness and transparency in medical research and may not include items that are important for an economic evaluation. In this Perspective article, we proposed additional items for STARD 2015 based on the gaps identified from published economic evaluations. These preliminary findings may have implications on mitigating the gaps between the standard of reporting DTA studies and the conduct of high-quality economic evaluations.</p>
</sec>
<sec id="sec2">
<label>2</label>
<title>Study procedures</title>
<p>A rapid review was conducted on the International HTA Database of the International Network of Agencies for Health Technology Assessment<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref> for publicly available reports evaluating an index test using model-based economic evaluation from January 2012 to September 2025. For selected reports, we identified model parameters and/or underlying assumptions that had been recognized to have impacted the final results with limited information from a DTA study. Then, using the 30-item STARD 2015 guideline (<xref ref-type="bibr" rid="ref2">2</xref>), we delineated whether these missing data had been explicitly mentioned in this guideline; if not, we formulated items that we recommended to be added to STARD 2015 via discussion within the research team. The initial search combining keywords and MeSH headings (such as &#x2018;Diagnostic Screening Programs&#x2019;) yielded 166 records, of which 25 were relevant after the title/abstract and the full-text screen. We highlighted eight articles (<xref ref-type="bibr" rid="ref3 ref4 ref5 ref6 ref7 ref8 ref9 ref10">3&#x2013;10</xref>) in this paper.</p>
</sec>
<sec sec-type="results" id="sec3">
<label>3</label>
<title>Results</title>
<p>This study process yielded eight extended items for STARD 2015 (termed E1-E8, <xref ref-type="table" rid="tab1">Table 1</xref>) including five new items for reporting study results and three new items for reporting the discussion. Below we provide a brief description of each item with rationale and examples obtained from the rapid review.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Recommended items for extending the STARD 2015 guideline to facilitate the conduct of economic evaluations of a new diagnostic or prognostic test (an index test).</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Section and topic</th>
<th align="center" valign="top">No</th>
<th align="center" valign="top">Item</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" colspan="3">Results</td>
</tr>
<tr>
<td align="left" valign="middle">Consequences of false index test results</td>
<td align="center" valign="middle">E1</td>
<td align="center" valign="middle">The health and cost consequences of individuals receiving a false diagnosis from the index test should be clearly described, including when and how the false result can be identified and corrected.</td>
</tr>
<tr>
<td align="left" valign="middle">The role of the index test in a diagnostic pathway when multiple tests are involved</td>
<td align="center" valign="middle">E2</td>
<td align="center" valign="middle">The expected or observed role of an index test within an existing diagnostic pathway and the decision rules if multiple tests are involved should be clearly described.</td>
</tr>
<tr>
<td align="left" valign="middle">Distribution of other diseases in individuals receiving a negative index test result</td>
<td align="center" valign="middle">E3</td>
<td align="center" valign="middle">For &#x201C;symptomatic&#x201D; individuals who receive a negative test result, DTA studies should explore and report the underlying distribution of other diseases in this patient population.</td>
</tr>
<tr>
<td align="left" valign="middle">Use of composite reference standard to address an imperfect reference test</td>
<td align="center" valign="middle">E4</td>
<td align="center" valign="middle">It should be clearly stated if an imperfect reference test (e.g., composite reference standard or other methods) is used to evaluate an index test and how the associated limitations are addressed (if applicable).</td>
</tr>
<tr>
<td align="left" valign="middle">Health-related quality of life by the index test result and underlying disease status</td>
<td align="center" valign="middle">E5</td>
<td align="center" valign="middle">DTA studies should establish a baseline health-related quality of life (HRQOL) to allow economic evaluations to derive utility values based on the index test result and underlying disease status.</td>
</tr>
<tr>
<td align="left" valign="middle" colspan="3">Discussion</td>
</tr>
<tr>
<td align="left" valign="middle">Robust estimation of true disease prevalence</td>
<td align="center" valign="middle">E6</td>
<td align="center" valign="middle">Discussion and/or a sensitivity analysis on the limitations associated with a potentially biased disease prevalence estimate should be provided.</td>
</tr>
<tr>
<td align="left" valign="middle">Accuracy of an index test enabled by artificial intelligence (AI)</td>
<td align="center" valign="middle">E7</td>
<td align="center" valign="middle">DTA studies of an AI-enabled index test should report data on model performance over time or comment on the limitations associated with not being able to assess time-dependent accuracy.</td>
</tr>
<tr>
<td align="left" valign="middle">Resources used for performing the index test</td>
<td align="center" valign="middle">E8</td>
<td align="center" valign="middle">DTA studies should present data or comment on the resources and costs of performing the index test.</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>STARD, Standards for Reporting Diagnostic Accuracy; DTA, diagnostic test accuracy; AI, artificial intelligence; HRQOL, health related quality of life.</p>
</table-wrap-foot>
</table-wrap>
<sec id="sec4">
<label>3.1</label>
<title>Consequences of false index test results (E1)</title>
<p><italic>Description</italic>: The health and cost consequences of individuals receiving a false diagnosis from the index test should be clearly described, including when and how the false result can be identified and corrected.</p>
<p><italic>Rationale</italic>: While DTA studies present a direct comparison between the index and the reference tests, economic evaluations tend to model the real-world clinical pathway in which generally only one type of test (index or reference) is received by an individual at the time. This means that in order to accurately reflect the disease progression of individuals post-testing, false test results need to be explicitly modelled. We herein recommend DTA studies to report the health consequences of individuals with a false index test result to facilitate economic modelling. Furthermore, the timing of the potential detection and even correction of these false test results should be described. For instance, individuals with a false negative test result may be detected retroactively via the discovery of unexpected disease progression or exacerbations that are deemed to be attributed to a false diagnosis; the incurred losses of health may be quantified in a DTA study. Individuals with a false positive test may be subject to overtreatment, leading to a decrement in the quality of life.</p>
<p><italic>Example</italic>: In a systematic review of economic evaluations on hand-held electrochemical devices for monitoring fractions of exhaled nitric oxide for the diagnosis of asthma (<xref ref-type="bibr" rid="ref3">3</xref>), the omission of health consequences associated with an incorrect diagnosis was identified to be a major limitation of the published studies. A primary economic evaluation was then performed to overcome this limitation; however, given the paucity of data in the DTA literature, expert opinions were used to determine key model parameters including the number of years required to detect and correct a false diagnosis result, rendering the final modelling findings to be uncertain.</p>
</sec>
<sec id="sec5">
<label>3.2</label>
<title>The role of the index test in a diagnostic pathway when multiple tests are involved (E2)</title>
<p><italic>Description</italic>: The expected or observed role of an index test within an existing diagnostic pathway and the decision rules if multiple tests are involved should be clearly described.</p>
<p><italic>Rationale</italic>: To arrive at a final diagnosis, individuals are sometimes exposed to more than one type of test (<xref ref-type="bibr" rid="ref11">11</xref>). When an index test is part of a diagnostic pathway with other tests, the DTA study should clarify or propose the role of the index test as the following (<xref ref-type="bibr" rid="ref12">12</xref>): a replacement (i.e., replacing one or more existing tests due to an increase in diagnostic accuracy), a triage (i.e., preceding the conduct of existing tests for risk stratification so that some individuals may not require the subsequent tests), or an add-on (i.e., to be performed as an additional test in the existing diagnostic pathway). In the presence of multiple tests (<xref ref-type="bibr" rid="ref11">11</xref>), an &#x2018;OR&#x2019; rule may be applicable on some occasions where a positive diagnostic result is reached given any positive individual test result. In other instances, a positive diagnostic result may only be reached if all individual tests are positive (i.e., the &#x2018;AND&#x2019; rule). When the results of multiple tests are strongly correlated due to an underlying dependence structure (<xref ref-type="bibr" rid="ref13">13</xref>), the DTA study may want to report such pairwise correlations and discuss the possibility of omitting one of these tests to streamline the diagnostic pathway.</p>
<p><italic>Example</italic>: In 2024, an economic model (<xref ref-type="bibr" rid="ref4">4</xref>) was published comparing the budget impact of adopting four diagnostic pathways of latent tuberculosis infection involving an interferon-gamma release assay (IGRA) and/or the standard tuberculin skin test (TST), including: i) TST alone; ii) IGRA alone; iii) IGRA following a positive TST result where those tested positive in both tests were deemed to have the disease (i.e., applying the &#x2018;AND&#x2019; rule); and iv) TST following a negative IGRA result where individuals receiving a positive result in any test were diagnosed (i.e., applying the &#x2018;OR&#x2019; rule). Compared with single-test strategies (i or ii), the &#x2018;AND rule in strategy iii was associated with a lower probability of being treated and lower per-person costs, while the &#x2018;OR&#x2019; rule in strategy iv resulted in a higher probability of being treated and higher per-person costs.</p>
</sec>
<sec id="sec6">
<label>3.3</label>
<title>Distribution of other diseases in individuals receiving a negative index test result (E3)</title>
<p><italic>Description</italic>: For &#x201C;symptomatic&#x201D; individuals who receive a negative index test result, DTA studies should explore and report the underlying distribution of other diseases in this patient population.</p>
<p><italic>Rationale</italic>: Many symptoms such as cough and headache are associated with more than one possible underlying diseases. As such, an individual in receipt of a correct negative result from the index test (i.e., true negative) may have other undiagnosed health conditions with both cost and quality-of-life implications. In an economic model, these individuals are typically assumed to enter the &#x201C;healthy (disease-free)&#x201D; state following a true negative index test result. Until data are made available from DTA studies to illustrate the underlying distribution of diseases in this heterogenous patient population, a comprehensive modelling of the clinical pathway is not feasible.</p>
<p><italic>Example</italic>: Asthma, chronic obstructive pulmonary disease (COPD) and congestive heart failure (CHF) are distinct diseases that share many symptoms including the shortness of breath, while the latter two diseases are associated with considerably higher health and cost burdens. In a 2017 economic evaluation on diagnostic tests for asthma (<xref ref-type="bibr" rid="ref5">5</xref>), the possibility of individuals tested negative for asthma but otherwise had COPD or CHF was entertained in the economic model. However, due to the paucity of objective data on the distribution of COPD/CHF in this patient population, only expert opinions were used to populate the model.</p>
</sec>
<sec id="sec7">
<label>3.4</label>
<title>Use of composite reference standard to address an imperfect reference test (E4)</title>
<p><italic>Description:</italic> It should be clearly stated if an imperfect reference test (e.g., composite reference standard or other methods) is used to evaluate an index test and how the associated limitations are addressed (if applicable).</p>
<p><italic>Rationale:</italic> An imperfect reference test is used to evaluate an index test when a perfect test (i.e., the gold-standard test for determining disease status) is unavailable (<xref ref-type="bibr" rid="ref14">14</xref>). Due to the inherent limitations of an imperfect reference test, a biased estimation on the accuracy of the index test may arise. For example, despite an index test producing the correct diagnosis for an individual, a DTA study relying on an imperfect reference test may render that diagnosis to be incorrect/false, and thereby introduces errors in the subsequent economic evaluation. To address this limitation, one approach is to assess the index test against a composite reference standard, which classifies individuals into disease positive or negative groups using multiple imperfect tests, though this method has its own limitations related to the uncertainty of the true disease prevalence (<xref ref-type="bibr" rid="ref15">15</xref>). More sophisticated methods (e.g., latent-class models) are emerging to tackle this issue (<xref ref-type="bibr" rid="ref14">14</xref>, <xref ref-type="bibr" rid="ref15">15</xref>).</p>
<p><italic>Example:</italic> Diagnosis of community-acquired pneumonia caused by <italic>Streptococcus pneumoniae</italic> in adults is often based on a composite reference standard using culture methods (blood culture, sputum, and cultures of other respiratory samples) (<xref ref-type="bibr" rid="ref10">10</xref>). The BinaxNOW <italic>S. pneumoniae</italic> (BinaxNOW-SP, the index test) is a urine-based test that can potentially achieve a faster and better diagnosis. In a 2013 review of 27 DTA studies (<xref ref-type="bibr" rid="ref10">10</xref>), a Bayesian latent-class meta-analysis suggested that the sensitivity of BinaxNOW-SP was higher than the composite reference standard, while both achieved high specificities. An economic evaluation was further conducted using the meta-analyzed test accuracy of the BinaxNOW-SP to improve the precision of the modelling results (<xref ref-type="bibr" rid="ref6">6</xref>).</p>
</sec>
<sec id="sec8">
<label>3.5</label>
<title>Health-related quality of life by the index test result and underlying disease status (E5)</title>
<p><italic>Description:</italic> DTA studies may want to establish a baseline health-related quality of life (HRQOL) to allow economic evaluations to derive utility values based on the index test result and underlying disease status.</p>
<p><italic>Rationale:</italic> Due to the paucity of health utility (HRQOL) data, health economists are confronted with the challenge of assigning a utility value to the population based on the index test result and the underlying disease status (i.e., true/false positive and negative groups; a total of four groups). The common approach is to start with a &#x201C;baseline&#x201D; HRQOL value (typically for the true-negative group) using the utility of the general disease-free population (<xref ref-type="bibr" rid="ref16">16</xref>, <xref ref-type="bibr" rid="ref17">17</xref>), and then be able to adjust that utility for the other three groups by incorporating an appropriate decrement. However, this approach has several pitfalls including not being able to account for individuals who tested negative but are otherwise living with other health conditions (see section 3.3) and incorrectly classifying individuals (and thereby assigning the &#x2018;wrong&#x2019; utility) due to the use of an imperfect reference test (see section 3.4). Also, the symptom burden for the true-positive and false-negative groups may be different, although both are categorized as having the disease in an economic model and likely will share the same utility value to capture HRQOL. We thereby recommend DTA studies to provide data that can define the baseline HRQOL of the patient population and provide suggestions on the best way to estimate the HRQOL based on the index test result and the underlying disease status.</p>
<p><italic>Example:</italic> In the asthma example that we previously presented in section 3.1 (<xref ref-type="bibr" rid="ref3">3</xref>), individuals receiving a negative index test for asthma (including true and false negatives) were assumed to have the same health utility value as the healthy population, while those who received a false positive result were assumed to experience the same disutility as those with true underlying asthma condition (i.e., true positives). These assumptions may lead to uncertainties in the final modelling results.</p>
</sec>
<sec id="sec9">
<label>3.6</label>
<title>Robust estimation of true disease prevalence (E6)</title>
<p><italic>Description:</italic> Discussion and/or a sensitivity analysis on the limitations associated with a potentially biased disease prevalence estimate should be provided.</p>
<p><italic>Rationale:</italic> Disease prevalence is key to determine the cost-effectiveness of an index test compared to the standard of care; however, in many cases the true prevalence of disease cannot be reliably estimated. Specifically, individuals with a negative test result are often not investigated further (e.g., those tested negative in cancer screening), and consequently, the true disease status of these individuals (whether they are a true or false positive in the first place) remains unknown (<xref ref-type="bibr" rid="ref18">18</xref>), leading to an underestimated disease prevalence. Furthermore, in the absence of a perfect reference standard, the calculation using the accuracy of an index test ([TP&#x202F;+&#x202F;FN]/[TP&#x202F;+&#x202F;FN&#x202F;+&#x202F;FP&#x202F;+&#x202F;TN]) may not reflect the true prevalence of the disease (<xref ref-type="bibr" rid="ref15">15</xref>). Advanced methods including latent-class modeling (<xref ref-type="bibr" rid="ref15">15</xref>) are emerging to reduce bias in estimating disease prevalence and may be adopted in the reporting of DTA studies.</p>
<p><italic>Example:</italic> An economic evaluation was conducted on noninvasive prenatal testing for trisomy 21 (Down syndrome) at 12-week gestation in 2019 (<xref ref-type="bibr" rid="ref7">7</xref>). To estimate the true prevalence of trisomy 21 at 12&#x202F;weeks, the report used the prevalence of trisomy 21 in live birth and the rate of spontaneous pregnancy loss from 12&#x202F;weeks to term due to the chromosomal anomaly to arrive at an estimation. This estimated prevalence was ultimately used in the economic evaluation.</p>
</sec>
<sec id="sec10">
<label>3.7</label>
<title>Accuracy of an index test enabled by artificial intelligence (AI; E7)</title>
<p><italic>Description</italic>: DTA studies of an AI-enabled index test should report data on model performance over time or comment on the limitations associated with not being able to assess time-dependent accuracy.</p>
<p><italic>Rationale</italic>: While most economic evaluations assume the performance of the index test to be constant over the modelled time horizon, there is an emerging class of diagnostic systems powered by AI with improving or degrading performance over time (<xref ref-type="bibr" rid="ref19">19</xref>, <xref ref-type="bibr" rid="ref20">20</xref>). Until adequate information is made available on how often these algorithms are expected to be updated, how these updates will occur, and the time-dependent change of the underlying algorithm (i.e., learning curves), a comprehensive economic evaluation is not feasible (<xref ref-type="bibr" rid="ref21">21</xref>).</p>
<p><italic>Example</italic>: A 2022 evaluation found an AI-assisted computed tomography (CT) scan protocol for lung cancer screening in high-risk adults to be cost-effective over radiologist-interpreted CT scans for the healthcare system over a 20-year time horizon (<xref ref-type="bibr" rid="ref8">8</xref>). The sensitivity and specificity of the two protocols were obtained from a single DTA study (<xref ref-type="bibr" rid="ref22">22</xref>) and assumed to remain constant over time. Interestingly, this DTA study also found the underlying deep learning algorithms to be superior to radiologists only during the initial screening, but became on-par when radiologists had access to previous examinations. These results were not incorporated into the economic evaluation and thus may imply the cost-effectiveness results to be overly optimistic favoring the AI-assisted CT scan protocol in a longitudinal screening setting.</p>
</sec>
<sec id="sec11">
<label>3.8</label>
<title>Resources used for performing the index test (E8)</title>
<p><italic>Description</italic>: DTA studies should present data or comment on the resources and costs of performing the index test.</p>
<p><italic>Rationale</italic>: In an economic evaluation, the listing prices of products and services (e.g., technical support and maintenance agreement) obtained from the manufacturers are typically used to estimate the cost of an index test. This method has likely resulted in an underestimation as other cost components including infrastructure depreciation or new purchases, professional fees paid to technicians and other personnel, fees of obtaining the license or specialized software, and other operation costs, are not considered. For example, hospitals that need to establish a new lab (and recruiting personnel) to perform an index test may incur substantial upfront expenditures. We recommend investigators to present this information in a DTA study.</p>
<p><italic>Example</italic>: In an economic evaluation of a DNA methylation&#x2013;based classifier test for central nervous system tumors (<xref ref-type="bibr" rid="ref9">9</xref>), the capital costs were not included in the reference-case analysis. The inclusion of capital costs (e.g., purchase and equip the entire platform and obtain the license to use the technology) would substantially inflate the cost of testing, and thereby resulting in a less favorable cost-effectiveness profile for the index test. This index test is also powered by a random forest (a type of machine learning algorithm) classification model, which introduces further complexity on how to properly evaluate its cost-effectiveness against the usual care, given the lack of primary DTA data and analytical guidance (see section 3.7).</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec12">
<label>4</label>
<title>Discussion</title>
<p>DTA studies often provide the foundational data to inform an economic evaluation of an index test. Through a structured process, we provided recommendations on five additional items that DTA investigators may want to assess as secondary outcomes (items E1 to E5) and three additional items to be elaborated in the discussion, if primary data collection/analysis is not feasible (items E6 to E8). Note that some of these recommended items are not entirely independent from the original items in STARD 2015 but we provided more specific and actionable instructions with the goal of improving the appropriate use of DTA data in economic evaluations. For example, the STARD 2015 guidelines recommend the reporting of &#x201C;the intended use and clinical role of the index test&#x201D; in the background and discussion sections of a DTA study (<xref ref-type="bibr" rid="ref2">2</xref>). Built upon this, our item E2 further specified that DTA studies may want to explicitly present the decision rules involving the index test in a diagnostic pathway and report the conditional dependence between tests. Similarly, the STARD 2015 has called for a description on the reference standard &#x201C;in sufficient details to allow replication&#x201D; (<xref ref-type="bibr" rid="ref2">2</xref>); in our item E4, we further clarified that in the case of using an imperfect reference standard, DTA researchers should explicitly discuss the associated limitations and consider exploring more sophisticated methods to minimize impact. In this paper, we did not elaborate on the implementation of our proposed items especially for E6&#x2013;E8 that we considered to be more difficult to examine. For example, in item E7 we recommend DTA studies to discuss the implications of time-dependent performance of an AI-enabled index test even if these longitudinal data are difficult to obtain due to barriers in implementing AI algorithms, even for pilot testing (<xref ref-type="bibr" rid="ref23">23</xref>). This recommendation also aligns with regulations such as those from the US Food and Drug Administration who only evaluates AI tools with a locked algorithm and requires new applications whenever the algorithm has been updated (<xref ref-type="bibr" rid="ref24">24</xref>). Overall, we recommend health economists and health decision scientists to actively participate in the creation of DTA reporting guidelines to ensure the inclusion of essential data elements for an economic evaluation.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec13">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="sec14">
<title>Author contributions</title>
<p>XX: Conceptualization, Formal analysis, Investigation, Methodology, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. JG: Investigation, Methodology, Writing &#x2013; review &#x0026; editing. JH: Investigation, Methodology, Writing &#x2013; review &#x0026; editing. RF: Conceptualization, Formal analysis, Funding acquisition, Investigation, Methodology, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="COI-statement" id="sec15">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec16">
<title>Generative AI statement</title>
<p>The author(s) declared that Generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec17">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="disclaimer" id="sec18">
<title>Author disclaimer</title>
<p>The opinions expressed in this publication do not necessarily represent the opinions of Ontario Health. No endorsement is intended or should be inferred. The Alberta Cancer Foundation and the Arthur J.E. Child Foundation had no role in the design, collection, analyses or interpretation of the results of this study or in the preparation, review or approval of the manuscript.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><label>1.</label><mixed-citation publication-type="other"><person-group person-group-type="author"><collab id="coll1">Canadian Agency for Drugs and Technologies in Health</collab></person-group>. Guidelines for the economic evaluation of health technologies: Canada, 4th Edition. <year>2017</year>. Available online at: <ext-link xlink:href="https://www.cadth.ca/sites/default/files/pdf/guidelines_for_the_economic_evaluation_of_health_technologies_canada_4th_ed.pdf" ext-link-type="uri">https://www.cadth.ca/sites/default/files/pdf/guidelines_for_the_economic_evaluation_of_health_technologies_canada_4th_ed.pdf</ext-link> (Accessed August 11, 2024)</mixed-citation></ref>
<ref id="ref2"><label>2.</label><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Bossuyt</surname><given-names>PM</given-names></name> <name><surname>Reitsma</surname><given-names>JB</given-names></name> <name><surname>Bruns</surname><given-names>DE</given-names></name> <name><surname>Gatsonis</surname><given-names>CA</given-names></name> <name><surname>Glasziou</surname><given-names>PP</given-names></name> <name><surname>Irwig</surname><given-names>L</given-names></name> <etal/></person-group>:<fpage>2015</fpage> <article-title>STARD 2015: an updated list of essential items for reporting diagnostic accuracy studies</article-title>. <source>BMJ</source> (<volume>351</volume>:<fpage>h5527</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj.h5527</pub-id></mixed-citation></ref>
<ref id="ref3"><label>3.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Harnan</surname><given-names>SE</given-names></name> <name><surname>Tappenden</surname><given-names>P</given-names></name> <name><surname>Essat</surname><given-names>M</given-names></name> <name><surname>Gomersall</surname><given-names>T</given-names></name> <name><surname>Minton</surname><given-names>J</given-names></name> <name><surname>Wong</surname><given-names>R</given-names></name> <etal/></person-group>. <article-title>Measurement of exhaled nitric oxide concentration in asthma: a systematic review and economic evaluation of NIOX MINO, NIOX VERO and NObreath</article-title>. <source>Health Technol Assess</source>. (<year>2015</year>) <volume>19</volume>:<fpage>1</fpage>&#x2013;<lpage>330</lpage>. doi: <pub-id pub-id-type="doi">10.3310/hta19820</pub-id>, <pub-id pub-id-type="pmid">26484874</pub-id></mixed-citation></ref>
<ref id="ref4"><label>4.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><collab id="coll2">Ontario Health</collab></person-group>. <article-title>Interferon-gamma release assay testing for latent tuberculosis infection: a health technology assessment</article-title>. <source>Ont Health Technol Assess Ser</source>. (<year>2024</year>) <volume>24</volume>:<fpage>1</fpage>&#x2013;<lpage>183</lpage>.</mixed-citation></ref>
<ref id="ref5"><label>5.</label><mixed-citation publication-type="other"><person-group person-group-type="author"><collab id="coll3">National Institute for Health and Care Excellence</collab></person-group>. &#x201C;<article-title>Appendix M. Cost effectiveness analysis in diagnosis of asthma in adults and young people aged over 16</article-title>,&#x201D; <source>Asthma: diagnosis and monitoring of asthma in adults, children and young people (NICE guideline NG80)</source>. <publisher-name>National Guideline Centre</publisher-name>. <publisher-loc>London</publisher-loc>: <comment>NICE</comment> (<year>2017</year>). Available online at: <ext-link xlink:href="https://www.nice.org.uk/guidance/ng245/evidence/appendices-a-to-r-pdf-7079863937" ext-link-type="uri">https://www.nice.org.uk/guidance/ng245/evidence/appendices-a-to-r-pdf-7079863937</ext-link> (Accessed September 22, 2025)</mixed-citation></ref>
<ref id="ref6"><label>6.</label><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Sinclair</surname><given-names>A</given-names></name> <name><surname>Xie</surname><given-names>X</given-names></name> <name><surname>Dendukuri</surname><given-names>N</given-names></name></person-group>. <source>The clinical effectiveness and cost of a pneumococcal urine antigen immunochromatographic test (BinaxNOW <italic>Streptococcus pneumoniae</italic>) in the diagnosis of community acquired <italic>Streptococcus pneumoniae</italic> pneumonia in patients admitted to hospital</source>. <publisher-loc>Montreal (Canada): Technology Assessment Unit (TAU) of the McGill University Health Centre (MUHC). Report no. 57</publisher-loc>. (<year>2012</year>). p. <fpage>58</fpage>. Available online at: <ext-link xlink:href="https://secureweb.mcgill.ca/tau/sites/mcgill.ca.tau/files/muhc_tau_2011_57_binaxnow.pdf" ext-link-type="uri">https://secureweb.mcgill.ca/tau/sites/mcgill.ca.tau/files/muhc_tau_2011_57_binaxnow.pdf</ext-link> (Accessed October 3, 2025)</mixed-citation></ref>
<ref id="ref7"><label>7.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><collab id="coll4">Health Quality Ontario</collab></person-group>. <article-title>Noninvasive prenatal testing for trisomies 21, 18, and 13, sex chromosome aneuploidies, and microdeletions: a health technology assessment</article-title>. <source>Ont Health Technol Assess Ser</source>. (<year>2019</year>) <volume>19</volume>:<fpage>1</fpage>&#x2013;<lpage>166</lpage>.</mixed-citation></ref>
<ref id="ref8"><label>8.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ziegelmayer</surname><given-names>S</given-names></name> <name><surname>Graf</surname><given-names>M</given-names></name> <name><surname>Makowski</surname><given-names>M</given-names></name> <name><surname>Gawlitza</surname><given-names>J</given-names></name> <name><surname>Gassert</surname><given-names>F</given-names></name></person-group>. <article-title>Cost-effectiveness of artificial intelligence support in computed tomography-based lung Cancer screening</article-title>. <source>Cancer</source>. (<year>2022</year>) <volume>14</volume>:<fpage>1729</fpage>. doi: <pub-id pub-id-type="doi">10.3390/cancers14071729</pub-id>, <pub-id pub-id-type="pmid">35406501</pub-id></mixed-citation></ref>
<ref id="ref9"><label>9.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><collab id="coll5">Ontario Health</collab></person-group>. <article-title>DNA methylation&#x2013;based classification for central nervous system tumours: a health technology assessment</article-title>. <source>Ont Health Technol Assess Ser</source>. (<year>2025</year>) <volume>25</volume>:<fpage>1</fpage>&#x2013;<lpage>93</lpage>.</mixed-citation></ref>
<ref id="ref10"><label>10.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sinclair</surname><given-names>A</given-names></name> <name><surname>Xie</surname><given-names>X</given-names></name> <name><surname>Teltscher</surname><given-names>M</given-names></name> <name><surname>Dendukuri</surname><given-names>N</given-names></name></person-group>. <article-title>Systematic review and meta-analysis of a urine-based pneumococcal antigen test for diagnosis of community-acquired pneumonia caused by <italic>Streptococcus pneumoniae</italic></article-title>. <source>J Clin Microbiol</source>. (<year>2013</year>) <volume>51</volume>:<fpage>2303</fpage>&#x2013;<lpage>10</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JCM.00137-13</pub-id>, <pub-id pub-id-type="pmid">23678060</pub-id></mixed-citation></ref>
<ref id="ref11"><label>11.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Xie</surname><given-names>X</given-names></name> <name><surname>Tiggelaar</surname><given-names>S</given-names></name> <name><surname>Guo</surname><given-names>J</given-names></name> <name><surname>Wang</surname><given-names>M</given-names></name> <name><surname>Vandersluis</surname><given-names>S</given-names></name> <name><surname>Ungar</surname><given-names>WJ</given-names></name></person-group>. <article-title>Developing economic models for assessing the cost-effectiveness of multiple diagnostic tests: methods and applications</article-title>. <source>Med Decis Mak</source>. (<year>2022</year>) <volume>42</volume>:<fpage>861</fpage>&#x2013;<lpage>71</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0272989X221089268</pub-id>, <pub-id pub-id-type="pmid">35373634</pub-id></mixed-citation></ref>
<ref id="ref12"><label>12.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bossuyt</surname><given-names>PM</given-names></name> <name><surname>Irwig</surname><given-names>L</given-names></name> <name><surname>Craig</surname><given-names>J</given-names></name> <name><surname>Glasziou</surname><given-names>P</given-names></name></person-group>. <article-title>Comparative accuracy: assessing new tests against existing diagnostic pathways</article-title>. <source>BMJ</source>. (<year>2006</year>) <volume>332</volume>:<fpage>1089</fpage>&#x2013;<lpage>92</lpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj.332.7549.1089</pub-id>, <pub-id pub-id-type="pmid">16675820</pub-id></mixed-citation></ref>
<ref id="ref13"><label>13.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>Z</given-names></name> <name><surname>Dendukuri</surname><given-names>N</given-names></name> <name><surname>Joseph</surname><given-names>L</given-names></name></person-group>. <article-title>Understanding the effects of conditional dependence in research studies involving imperfect diagnostic tests</article-title>. <source>Stat Med</source>. (<year>2017</year>) <volume>36</volume>:<fpage>466</fpage>&#x2013;<lpage>80</lpage>. doi: <pub-id pub-id-type="doi">10.1002/sim.7148</pub-id>, <pub-id pub-id-type="pmid">27730659</pub-id></mixed-citation></ref>
<ref id="ref14"><label>14.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Xie</surname><given-names>X</given-names></name> <name><surname>Sinclair</surname><given-names>A</given-names></name> <name><surname>Dendukuri</surname><given-names>N</given-names></name></person-group>. <article-title>Evaluating the accuracy and economic value of a new test in the absence of a perfect reference test</article-title>. <source>Res Synth Methods</source>. (<year>2017</year>) <volume>8</volume>:<fpage>321</fpage>&#x2013;<lpage>32</lpage>. doi: <pub-id pub-id-type="doi">10.1002/jrsm.1243</pub-id>, <pub-id pub-id-type="pmid">28544646</pub-id></mixed-citation></ref>
<ref id="ref15"><label>15.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dendukuri</surname><given-names>N</given-names></name> <name><surname>Schiller</surname><given-names>I</given-names></name> <name><surname>De Groot</surname><given-names>J</given-names></name> <name><surname>Libman</surname><given-names>M</given-names></name> <name><surname>Moons</surname><given-names>K</given-names></name> <name><surname>Reitsma</surname><given-names>J</given-names></name> <etal/></person-group>. <article-title>Concerns about composite reference standards in diagnostic research</article-title>. <source>BMJ</source>. (<year>2018</year>):<fpage>j5779</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj.j5779</pub-id>, <pub-id pub-id-type="pmid">29348126</pub-id></mixed-citation></ref>
<ref id="ref16"><label>16.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Poder</surname><given-names>TG</given-names></name> <name><surname>Carrier</surname><given-names>N</given-names></name> <name><surname>Kouakou</surname><given-names>CRC</given-names></name></person-group>. <article-title>Quebec health-related quality-of-life population norms using the EQ-5D-5L: decomposition by sociodemographic data and health problems</article-title>. <source>Value Health</source>. (<year>2020</year>) <volume>23</volume>:<fpage>251</fpage>&#x2013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jval.2019.08.008</pub-id>, <pub-id pub-id-type="pmid">32113631</pub-id></mixed-citation></ref>
<ref id="ref17"><label>17.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yan</surname><given-names>J</given-names></name> <name><surname>Xie</surname><given-names>S</given-names></name> <name><surname>Johnson</surname><given-names>JA</given-names></name> <name><surname>Pullenayegum</surname><given-names>E</given-names></name> <name><surname>Ohinmaa</surname><given-names>A</given-names></name> <name><surname>Bryan</surname><given-names>S</given-names></name> <etal/></person-group>. <article-title>Canada population norms for the EQ-5D-5L</article-title>. <source>Eur J Health Econ</source>. (<year>2024</year>) <volume>25</volume>:<fpage>147</fpage>&#x2013;<lpage>55</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10198-023-01570-1</pub-id>, <pub-id pub-id-type="pmid">36828968</pub-id></mixed-citation></ref>
<ref id="ref18"><label>18.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Xie</surname><given-names>X</given-names></name> <name><surname>Gajic-Veljanoski</surname><given-names>O</given-names></name> <name><surname>Falk</surname><given-names>L</given-names></name> <name><surname>Schaink</surname><given-names>AK</given-names></name> <name><surname>Lambrinos</surname><given-names>A</given-names></name> <name><surname>Wang</surname><given-names>M</given-names></name> <etal/></person-group>. <article-title>Challenges in health technology assessments of genetic tests</article-title>. <source>J Hosp Manag Health Policy</source>. (<year>2020</year>) <volume>4</volume>:<fpage>27</fpage>&#x2013;<lpage>7</lpage>. doi: <pub-id pub-id-type="doi">10.21037/jhmhp-20-47</pub-id></mixed-citation></ref>
<ref id="ref19"><label>19.</label><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Guan</surname><given-names>H</given-names></name> <name><surname>Bates</surname><given-names>D</given-names></name> <name><surname>Zhou</surname><given-names>L</given-names></name></person-group>. <article-title>Keeping medical AI healthy: a review of detection and correction methods for system degradation</article-title> <source>arXiv [Preprint]</source>. (<year>2025</year>) <fpage>2506.17442</fpage>. doi: <pub-id pub-id-type="doi">10.48550/arXiv.2506.17442</pub-id></mixed-citation></ref>
<ref id="ref20"><label>20.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vela</surname><given-names>D</given-names></name> <name><surname>Sharp</surname><given-names>A</given-names></name> <name><surname>Zhang</surname><given-names>R</given-names></name> <name><surname>Nguyen</surname><given-names>T</given-names></name> <name><surname>Hoang</surname><given-names>A</given-names></name> <name><surname>Pianykh</surname><given-names>OS</given-names></name></person-group>. <article-title>Temporal quality degradation in AI models</article-title>. <source>Sci Rep</source>. (<year>2022</year>) <volume>12</volume>:<fpage>11654</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-022-15245-z</pub-id>, <pub-id pub-id-type="pmid">35803963</pub-id></mixed-citation></ref>
<ref id="ref21"><label>21.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kwong</surname><given-names>JCC</given-names></name> <name><surname>Nguyen</surname><given-names>D-D</given-names></name> <name><surname>Khondker</surname><given-names>A</given-names></name> <name><surname>Li</surname><given-names>T</given-names></name> <name><surname>Kulkarni</surname><given-names>GS</given-names></name></person-group>. <article-title>Five years after CONSORT-AI, not much has changed: a call to action for artificial intelligence research in oncology</article-title>. <source>BMJ Oncol</source>. (<year>2025</year>) <volume>4</volume>:<fpage>e000891</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmjonc-2025-000891</pub-id>, <pub-id pub-id-type="pmid">40923021</pub-id></mixed-citation></ref>
<ref id="ref22"><label>22.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ardila</surname><given-names>D</given-names></name> <name><surname>Kiraly</surname><given-names>AP</given-names></name> <name><surname>Bharadwaj</surname><given-names>S</given-names></name> <name><surname>Choi</surname><given-names>B</given-names></name> <name><surname>Reicher</surname><given-names>JJ</given-names></name> <name><surname>Peng</surname><given-names>L</given-names></name> <etal/></person-group>. <article-title>End-to-end lung cancer screening with three-dimensional deep learning on low-dose chest computed tomography</article-title>. <source>Nat Med</source>. (<year>2019</year>) <volume>25</volume>:<fpage>954</fpage>&#x2013;<lpage>61</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41591-019-0447-x</pub-id>, <pub-id pub-id-type="pmid">31110349</pub-id></mixed-citation></ref>
<ref id="ref23"><label>23.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hassan</surname><given-names>M</given-names></name> <name><surname>Kushniruk</surname><given-names>A</given-names></name> <name><surname>Borycki</surname><given-names>E</given-names></name></person-group>. <article-title>Barriers to and facilitators of artificial intelligence adoption in health care: scoping review</article-title>. <source>JMIR Hum Factors</source>. (<year>2024</year>) <volume>11</volume>:<fpage>e48633</fpage>. doi: <pub-id pub-id-type="doi">10.2196/48633</pub-id>, <pub-id pub-id-type="pmid">39207831</pub-id></mixed-citation></ref>
<ref id="ref24"><label>24.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Singh</surname><given-names>V</given-names></name> <name><surname>Cheng</surname><given-names>S</given-names></name> <name><surname>Kwan</surname><given-names>AC</given-names></name> <name><surname>Ebinger</surname><given-names>J</given-names></name></person-group>. <article-title>United States Food and Drug Administration regulation of clinical software in the era of artificial intelligence and machine learning</article-title>. <source>Mayo Clinic Proc. Digital Health</source>. (<year>2025</year>) <volume>3</volume>:<fpage>100231</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.mcpdig.2025.100231</pub-id>, <pub-id pub-id-type="pmid">40673280</pub-id></mixed-citation></ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0002">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1577340/overview">George Gourzoulidis</ext-link>, Health Through Evidence, Greece</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0003">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1807485/overview">David Bardey</ext-link>, University of Los Andes, Colombia</p>
</fn>
</fn-group>
<fn-group>
<fn id="fn0001">
<label>1</label>
<p><ext-link xlink:href="https://database.inahta.org/" ext-link-type="uri">https://database.inahta.org/</ext-link></p>
</fn>
</fn-group>
</back>
</article>