<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Digit. Health</journal-id>
<journal-title>Frontiers in Digital Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Digit. Health</abbrev-journal-title>
<issn pub-type="epub">2673-253X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fdgth.2025.1523953</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Digital Health</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Using artificial intelligence to develop a measure of orthopaedic treatment success from clinical notes</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes"><name><surname>Floyd</surname><given-names>Sarah B.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref><uri xlink:href="https://loop.frontiersin.org/people/2888034/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/></contrib>
<contrib contrib-type="author"><name><surname>Almeldien</surname><given-names>Ahmed G.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/></contrib>
<contrib contrib-type="author"><name><surname>Smith</surname><given-names>D. Hudson</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/></contrib>
<contrib contrib-type="author"><name><surname>Judkins</surname><given-names>Benjamin</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/></contrib>
<contrib contrib-type="author"><name><surname>Krohn</surname><given-names>Claire E.</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/></contrib>
<contrib contrib-type="author"><name><surname>Reynolds</surname><given-names>Zachary Cole</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/></contrib>
<contrib contrib-type="author"><name><surname>Jeray</surname><given-names>Kyle</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/></contrib>
<contrib contrib-type="author"><name><surname>Obeid</surname><given-names>Jihad S.</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/122113/overview" />
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/></contrib>
</contrib-group>
<aff id="aff1"><label><sup>1</sup></label><institution>Department of Public Health Sciences, Clemson University</institution>, <addr-line>Clemson, SC</addr-line>, <country>United States</country></aff>
<aff id="aff2"><label><sup>2</sup></label><institution>Biomedical Data Science and Informatics Program, Clemson University</institution>, <addr-line>Clemson, SC</addr-line>, <country>United States</country></aff>
<aff id="aff3"><label><sup>3</sup></label><institution>Department of Mathematical and Statistical Sciences, Clemson University</institution>, <addr-line>Clemson, SC</addr-line>, <country>United States</country></aff>
<aff id="aff4"><label><sup>4</sup></label><institution>Department of Orthopaedic Surgery, Prisma Health</institution>, <addr-line>Greenville, SC</addr-line>, <country>United States</country></aff>
<aff id="aff5"><label><sup>5</sup></label><institution>Department of Public Health Sciences, Medical University of South Carolina</institution>, <addr-line>Charleston, SC</addr-line>, <country>United States</country></aff>
<author-notes>
<fn fn-type="edited-by"><p><bold>Edited by:</bold> Phoey Lee Teh, Glynd&#x0175;r University, United Kingdom</p></fn>
<fn fn-type="edited-by"><p><bold>Reviewed by:</bold> Daisy Monika Lal, Lancaster University, United Kingdom</p>
<p>Chukwudi Uwasomba, The Open University, United Kingdom</p></fn>
<corresp id="cor1"><label>&#x002A;</label><bold>Correspondence:</bold> Sarah B. Floyd <email>sbf@clemson.edu</email></corresp>
</author-notes>
<pub-date pub-type="epub"><day>24</day><month>04</month><year>2025</year></pub-date>
<pub-date pub-type="collection"><year>2025</year></pub-date>
<volume>7</volume><elocation-id>1523953</elocation-id>
<history>
<date date-type="received"><day>04</day><month>12</month><year>2024</year></date>
<date date-type="accepted"><day>26</day><month>03</month><year>2025</year></date>
</history>
<permissions>
<copyright-statement>&#x00A9; 2025 Floyd, Almeldien, Smith, Judkins, Krohn, Reynolds, Jeray and Obeid.</copyright-statement>
<copyright-year>2025</copyright-year><copyright-holder>Floyd, Almeldien, Smith, Judkins, Krohn, Reynolds, Jeray and Obeid</copyright-holder><license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><sec><title>Introduction</title>
<p>A readily available outcome measure that reflects the success of a patient&#x0027;s treatment is needed to demonstrate the value of orthopaedic interventions. Patient-reported outcome measures (PROMs) are survey-based instruments that collect joint-specific and general health perceptions on symptoms, functioning, and health-related quality of life. PROMs are considered the gold standard outcome measure in orthopaedic medicine, but their use is limited in real-world practice due to challenges with technology integration, the pace of clinic workflows, and patient compliance. Clinical notes generated during each encounter patients have with their physician contain rich information on current disease symptoms, rehabilitation progress, and unexpected complications. Artificial intelligence (AI) methods can be used to identify phrases of treatment success or failure captured in clinical notes and discern an indicator of treatment success for orthopaedic patients.</p>
</sec><sec><title>Methods</title>
<p>This was a cross-sectional analysis of clinical notes from a sample of patients with an acute shoulder injury. The study included adult patients presenting to a Level-1 Trauma Center and regional health system for an acute Proximal Humerus Fracture (PHF) between January 1, 2019 and December 31, 2021. We used the progress note from the office visit for PHF-related care (ICD10: S42.2XXX) or shoulder pain (ICD10: M45.2XXX) closest to 1-year after the injury date. Clinical notes were reviewed by an orthopaedic resident and labeled as treatment success or failure. A structured comparative analysis of classifiers including both machine and deep learning algorithms was performed.</p>
</sec><sec><title>Results</title>
<p>The final sample included 868 clinical notes from patients treated by 123 physicians across 35 departments within one regional health system. The study sample was stratified into 465 notes labeled as treatment success and 403 labeled as treatment failure. The Bio-ClinicalBERT model had the highest performance of 87&#x0025; accuracy (AUC&#x2009;&#x003D;&#x2009;0.87&#x2009;&#x00B1;&#x2009;0.04) in correctly distinguishing between treatment success and failure notes.</p>
</sec><sec><title>Discussion</title>
<p>Our results suggest that text classifiers applied to clinical notes are capable of differentiating patients with successful treatment outcomes with high levels of accuracy. This finding is encouraging, signaling that routinely collected clinical note content may serve as a data source to develop an outcome measure for orthopaedic patients.</p>
</sec>
</abstract>
<kwd-group>
<kwd>proximal humerus fractures</kwd>
<kwd>artificial intelligence</kwd>
<kwd>treatment outcomes</kwd>
<kwd>clinical text</kwd>
<kwd>natural language processing</kwd>
<kwd>electronic health record system</kwd>
</kwd-group><contract-sponsor id="cn001">Agency for Healthcare Research and Quality</contract-sponsor><counts>
<fig-count count="2"/>
<table-count count="3"/><equation-count count="0"/><ref-count count="72"/><page-count count="10"/><word-count count="0"/></counts><custom-meta-wrap><custom-meta><meta-name>section-at-acceptance</meta-name><meta-value>Health Informatics</meta-value></custom-meta></custom-meta-wrap>
</article-meta>
</front>
<body><sec id="s1" sec-type="intro"><title>Introduction</title>
<p>A readily available outcome measure that reflects the success of a patients&#x0027; treatment is needed to demonstrate the value of orthopaedic interventions (<xref ref-type="bibr" rid="B1">1</xref>&#x2013;<xref ref-type="bibr" rid="B4">4</xref>). PROMs are viewed as the gold standard outcome measure in orthopaedics (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>), and could be used to track improvements in patient status over time to assess whether a patient achieved their treatment goals (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B8">8</xref>). However, PROM collection in real-world practice has proven difficult due to challenges with technology integration, data collection disruptions to clinic workflows, and low patient compliance completing PROM questionnaires (<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B10">10</xref>). Most orthopaedic practices in the United States view the collection of PROMs as time consuming, cumbersome, and costly (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B11">11</xref>), and it is estimated that only half of orthopaedic practices collect PROMs (<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B12">12</xref>). Without widespread availability of PROMs, evaluating the success of orthopaedic treatments has been limited to process-based measures and end points such as survival and surgical complications, which can readily be found in structured fields in administrative data (<xref ref-type="bibr" rid="B4">4</xref>). Unfortunately, these data points paint an incomplete picture of a patient&#x0027;s medical experience and whether treatment was successful in achieving a patient&#x0027;s prioritized outcome goals (e.g., reduced pain, improved range of motion, return to sports or work, etc.) (<xref ref-type="bibr" rid="B13">13</xref>&#x2013;<xref ref-type="bibr" rid="B16">16</xref>). A crucial step to demonstrating if orthopaedic care achieves meaningful patient-specific improvement is to have outcome data available that measure if treatment was successful in achieving the outcome goals prioritized by patients.</p>
<p>Unstructured clinical notes represent untapped potential for evaluating the success of orthopaedic treatments for individual patients (<xref ref-type="bibr" rid="B17">17</xref>&#x2013;<xref ref-type="bibr" rid="B24">24</xref>). Clinical notes are generated for each encounter patients have with their physician. These notes contain rich information on current disease symptoms, rehabilitation progress, and unexpected complications, and captures an essence of the patient state that is not stored elsewhere in the Electronic Health Record (EHR) (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B25">25</xref>&#x2013;<xref ref-type="bibr" rid="B30">30</xref>). However, because these notes are in an unstructured format, they have not historically been thought of as a useful data source to develop consistent measures of patient treatment success. Applications of artificial intelligence (AI) and natural language processing (NLP) methods in healthcare are rapidly expanding, and have been used to identify similar patient groups with a defined set of clinical markers and symptoms, automate patient cohort selection, and develop predictive models (<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B31">31</xref>&#x2013;<xref ref-type="bibr" rid="B33">33</xref>). In orthopaedic medicine, NLP applications are been being deployed to solve a range of orthopaedic-related problems (<xref ref-type="bibr" rid="B34">34</xref>&#x2013;<xref ref-type="bibr" rid="B36">36</xref>). We proposed that NLP methods can be employed to identify phrases denoting treatment success or failure recorded in clinical notes, thereby discerning indicators of treatment success for orthopaedic patients.</p>
<p>Clinical notes are typically documented using a subjective, objective, assessment and plan (SOAP) format, where the subjective section of the progress note reflects the patient&#x0027;s story (the interim history since the last visit), told to and interpreted by the physician (<xref ref-type="bibr" rid="B28">28</xref>). The rest of the unstructured SOAP notes include physical findings (objective findings), medical reasoning (assessment), and patient care (the plan) and (<xref ref-type="bibr" rid="B37">37</xref>&#x2013;<xref ref-type="bibr" rid="B39">39</xref>) reveal distinct trajectories of patient outcomes after treatment (<xref ref-type="bibr" rid="B38">38</xref>, <xref ref-type="bibr" rid="B40">40</xref>). In successful cases the progress note documents the degree of improvement or relief experienced and reported by patients to their clinicians (<xref ref-type="bibr" rid="B30">30</xref>). Conversely when symptoms have not resolved, or when subsequent complications arise, these ongoing patient complaints and persistent treatment utilization are documented in the notes. Note content highlights symptoms and outcome dimensions, which are valued by patients and contribute to a patient&#x0027;s individual definition of success (<xref ref-type="bibr" rid="B41">41</xref>).</p>
<p>A patient-specific outcome measure is needed in orthopaedic medicine to assess if a patient&#x0027;s treatment goals were met and help demonstrate the value of orthopaedic treatments. The objective of this study was to develop a clinical text classifier, using different AI approaches, including traditional machine learning and deep learning, capable of identifying whether a patient achieved treatment success for a sample of patients receiving follow-up care for an acute proximal humerus fracture. Proximal humerus fracture (PHF) was chosen as a use case for testing this method of outcome generation because many different treatment options can be used for this injury and better outcome data are needed to guide future clinical decision-making for this condition (<xref ref-type="bibr" rid="B42">42</xref>&#x2013;<xref ref-type="bibr" rid="B45">45</xref>). To that end, we began by exploring the feasibility of generating an outcome measure from clinical notes by evaluating various AI-based text classifiers for patients treated for a PHF.</p>
</sec>
<sec id="s2" sec-type="methods"><title>Materials and methods</title>
<sec id="s2a"><title>Study sample</title>
<p>This was a cross-sectional analysis of clinical notes from a sample of patients with an acute PHF. The study included adult patients presenting to a Level-1 Trauma Center regional health system for an acute PHF between January 1, 2019 and December 31, 2021. The first visit for a patient for PHF during the study period was defined as the index visit. We then identified all health system encounters (hospital encounters, office visits, etc.) with a diagnosis of PHF or shoulder pain from the index PHF visit to 365 days after the index PHF visit and extracted the clinical note from the office visit for PHF-related care (ICD10: S42.2XXX) or shoulder pain (ICD10: M45.2XXX) closest to 1-year after the injury date. This resulted in one representative note per person. Patients were excluded from the study if they were less than 18 years of age, did not have at least one office visit with a diagnosis of PHF or shoulder pain that occurred 45 days or more days after the index visit, or if their last office visit was less than 500 characters, since smaller notes did not have the necessary sections for outcome information. We found that less than 1&#x0025; of the eligible sample had a note length less than 500 characters. A minimum of 45 days after index was used as this is the minimal time needed for healing of a PHF, prior to which, treatment success cannot be assessed. We randomly sampled 1,000 patients meeting these inclusion criteria, and after physician review of the sample, a total of 868 notes were used for this study. Additional exclusions after physician review included notes from patients receiving care for bilateral PHFs or notes that did not reflect care for PHF. This study was approved by the Prisma Health Institutional Review Board.</p>
</sec>
<sec id="s2b"><title>Data labeling process</title>
<p>The University of South Carolina Patient Engagement Studio brings together patients and caregivers, community groups, health system innovators, clinicians, and academic researchers to produce meaningful research that advances health research outcomes. The PES membership includes over 100 patients with diverse backgrounds and clinical experiences from across the United States trained to provide feedback and collaborate with research teams (<xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B47">47</xref>). The first author (S.F.) led three Patient Engagement Studio (PES) sessions to involve patients in the development of the definitions of treatment success. There is no one standard acceptable definition of treatment success, as it varies based upon patient lifestyle and desired goals (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B48">48</xref>). However, generally, the goal of orthopaedic treatment is to restore the function of the joint, minimize pain and maximize quality of life for patients after the injury. Together, the PES members and research team defined four outcome states and associated labels that described the range of positive and negative outcomes that could follow care for PHF. The outcome states, definitions, and note text indicators can be found in <xref ref-type="table" rid="T1">Table&#x00A0;1</xref>.</p>
<table-wrap id="T1" position="float"><label>Table 1</label>
<caption><p>Outcome labels and corresponding definition and indicators.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Outcome state</th>
<th valign="top" align="center">Definition</th>
<th valign="top" align="center">Indicators of outcome state found in clinical notes</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Treatment success</td>
<td valign="top" align="left">Treatment success occurs when a patient is able to resume desired activities, has a sufficient range of motion, and is in minimal/mild or no pain. After PHF it is possible for there to be some lingering motion limitations (patient may never return to 100&#x0025;) or minimal pain, but these issues should not require ongoing treatment or be prohibitive to their desired lifestyle or daily activities.</td>
<td valign="top" align="left">
<list list-type="simple">
<list-item><label>&#x2022;</label>
<p>Radiographic healing</p></list-item>
<list-item><label>&#x2022;</label>
<p>Making good progress/improvements with current treatment or stopping treatment</p></list-item>
<list-item><label>&#x2022;</label>
<p>Patient returns to work or play.</p></list-item>
<list-item><label>&#x2022;</label>
<p>No major complaints documented.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Only follow-up as needed</p></list-item>
</list></td>
</tr>
<tr>
<td valign="top" align="left">Improvement of condition</td>
<td valign="top" align="left">Improvement occurs when there is a record of some levels of pain or functional problems that are somewhat prohibitive to the patient&#x0027;s desired activities, but improvement is occurring. In these situations, physicians may continue to monitor patients, but do not alter care or treatment courses.</td>
<td valign="top" align="left">
<list list-type="simple">
<list-item><label>&#x2022;</label>
<p>Radiographic healing or signs of healing occurring.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Moderate loss of function or pain which interferes with desired activities, but no change in treatment.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Ongoing treatment and monitoring progress</p></list-item>
<list-item><label>&#x2022;</label>
<p>Return in 2&#x2013;6 weeks for repeat x-rays and re-check</p></list-item>
</list></td>
</tr>
<tr>
<td valign="top" align="left">Deterioration of condition</td>
<td valign="top" align="left">Deterioration occurs when there is a record of some levels of pain or functional problems that are becoming more prohibitive to the patient&#x0027;s desired activities. No real improvements are occurring, and physicians may escalate or alter care or treatment courses.</td>
<td valign="top" align="left">
<list list-type="simple">
<list-item><label>&#x2022;</label>
<p>Negative radiographic changes observed.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Moderate loss of function or pain which interferes with desired activities requiring a change in treatment.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Initiating or continuing treatment and monitoring progress.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Return in 2&#x2013;6 weeks for repeat x-rays and re-check.</p></list-item>
</list></td>
</tr>
<tr>
<td valign="top" align="left">Treatment Failure</td>
<td valign="top" align="left">Treatment failure occurs when the patient is experiencing significant pain or limitations and requires subsequent fracture-related care. Failing is occurring when patients are unable to resume desired activities and may include fracture sequelae, complications, or nonunion.</td>
<td valign="top" align="left">
<list list-type="simple">
<list-item><label>&#x2022;</label>
<p>Ongoing, persistent treatment (injections, surgeries) for symptoms related to PHF.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Unrelenting pain</p></list-item>
<list-item><label>&#x2022;</label>
<p>Surgical complications</p></list-item>
<list-item><label>&#x2022;</label>
<p>Loss of significant motion</p></list-item>
<list-item><label>&#x2022;</label>
<p>Extreme pain</p></list-item>
<list-item><label>&#x2022;</label>
<p>Fracture related sequelae (e.g., avascular necrosis)</p></list-item>
</list></td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Four orthopaedic residents, each with a minimum of 2 years of experience in orthopaedic medicine participated in the labeling of the clinical notes. Each orthopaedic resident received a 1-h training session on the note labels and definitions. Residents were instructed to label each note based on the outcome state reflected in the current visit and documented in the note. In addition to the outcome labels, orthopaedic residents had the option to select &#x201C;Indeterminant&#x2014;not enough content to label&#x201D; or flag a note for expert review. We assigned overlap in note review subsets, so that agreement could be assessed across residents. An attending orthopaedic surgeon, the Chair of Department of Orthopaedic Surgery, served as the final arbitrator when discordance occurred between residents&#x2019; labels or when expert review was requested. Each label provided by the Chair was viewed as the final label for that note.</p>
<p>REDCap (<xref ref-type="bibr" rid="B49">49</xref>) was used to organize and store notes and labels. Notes were truncated to 10,000 words and HTML tags were added for formatting to aid in the review process. The final labeled dataset produced by the orthopaedic residents represented the gold standard dataset used for model development and validation. The four outcome labels were aggregated into a binary outcome representing treatment success or failure. Treatment success was represented by notes labeled as success. Failure was comprised of all remaining labels (improvement, deterioration and failure) as each of those notes had documentation of lingering, symptomatic problems requiring ongoing care. This was done to avoid class imbalance between the treatment success and failure classes, since our data set had many more cases in the treatment success category compared to the remaining three unfavorable outcome categories.</p>
</sec>
<sec id="s2c"><title>Stratified data segmentation protocol</title>
<p>We maintained a consistent data division strategy to ensure a fair and unbiased comparison across all models, so 90&#x0025; of the data was allocated for model training, while the remaining unseen 10&#x0025; was reserved for testing. Within these partitions, we preserved the proportion of outcome labels observed in the full labeled data set. We used a five-fold cross-validation strategy to robustly measure the generalizability of all models. Moreover, due to the relatively small number of cases, we repeated the testing cycle 10 times through train and test data partitioning (<xref ref-type="fig" rid="F1">Figure&#x00A0;1</xref>). A critical aspect of our experimental design was ensuring fair model comparison by using identical data splits across all models within each run. For each of the ten experimental iterations, we created a single stratified train-test split that was subsequently used for all models being evaluated. This approach eliminates potential confounding effects from data partitioning and ensures that any observed performance differences can be attributed to the models themselves rather than to variations in training or testing data.</p>
<fig id="F1" position="float"><label>Figure 1</label>
<caption><p>AI model training and evaluation pipeline for treatment success measure assessment.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-07-1523953-g001.tif"/>
</fig>
</sec>
<sec id="s2d"><title>Bag-of-words based models</title>
<p>We tested the performance of several baseline classifiers that utilize a bag-of-words approach, primarily to provide a reference point for comparing more advanced modeling techniques. For these traditional machine learning models, we employed GridSearchCV with 5-fold cross-validation to systematically search for optimal hyperparameters. The text data were vectorized using term frequency-inverse document frequency (TF-IDF) (<xref ref-type="bibr" rid="B50">50</xref>) with parameters set to ignore terms appearing in more than 90&#x0025; of documents (max_df&#x2009;&#x003D;&#x2009;0.9), include terms appearing in at least 5 documents (min_df&#x2009;&#x003D;&#x2009;5), and incorporate both unigrams and bigrams [ngram_range&#x2009;&#x003D;&#x2009;(1,2)]. Text preprocessing was consistent across all models, involving lowercase conversion, special character removal (except for periods, numbers, and alphabets), whitespace normalization, and lemmatization for words longer than three characters. This approach preserved medical abbreviations that might be clinically significant while reducing vocabulary size and standardizing word forms.</p>
<p>After applying TF-IDF vectorization, we tested five distinct machine learning classifiers: Logistic Regression, with an inverse regularization strength (C) equal to 0.1; Support Vector Machine with Linear Kernel (<xref ref-type="bibr" rid="B51">51</xref>); Random Forest model with 200 trees, with each tree having a maximum depth of 10 and using &#x201C;entropy&#x201D; as the criterion for measuring the quality of splits (<xref ref-type="bibr" rid="B52">52</xref>); Gradient Boosting Classifier with 200 boosting stages and a learning rate of 0.01, implying effectiveness in gradual learning over numerous iterations (<xref ref-type="bibr" rid="B53">53</xref>); and XGBClassifier with 100 estimators, a learning rate of 0.01, a maximum tree depth of 4, and a subsample ratio of 0.9, indicating a preference for moderate complexity and high sample coverage in training (<xref ref-type="bibr" rid="B54">54</xref>).</p>
</sec>
<sec id="s2e"><title>Transformer-based classifiers</title>
<p>In this study, we adopted a family of transformer-based language models to analyze clinical note content, primarily because transformers utilize a multi-head self-attention mechanism that pinpoints how different words in a sequence relate to each other, even when they are far apart. This mechanism effectively captures non-linear contextual dependencies by allowing multiple &#x201C;heads&#x201D; to attend to different segments of the input in parallel, thereby highlighting important clinical cues that might not be locally adjacent. Of the transformer-based models (<xref ref-type="bibr" rid="B55">55</xref>), we used BERT (<xref ref-type="bibr" rid="B56">56</xref>), BioBERT (<xref ref-type="bibr" rid="B57">57</xref>), and Bio-ClinicalBERT (<xref ref-type="bibr" rid="B58">58</xref>), and to analyze note content. We selected BERT as our base architecture model due to its bidirectional training paradigm, which uses both preceding and succeeding words for context. Building upon BERT, BioBERT further refines the model with additional pre-training on domain-specific biomedical corpora, effectively incorporating specialized terminology. Similarly, Bio-ClinicalBERT further refines BioBERT by fine-tuning on the Medical Information Mart for Intensive Care (MIMIC-III) (<xref ref-type="bibr" rid="B59">59</xref>) clinical notes dataset to augment its capability in deciphering medical terminology and understanding complex clinical semantics. Each of our transformer-based models accepted a maximum of 512 tokens. We selected the last 512 tokens instead of the first 512 tokens based on our observation that later parts of the note typically contained the most-clinically relevant information about ongoing symptoms and necessary treatment or discharge from care.</p>
<p>For these transformer-based models, we employed a consistent training approach. Each model was trained for 8 epochs with a batch size of 8, using the AdamW optimizer (<xref ref-type="bibr" rid="B71">71</xref>) with a learning rate of 3&#x2009;&#x00D7;&#x2009;10<sup>&#x2212;5</sup> and epsilon of 1&#x2009;&#x00D7;&#x2009;10<sup>&#x2212;8</sup>. To optimize the learning rate schedule, we implemented a cosine annealing learning rate scheduler that gradually reduced the learning rate from the initial value to zero throughout the training process. We applied gradient clipping with a maximum norm of 1.0 to prevent exploding gradients during backpropagation. This technique helped stabilize the training process, particularly important for the fine-tuning of pre-trained language models on domain-specific data. The transformer-based models processed our common data splits through their respective tokenization pipelines, ensuring consistent evaluation across experimental runs.</p>
</sec>
<sec id="s2f"><title>Convolutional neural network classifier</title>
<p>We also tested the performance of Convolutional Neural Network (CNN)-based classifiers for textual data, primarily because CNNs excel at extracting localized patterns from sequences&#x2014;such as n-gram features&#x2014;by sliding convolutional filters over the embedded text (<xref ref-type="bibr" rid="B60">60</xref>). We first converted the text into integer sequences and right padded these to a fixed sequence length (<xref ref-type="bibr" rid="B61">61</xref>, <xref ref-type="bibr" rid="B62">62</xref>). Our CNN architecture was specifically designed for text classification, featuring an embedding layer followed by multiple parallel convolutional layers with varying filter sizes (<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B12">12</xref>) to capture different n-gram patterns in the text. Each convolutional layer utilized 200 filters and was connected to an adaptive max pooling layer. The architecture incorporated a three-layer fully connected network (200 units&#x2009;&#x2192;&#x2009;100 units&#x2009;&#x2192;&#x2009;1 unit) with ReLU activations and dropout (rate&#x2009;&#x003D;&#x2009;0.5) for regularization. The CNN model was trained for up to 50 epochs with early stopping (patience&#x2009;&#x003D;&#x2009;5) using the Adam optimizer with an initial learning rate of 0.001 and a step learning rate scheduler (step size&#x2009;&#x003D;&#x2009;5, gamma&#x2009;&#x003D;&#x2009;0.1). Unlike the transformer models, the CNN implementation used a custom tokenizer and a batch size of 16, which resulted in a different processing pipeline for the same underlying data splits.</p>
</sec>
<sec id="s2g"><title>Statistical analysis and model evaluation</title>
<p>Fleiss&#x0027; kappa statistics were used to assess the degree of agreement in note labels between orthopaedic residents. We used the benchmarks for agreement measures for categorical data as described by Landis and Koch, where 0.00&#x2013;0.20, 0.21&#x2013;0.40, 0.41&#x2013;0.60, 0.61&#x2013;0.80, and 0.81&#x2013;1.00 indicate poor, fair, moderate, substantial, and almost perfect agreement, respectively (<xref ref-type="bibr" rid="B63">63</xref>). Patient characteristics including patient age, sex, race, insurance status, fracture diagnosis, and visit characteristics were extracted from the EHR and used to asses differences in patient and visit characteristics associated with note labels. Analyses were performed with SAS (Cary, NC) version 15.2, R studio, and excel.</p>
<p>To evaluate the performance of each model on the binary outcome measure we evaluated the F1 score, sensitivity, specificity, positive and negative predictive value, and Area Under the Receiver Operating Characteristic Curve (AUC-ROC) metric. The AUC-ROC metric provides a single value that encapsulates the trade-off between the true positive rate and the false positive rate at various decision threshold levels. Model comparisons are displayed using ordered Box and Whisker plots where each box represents the interquartile range (IQR) for a specific model&#x0027;s AUC scores and data points represent outliers. To assess statistical significance between model performance, we conducted paired <italic>t</italic>-tests between models that shared identical data splits and unpaired <italic>t</italic>-tests (Welch&#x0027;s <italic>t</italic>-test) for comparisons involving the CNN model. Since the transformer-based and traditional machine learning models used identical data splits in each run, paired <italic>t</italic>-tests were appropriate for these comparisons. In contrast, due to the CNN model&#x0027;s different tokenization and processing pipeline, unpaired <italic>t</italic>-tests were necessary for comparing CNN with other models. A significance level of <italic>p</italic>&#x2009;&#x003C;&#x2009;0.05 was set.</p>
</sec>
</sec>
<sec id="s3" sec-type="results"><title>Results</title>
<sec id="s3a"><title>Progress note characteristics</title>
<p>The sample of 868 clinical notes came from patients treated by 123 physicians across 35 departments within one regional health system. The average age of the patient was 67.5 years of age and 80&#x0025; of the sample were female patients. Patients were primarily white (91&#x0025;) and enrolled in the Medicare system (64&#x0025;). The notes came from fracture-related encounters ranging from the 2nd to the 22nd encounter after the index PHF visit, with a mean of 4, representing the 4th PHF-related encounter. The note lengths ranged from 981 to 15,297 characters with a mean length of 4,961 characters.</p>
<p>The sample was stratified into 465 notes labeled as treatment success and 403 notes labeled as treatment failure. Patients experiencing treatment success did not differ from those labeled as treatment failure in age, sex, or race. Additionally, treatment success notes did not differ in time since index visit, or the number of PHF-related encounters. However, notes labeled as treatment success had a higher proportion of Medicare (65.8&#x0025; vs. 62.3&#x0025;) and commercially insured patients (23.4&#x0025; vs. 22.1&#x0025;), compared to notes labeled as treatment failure. Additionally, treatment success notes had a lower proportion of surgically treated patients (16.3&#x0025; vs. 24.3&#x0025;) than notes labeled as treatment failure. Treatment success notes were also significantly shorter in length (4,673 vs. 5,291 characters). <xref ref-type="table" rid="T2">Table&#x00A0;2</xref> contains sample characteristics by note label status.</p>
<table-wrap id="T2" position="float"><label>Table 2</label>
<caption><p>Sample characteristics by note label Status.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left" rowspan="3">Patient and note characteristics</th>
<th valign="top" align="center">Total sample</th>
<th valign="top" align="center">Treatment success notes</th>
<th valign="top" align="center">Treatment failure notes</th>
<th valign="top" align="center" rowspan="3"><italic>P</italic>-value</th>
</tr>
<tr>
<th valign="top" align="center"><italic>N</italic> (&#x0025;)</th>
<th valign="top" align="center"><italic>N</italic> (&#x0025;)</th>
<th valign="top" align="center"><italic>N</italic> (&#x0025;)</th>
</tr>
<tr>
<th valign="top" align="center"><italic>N</italic>&#x2009;&#x003D;&#x2009;868 (100)</th>
<th valign="top" align="center"><italic>N</italic>&#x2009;&#x003D;&#x2009;465 (53.4)</th>
<th valign="top" align="center"><italic>N</italic>&#x2009;&#x003D;&#x2009;403 (46.4)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Patient Age, Mean (SD)</td>
<td valign="top" align="center">67.5 (14.9)</td>
<td valign="top" align="center">68.1 (15.1)</td>
<td valign="top" align="center">66.8 (14.7)</td>
<td valign="top" align="center">0.19</td>
</tr>
<tr>
<td valign="top" align="left" colspan="4">Patient Sex, N (&#x0025;)</td>
<td valign="top" align="center" colspan="1">0.18</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Male</td>
<td valign="top" align="center">175 (20.2)</td>
<td valign="top" align="center">86 (18.5)</td>
<td valign="top" align="center">89 (22.1)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Female</td>
<td valign="top" align="center">693 (79.8)</td>
<td valign="top" align="center">379 (81.5)</td>
<td valign="top" align="center">314 (77.9)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left" colspan="4">Patient Race, N (&#x0025;)</td>
<td valign="top" align="center" colspan="1">0.68</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;White</td>
<td valign="top" align="center">791 (91.1)</td>
<td valign="top" align="center">427 (91.8)</td>
<td valign="top" align="center">364 (90.3)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Black</td>
<td valign="top" align="center">46 (5.3)</td>
<td valign="top" align="center">23 (4.9)</td>
<td valign="top" align="center">23 (5.7)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;American Indian, Alaskan, or Hawaiian</td>
<td valign="top" align="center">4 (1.0)</td>
<td valign="top" align="center">3 (0.6)</td>
<td valign="top" align="center">1 (0.2)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Hispanic</td>
<td valign="top" align="center">13 (1.5)</td>
<td valign="top" align="center">6 (1.3)</td>
<td valign="top" align="center">7 (1.7)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Asian</td>
<td valign="top" align="center">4 (0.5)</td>
<td valign="top" align="center">2 (0.4)</td>
<td valign="top" align="center">2 (0.5)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Other</td>
<td valign="top" align="center">10 (1.0)</td>
<td valign="top" align="center">4 (1.0)</td>
<td valign="top" align="center">6 (1.5)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left" colspan="4">Insurance Provider</td>
<td valign="top" align="center" colspan="1">0.04</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Medicare</td>
<td valign="top" align="center">557 (64)</td>
<td valign="top" align="center">306 (65.8)</td>
<td valign="top" align="center">251 (62.3)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Medicaid</td>
<td valign="top" align="center">37 (4.2)</td>
<td valign="top" align="center">16 (3.4)</td>
<td valign="top" align="center">21 (5.2)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Private</td>
<td valign="top" align="center">198 (23)</td>
<td valign="top" align="center">109 (23.4)</td>
<td valign="top" align="center">89 (22.1)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Other</td>
<td valign="top" align="center">70 (8.1)</td>
<td valign="top" align="center">34 (7.3)</td>
<td valign="top" align="center">36 (8.9)</td>
<td valign="top" align="center"/>
</tr>
<tr>
<td valign="top" align="left" colspan="5">Note Characteristics</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Days from Index, Mean (SD)</td>
<td valign="top" align="center">135 (79.9)</td>
<td valign="top" align="center">131.2 (72.0)</td>
<td valign="top" align="center">140.8 (87.8)</td>
<td valign="top" align="center">0.08</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;PHF-related encounter, Mean (SD)</td>
<td valign="top" align="center">4.4 (1.8)</td>
<td valign="top" align="center">4.4 (1.6)</td>
<td valign="top" align="center">4.5 (2.01)</td>
<td valign="top" align="center">0.26</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Patient treated surgically, N (&#x0025;)</td>
<td valign="top" align="center">174 (20)</td>
<td valign="top" align="center">76 (16.3)</td>
<td valign="top" align="center">98 (24.3)</td>
<td valign="top" align="center">&#x003C;0.01</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Note character length, Mean (SD)</td>
<td valign="top" align="center">4,961 (2,725)</td>
<td valign="top" align="center">4,673.4 (2,511.9)</td>
<td valign="top" align="center">5,294.1 (2,921.3)</td>
<td valign="top" align="center">&#x003C;0.001</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3b"><title>Orthopaedic resident agreement in note labeling</title>
<p>Each orthopaedic resident was assigned and labeled 268 notes with overlap in note assignment across orthopaedic residents. Interrater agreement for classification of clinical notes was moderate [pairwise percent agreement&#x2009;&#x003D;&#x2009;75.31&#x0025;, Fleiss&#x0027; <italic>&#x03BA;</italic>&#x2009;&#x003D;&#x2009;0.49 (95&#x0025; CI: 0.30&#x2013;0.68)].</p>
</sec>
<sec id="s3c"><title>Model performance metrics</title>
<p>&#x00A0;<xref ref-type="table" rid="T3">Table&#x00A0;3</xref> shows results for both machine and deep learning models explored in our analysis. The XGB Classifier model achieved the highest AUC score (0.84&#x2009;&#x00B1;&#x2009;0.03) among the bag-of-words models and the Bio-ClinicalBERT model had the highest AUC (0.87&#x2009;&#x00B1;&#x2009;0.04) among the deep learning models. Overall, the Bio-ClinicalBERT model had the highest performance (AUC&#x2009;&#x003D;&#x2009;0.87&#x2009;&#x00B1;&#x2009;0.04) in correctly distinguishing between treatment success and failure notes. <xref ref-type="table" rid="T3">Table&#x00A0;3</xref> shows complete performance metrics for machine and deep learning models and <xref ref-type="fig" rid="F2">Figure&#x00A0;2</xref> displays comparative model performance for all models.</p>
<table-wrap id="T3" position="float"><label>Table 3</label>
<caption><p>Performance metrics for Bag-of-word and deep learning models.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Model name</th>
<th valign="top" align="center">F1 score</th>
<th valign="top" align="center">Specificity</th>
<th valign="top" align="center">Sensitivity</th>
<th valign="top" align="center">Precision</th>
<th valign="top" align="center">NPV</th>
<th valign="top" align="center">AUC</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="7">Bag-of-words models</td>
</tr>
<tr>
<td valign="top" align="left">Logistic regression</td>
<td valign="top" align="center">0.70 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.64 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.82 (&#x00B1;0.04)</td>
<td valign="top" align="center">0.72 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.73 (&#x00B1;0.04)</td>
<td valign="top" align="center">0.80 (&#x00B1;0.03)</td>
</tr>
<tr>
<td valign="top" align="left">SVC</td>
<td valign="top" align="center">0.72 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.60 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.81 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.71 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.74 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.79 (&#x00B1;0.03)</td>
</tr>
<tr>
<td valign="top" align="left">Random forest</td>
<td valign="top" align="center">0.72 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.68 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.80 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.73 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.73 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.80 (&#x00B1;0.01)</td>
</tr>
<tr>
<td valign="top" align="left">Gradient boosting classifier</td>
<td valign="top" align="center">0.75 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.70 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.81 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.75 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.75 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.82 (&#x00B1;0.01)</td>
</tr>
<tr>
<td valign="top" align="left">XGBClassifier</td>
<td valign="top" align="center">0.75 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.70 (&#x00B1;0.06)</td>
<td valign="top" align="center">0.78 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.75 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.74 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.84 (&#x00B1;0.03)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="7">Deep learning models</td>
</tr>
<tr>
<td valign="top" align="left">BERT</td>
<td valign="top" align="center">0.76 (&#x00B1;0.08)</td>
<td valign="top" align="center">0.76 (&#x00B1;0.04)</td>
<td valign="top" align="center">0.75 (&#x00B1;0.06)</td>
<td valign="top" align="center">0.79 (&#x00B1;0.05)</td>
<td valign="top" align="center">0.72 (&#x00B1;0.08)</td>
<td valign="top" align="center">0.83 (&#x00B1;0.05)</td>
</tr>
<tr>
<td valign="top" align="left">BioBERT</td>
<td valign="top" align="center">0.75 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.71 (&#x00B1;0.07)</td>
<td valign="top" align="center">0.77 (&#x00B1;0.04)</td>
<td valign="top" align="center">0.77 (&#x00B1;0.05)</td>
<td valign="top" align="center">0.73 (&#x00B1;0.03)</td>
<td valign="top" align="center">0.81 (&#x00B1;0.03)</td>
</tr>
<tr>
<td valign="top" align="left">Bio-ClinicalBERT</td>
<td valign="top" align="center">0.77 (&#x00B1;0.04)</td>
<td valign="top" align="center">0.74 (&#x00B1;0.09)</td>
<td valign="top" align="center">0.80 (&#x00B1;0.04)</td>
<td valign="top" align="center">0.78 (&#x00B1;0.07)</td>
<td valign="top" align="center">0.76 (&#x00B1;0.02)</td>
<td valign="top" align="center">0.87 (&#x00B1;0.04)</td>
</tr>
<tr>
<td valign="top" align="left">CNN</td>
<td valign="top" align="center">0.73 (&#x00B1;0.09)</td>
<td valign="top" align="center">0.65 (&#x00B1;0.14)</td>
<td valign="top" align="center">0.77 (&#x00B1;0.07)</td>
<td valign="top" align="center">0.71 (&#x00B1;0.10)</td>
<td valign="top" align="center">0.69 (&#x00B1;0.11)</td>
<td valign="top" align="center">0.80 (&#x00B1;0.05)</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F2" position="float"><label>Figure 2</label>
<caption><p>AUC scores across deep learning and machine learning models.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-07-1523953-g002.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion"><title>Discussion</title>
<p>This study is the first to develop a clinical text classifier capable of identifying whether a patient achieved treatment success following care for an acute PHF. Our results suggest that AI, more specifically, text classification models in combination with clinical note text can be used to differentiate patients with good and bad treatment outcomes. This finding is encouraging, and it suggests that routine clinical note content may offer a solution to the much-needed problem of outcome data availability in orthopaedic medicine. This AI approach could translate to producing a widely available treatment outcome measure, which could be used for comparative effectiveness research studies and for the development of clinical quality metrics (<xref ref-type="bibr" rid="B64">64</xref>) to improve the quality of orthopaedic care.</p>
<p>A crucial step in demonstrating that orthopaedic care achieves meaningful patient-specific improvement is to have outcome data available that closely measures if treatment was successful in achieving the outcome goals prioritized by patients. However, a leading challenge in outcome measurement remains that orthopaedic outcomes are highly individualized and patient specific. This fact undermines the value of even the industry-wide standard PROMs, as PROM overall scores often assume equal weighting of outcome dimensions for all patients. Yet, as an example, patients may more heavily value pain reduction over range of motion, which would not be accurately reflected in summary PROM scores. In contrast, our approach and resulting measure is highly flexible and responsive to each individual patient&#x0027;s treatment goals. Orthopaedic-related encounters are highly focused on each patient and how musculoskeletal conditions and treatment affect outcome dimensions and a patient&#x0027;s quality of life. Each encounter is naturally tailored to the patient and their unique musculoskeletal needs, and physicians record goal achievements or challenges that are revealed through the encounter discussion, exam and treatment planning.</p>
<p>The applications of AI and NLP are rapidly expanding in medicine (<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B32">32</xref>, <xref ref-type="bibr" rid="B65">65</xref>, <xref ref-type="bibr" rid="B66">66</xref>) and orthopaedic medicine (<xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B34">34</xref>). Yet, our work is the first to use a text classifier to develop a binary measure of treatment success following care for an acute shoulder fracture. Recent studies have used similar methods to achieve related tasks. For example, Humbert-Droz et al., developed a NLP pipeline to extract documented PROMs from the EHR for patients with rheumatoid arthritis (<xref ref-type="bibr" rid="B24">24</xref>), and Zanotto et al., used NLP models to identify patient characteristics and health status PROMs (<xref ref-type="bibr" rid="B21">21</xref>). However, these studies differ from our approach in that they are still dependent upon the collection of PROM data during clinical care. Our approach offers advantages in that it does not require any additional data collection efforts on behalf of physicians, staff, or practice managers, as we know there are a myriad of challenges in collecting PROMs that may never be eliminated (<xref ref-type="bibr" rid="B10">10</xref>). Our approach is flexible and responsive with respect to the natural language typically recorded during the clinical encounter.</p>
<p>Our sample contained clinical notes from office visits for PHF-related care ranging from over 123 physicians across 35 departments within a regional health system. This finding signals that patients are receiving follow-up care for their PHFs from many different providers. While many of these visits were with an orthopaedic provider, this is an elderly patient population that regularly seeks care from primary care. Therefore, the diversity in providers and departments in our sample spans clinical notes authored by both orthopaedic and primary care physicians. This might signal that our approach is robust to notes beyond those authored just by orthopaedic physicians, to also include a variety of physicians that may discuss healing following orthopaedic treatment. Although there were not many differences observed between the characteristics of success and failure notes, we did find that treatment success notes were significantly shorter in length (4,673 vs. 5,291 characters) compared to treatment failure notes. This is not surprising, as good outcomes can be discussed and recorded more quickly and typically don&#x0027;t require ongoing treatment and related discussion and documentation. However, clinical documentation can be highly varied and more robust patient and visit characteristics should be assessed in future work to explore their relationship with clinical documentation and patient outcomes.</p>
<p>We found that of the models we tested, the Bio-ClinicalBERT model had the highest performance (AUC&#x2009;&#x003D;&#x2009;0.87&#x2009;&#x00B1;&#x2009;0.04) in correctly distinguishing between treatment success and failure notes. This finding was consistent with prior research, which has illustrated Bio-ClinicalBERT&#x0027;s enhanced capability in comprehending intricate medical terminologies and thematic elements inherent to clinical documentation compared to other models. In a similar study, Lee et al. also found that Bio-ClinicalBERT models performed well when identifying documented goals-of-care discussions within the EHR (<xref ref-type="bibr" rid="B22">22</xref>).</p>
<p>This work was the first study to develop a clinical text classifier capable of identifying whether a patient achieved treatment success following care for an acute PHF. Our ongoing work will continue to refine our approach to how to use clinical progress note content to form assessments of patient outcomes following orthopaedic treatment. Beyond validation and moving toward use in clinical practice, we envision the next step would be to consider integrating this measure with the EHR to support clinical decision support (CDS) use and quality reporting at the health system level. Development of this measure provides science at scale which enables unlimited comparative effectiveness studies across orthopaedic treatments and future tailored treatment decision making through CDS use to improve individual and population health.</p>
<p>This work is not without limitations. This was a relatively small feasibility study to assess if text classifiers could be applied to clinical notes to generate a measure of orthopaedic treatment success. Although we were successful in achieving an outcome measure with a high level of accuracy, we used a relatively small sample of patients with one shoulder condition. The patient sample we used lacked diversity, being primary female and white, and model performance should be assessed in more diverse patient samples to ensure unbiased model performance among patient subsets. Additionally, clinical note structure can vary significantly across physicians, medical specialties, and health systems. To inform the generalizability of our work, we must test our approach using multi-institutional data across a range of orthopaedic providers with variable documentation practices. Although we expect our approach would be generalizable to other orthopaedic conditions, we have not explored our methods in orthopaedic conditions beyond PHF. Future work will focus on applying our approach to acute and chronic orthopaedic conditions across adult and pediatric populations. Furthermore, the transformer-based models we adopted including BERT, BioBERT, and ClinicalBioBERT, are relatively limited in their parameter scope and the breadth of training data compared to more recent advancements in large language models (LLMs). These newer models, which boast significantly more parameters and have been trained on substantially larger datasets, may offer improved accuracy and better generalizability across diverse medical texts and clinical conditions. Exploring the application of LLMs in future studies could address some of the current limitations and provide a more robust tool for clinical text analysis.</p>
<p>As a next step for this work, we plan to assess the validity of our newly developed measure using PROMs or prospective patient follow-up. There are mixed reports of the accuracy of clinical note content, therefore we must evaluate if our measure accurately reflects a state of patient improvement or decline our new measure is reporting. However, multiple studies have found that healthcare professionals produce accurate documentation for concrete and overt symptoms, such as range of motion and impaired physical functioning (<xref ref-type="bibr" rid="B67">67</xref>&#x2013;<xref ref-type="bibr" rid="B70">70</xref>). Therefore, because of the highly focused nature of orthopaedic encounters and symptoms, we believe that clinical note content remains a valuable and valid source of data from which to develop an indicator of treatment success for patients (<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B38">38</xref>). Lastly, although we engaged patients in the development of outcome labels and the definition of treatment success, we ultimately used the physician perspective to develop the gold standard dataset labels of treatment success or failure. It is recognized that patients and physicians may differ in their definition of treatment success, therefore future work will explore incorporating patient perspectives into the definition of treatment success.</p>
</sec>
<sec id="s5" sec-type="conclusions"><title>Conclusions</title>
<p>We believe the development of an AI-based measure of treatment success using clinical notes may represent a paradigm shift in how outcomes are collected in orthopaedic medicine. Orthopaedic-related healthcare encounters are highly focused on the ways in which musculoskeletal treatments affect outcome priorities such as pain, range of motion, and patient&#x0027;s quality of life. This method, if widely adopted and implemented on clinical note content stored in the EHR could translate to widely available success measures which could be used to for comparative effectiveness research studies and for the development of clinical quality metrics (<xref ref-type="bibr" rid="B64">64</xref>) to improve the quality of orthopaedic care.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability"><title>Data availability statement</title>
<p>The data used in this analysis is not readily available because patient identifiers are contained in the dataset and they must remain stored in a HIPAA compliant location. Requests to access the datasets should be directed to <email>sbf@clemson.edu</email>.</p>
</sec>
<sec id="s7" sec-type="ethics-statement"><title>Ethics statement</title>
<p>The studies involving humans were approved by Institutional Review Board at Prisma Health. The studies were conducted in accordance with the local legislation and institutional requirements. The ethics committee/institutional review board waived the requirement of written informed consent for participation from the participants or the participants&#x0027; legal guardians/next of kin because because the research poses minimal risk, is non-interventional, and obtaining consent would be impractical.</p>
</sec>
<sec id="s8" sec-type="author-contributions"><title>Author contributions</title>
<p>SF: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing, Conceptualization, Data curation, Formal analysis, Funding acquisition, Investigation, Methodology, Project administration, Supervision. AA: Writing &#x2013; review &#x0026; editing, Data curation, Formal analysis, Methodology, Writing &#x2013; original draft. DS: Writing &#x2013; review &#x0026; editing, Data curation, Formal analysis, Methodology, Supervision, Writing &#x2013; original draft. BJ: Writing &#x2013; review &#x0026; editing, Data curation, Formal analysis, Writing &#x2013; original draft. CK: Writing &#x2013; review &#x0026; editing, Data curation, Formal analysis, Writing &#x2013; original draft. ZR: Writing &#x2013; review &#x0026; editing, Data curation, Methodology, Writing &#x2013; original draft. KJ: Writing &#x2013; review &#x0026; editing, Conceptualization, Data curation, Methodology, Supervision, Writing &#x2013; original draft. JO: Writing &#x2013; review &#x0026; editing, Conceptualization, Formal analysis, Investigation, Methodology, Project administration, Supervision, Writing &#x2013; original draft.</p>
</sec>
<sec id="s9" sec-type="funding-information"><title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work was supported by grant R03HS029060 from the Agency for Healthcare Research and Quality.</p>
</sec>
<sec id="s10" sec-type="COI-statement"><title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="ai-statement"><title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec id="s12" sec-type="disclaimer"><title>Publisher&#x0027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list><title>References</title>
<ref id="B1"><label>1.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jayakumar</surname><given-names>P</given-names></name><name><surname>Bozic</surname><given-names>KJ</given-names></name></person-group>. <article-title>Advanced decision-making using patient-reported outcome measures in total joint replacement</article-title>. <source>J Orthop Res</source>. (<year>2020</year>) <volume>38</volume>(<issue>7</issue>):<fpage>1414</fpage>&#x2013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.1002/jor.24614</pub-id><pub-id pub-id-type="pmid">31994752</pub-id></citation></ref>
<ref id="B2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Briffa</surname><given-names>N</given-names></name></person-group>. <article-title>The employment of patient-reported outcome measures to communicate the likely benefits of surgery</article-title>. <source>Patient Relat Outcome Meas</source>. (<year>2018</year>) <volume>9</volume>:<fpage>263</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.2147/PROM.S132746</pub-id><pub-id pub-id-type="pmid">30147385</pub-id></citation></ref>
<ref id="B3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Makhni</surname><given-names>EC</given-names></name></person-group>. <article-title>Meaningful clinical applications of patient-reported outcome measures in orthopaedics</article-title>. <source>J Bone Joint Surg Am</source>. (<year>2021</year>) <volume>103</volume>(<issue>1</issue>):<fpage>84</fpage>&#x2013;<lpage>91</lpage>. <pub-id pub-id-type="doi">10.2106/jbjs.20.00624</pub-id> (Accessed June 1, 2024).<pub-id pub-id-type="pmid">33079895</pub-id></citation></ref>
<ref id="B4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ayers</surname><given-names>D</given-names></name><name><surname>Bozic</surname><given-names>K</given-names></name></person-group>. <article-title>The importance of outcome measurement in orthopaedics</article-title>. <source>Clin Orthop Relat Res</source>. (<year>2013</year>) <volume>471</volume>(<issue>11</issue>):<fpage>3409</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1007/s11999-013-3224-z</pub-id><pub-id pub-id-type="pmid">23934032</pub-id></citation></ref>
<ref id="B5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gagnier</surname><given-names>J</given-names></name></person-group>. <article-title>Patient reported outcomes in orthopaedics</article-title>. <source>J Orthop Res</source>. (<year>2017</year>) <volume>35</volume>(<issue>10</issue>):<fpage>2098</fpage>&#x2013;<lpage>108</lpage>. <pub-id pub-id-type="doi">10.1002/jor.23604</pub-id><pub-id pub-id-type="pmid">28513993</pub-id></citation></ref>
<ref id="B6"><label>6.</label><citation citation-type="other"><collab>American Academy of Orthopaedic Surgeons</collab>. <article-title>Patient reported outcome measures</article-title>. (<year>2023</year>). <comment>Available at</comment>: <ext-link ext-link-type="uri" xlink:href="https://www.aaos.org/quality/research-resources/patient-reported-outcome-measures/performance-measures-by-orthopaedic-subspecialty/">https://www.aaos.org/quality/research-resources/patient-reported-outcome-measures/performance-measures-by-orthopaedic-subspecialty/</ext-link> <comment>(Accessed June 1, 2024).</comment></citation></ref>
<ref id="B7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Power</surname><given-names>JD</given-names></name><name><surname>Perruccio</surname><given-names>AV</given-names></name><name><surname>Canizares</surname><given-names>M</given-names></name><name><surname>McIntosh</surname><given-names>G</given-names></name><name><surname>Abraham</surname><given-names>E</given-names></name><name><surname>Attabib</surname><given-names>N</given-names></name><etal/></person-group> <article-title>Determining minimal clinically important difference estimates following surgery for degenerative conditions of the lumbar spine: analysis of the Canadian spine outcomes and research network (CSORN) registry</article-title>. <source>Spine J</source>. (<year>2023</year>) <volume>23</volume>(<issue>9</issue>):<fpage>1323</fpage>&#x2013;<lpage>33</lpage>. <pub-id pub-id-type="doi">10.1016/j.spinee.2023.05.001</pub-id><pub-id pub-id-type="pmid">37160168</pub-id></citation></ref>
<ref id="B8"><label>8.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Antosh</surname><given-names>IJ</given-names></name><name><surname>Svoboda</surname><given-names>SJ</given-names></name><name><surname>Peck</surname><given-names>KY</given-names></name><name><surname>Garcia</surname><given-names>EJ</given-names></name><name><surname>Cameron</surname><given-names>KL</given-names></name></person-group>. <article-title>Change in KOOS and WOMAC scores in a young athletic population with and without anterior cruciate ligament injury</article-title>. <source>Am J Sports Med</source>. (<year>2018</year>) <volume>46</volume>(<issue>7</issue>):<fpage>1606</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1177/0363546518768753</pub-id><pub-id pub-id-type="pmid">29733680</pub-id></citation></ref>
<ref id="B9"><label>9.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>DelPrete</surname><given-names>A.</given-names></name></person-group> <article-title>According to AAOE survey, only 35&#x0025; of orthopaedic practices are collecting PROMs</article-title> (<year>2017</year>). <comment>Available at:</comment> <ext-link ext-link-type="uri" xlink:href="https://www.aaoe.net/news/354456/According-to-AAOE-Survey-Only-35-of-Orthopaedic-Practices-are-Collecting-PROMs.htm">https://www.aaoe.net/news/354456/According-to-AAOE-Survey-Only-35-of-Orthopaedic-Practices-are-Collecting-PROMs.htm</ext-link> (Accessed June 1, 2024).</citation></ref>
<ref id="B10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nguyen</surname><given-names>H</given-names></name><name><surname>Butow</surname><given-names>P</given-names></name><name><surname>Dhillon</surname><given-names>H</given-names></name><name><surname>Sundaresan</surname><given-names>P</given-names></name></person-group>. <article-title>A review of the barriers to using patient-reported outcomes (PROs) and patient-reported outcome measures (PROMs) in routine cancer care</article-title>. <source>J Med Radiat Sci</source>. (<year>2021</year>) <volume>68</volume>(<issue>2</issue>):<fpage>186</fpage>&#x2013;<lpage>95</lpage>. <pub-id pub-id-type="doi">10.1002/jmrs.421</pub-id><pub-id pub-id-type="pmid">32815314</pub-id></citation></ref>
<ref id="B11"><label>11.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sisodia</surname><given-names>RC</given-names></name><name><surname>Dankers</surname><given-names>C</given-names></name><name><surname>Orav</surname><given-names>J</given-names></name><name><surname>Joseph</surname><given-names>B</given-names></name><name><surname>Meyers</surname><given-names>P</given-names></name><name><surname>Wright</surname><given-names>P</given-names></name><etal/></person-group> <article-title>Factors associated with increased collection of patient-reported outcomes within a large health care system</article-title>. <source>JAMA Network Open</source>. (<year>2020</year>) <volume>3</volume>(<issue>4</issue>):<fpage>e202764</fpage>. <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2020.2764</pub-id><pub-id pub-id-type="pmid">32286657</pub-id></citation></ref>
<ref id="B12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shapiro</surname><given-names>LM</given-names></name><name><surname>Spindler</surname><given-names>K</given-names></name><name><surname>Cunningham</surname><given-names>B</given-names></name><name><surname>Koh</surname><given-names>J</given-names></name></person-group>. <article-title>Patient-reported outcome measure collection and utilization: a survey of American academy of orthopaedic surgeons members</article-title>. <source>J Am Acad Orthop Surg</source>. (<year>2024</year>) <volume>32</volume>(<issue>3</issue>):<fpage>114</fpage>&#x2013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.5435/JAAOS-D-23-00879</pub-id><pub-id pub-id-type="pmid">38181401</pub-id></citation></ref>
<ref id="B13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Miller</surname><given-names>JM</given-names></name><name><surname>Velanovich</surname><given-names>V</given-names></name></person-group>. <article-title>The natural language of the surgeon&#x2019;s clinical note in outcomes assessment: a qualitative analysis of the medical record</article-title>. <source>Am J Surg</source>. (<year>2010</year>) <volume>199</volume>(<issue>6</issue>):<fpage>817</fpage>&#x2013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.1016/j.amjsurg.2009.06.037</pub-id><pub-id pub-id-type="pmid">20609725</pub-id></citation></ref>
<ref id="B14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Joarder</surname><given-names>I</given-names></name><name><surname>Taniguchi</surname><given-names>S</given-names></name><name><surname>Mendoza</surname><given-names>A</given-names></name><name><surname>Snow</surname><given-names>ME</given-names></name></person-group>. <article-title>Defining &#x201C;successful&#x201D; treatment outcomes in adolescent idiopathic scoliosis: a scoping review</article-title>. <source>Eur Spine J</source>. (<year>2023</year>) <volume>32</volume>(<issue>4</issue>):<fpage>1204</fpage>&#x2013;<lpage>44</lpage>. <pub-id pub-id-type="doi">10.1007/s00586-023-07592-w</pub-id><pub-id pub-id-type="pmid">36847911</pub-id></citation></ref>
<ref id="B15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Turcotte</surname><given-names>J</given-names></name><name><surname>Kelly</surname><given-names>M</given-names></name><name><surname>Lynch</surname><given-names>K</given-names></name><name><surname>Pipkin</surname><given-names>K</given-names></name><name><surname>Patton</surname><given-names>C</given-names></name></person-group>. <article-title>Patient goal-directed care in an orthopaedic spine specialty clinic</article-title>. <source>J Am Acad Orthop Surg</source>. (<year>2021</year>) <volume>29</volume>(<issue>17</issue>):<fpage>e880</fpage>&#x2013;<lpage>e7</lpage>. <pub-id pub-id-type="doi">10.5435/JAAOS-D-20-01105</pub-id><pub-id pub-id-type="pmid">34106092</pub-id></citation></ref>
<ref id="B16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Paradis</surname><given-names>BE</given-names></name><name><surname>Klein</surname><given-names>BJ</given-names></name><name><surname>Bartlett</surname><given-names>LE</given-names></name><name><surname>Cohn</surname><given-names>RM</given-names></name><name><surname>Bitterman</surname><given-names>AD</given-names></name></person-group>. <article-title>Goals of care discussions in orthopaedic surgery: geriatric hip fractures</article-title>. <source>J Arthroplasty</source>. (<year>2024</year>) <volume>39</volume>(<issue>5</issue>):<fpage>1144</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1016/j.arth.2024.03.001</pub-id><pub-id pub-id-type="pmid">38462140</pub-id></citation></ref>
<ref id="B17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shah</surname><given-names>RF</given-names></name><name><surname>Bini</surname><given-names>S</given-names></name><name><surname>Vail</surname><given-names>T</given-names></name></person-group>. <article-title>Data for registry and quality review can be retrospectively collected using natural language processing from unstructured charts of arthroplasty patients</article-title>. <source>Bone Joint J</source>. (<year>2020</year>) <volume>102-B</volume>(<issue>7 Suppl B</issue>):<fpage>99</fpage>&#x2013;<lpage>104</lpage>. <pub-id pub-id-type="doi">10.1302/0301-620X.102B7.BJJ-2019-1574.R1</pub-id><pub-id pub-id-type="pmid">32600201</pub-id></citation></ref>
<ref id="B18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martin-Sanchez</surname><given-names>F</given-names></name><name><surname>Verspoor</surname><given-names>K</given-names></name></person-group>. <article-title>Big data in medicine is driving big changes</article-title>. <source>Yearb Med Inform</source>. (<year>2014</year>) <volume>23</volume>(<issue>01</issue>):<fpage>14</fpage>&#x2013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.15265/IY-2014-0020</pub-id><pub-id pub-id-type="pmid">25123716</pub-id></citation></ref>
<ref id="B19"><label>19.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hashir</surname><given-names>M</given-names></name><name><surname>Sawhney</surname><given-names>R</given-names></name></person-group>. <article-title>Towards unstructured mortality prediction with free-text clinical notes</article-title>. <source>J Biomed Inform</source>. (<year>2020</year>) <volume>108</volume>:<fpage>103489</fpage>. <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103489</pub-id><pub-id pub-id-type="pmid">32592755</pub-id></citation></ref>
<ref id="B20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Murdoch</surname><given-names>TB</given-names></name><name><surname>Detsky</surname><given-names>AS</given-names></name></person-group>. <article-title>The inevitable application of big data to health care</article-title>. <source>Jama</source>. (<year>2013</year>) <volume>309</volume>(<issue>13</issue>):<fpage>1351</fpage>&#x2013;<lpage>2</lpage>. <pub-id pub-id-type="doi">10.1001/jama.2013.393</pub-id><pub-id pub-id-type="pmid">23549579</pub-id></citation></ref>
<ref id="B21"><label>21.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zanotto</surname><given-names>BS</given-names></name><name><surname>Beck da Silva Etges</surname><given-names>AP</given-names></name><name><surname>Dal Bosco</surname><given-names>A</given-names></name><name><surname>Cortes</surname><given-names>EG</given-names></name><name><surname>Ruschel</surname><given-names>R</given-names></name><name><surname>De Souza</surname><given-names>AC</given-names></name><etal/></person-group> <article-title>Stroke outcome measurements from electronic medical records: cross-sectional study on the effectiveness of neural and nonneural classifiers</article-title>. <source>JMIR Med Inform</source>. (<year>2021</year>) <volume>9</volume>(<issue>11</issue>):<fpage>e29120</fpage>. <pub-id pub-id-type="doi">10.2196/29120</pub-id><pub-id pub-id-type="pmid">34723829</pub-id></citation></ref>
<ref id="B22"><label>22.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname><given-names>RY</given-names></name><name><surname>Kross</surname><given-names>EK</given-names></name><name><surname>Torrence</surname><given-names>J</given-names></name><name><surname>Li</surname><given-names>KS</given-names></name><name><surname>Sibley</surname><given-names>J</given-names></name><name><surname>Cohen</surname><given-names>T</given-names></name><etal/></person-group> <article-title>Assessment of natural language processing of electronic health records to measure goals-of-care discussions as a clinical trial outcome</article-title>. <source>JAMA Network Open</source>. (<year>2023</year>) <volume>6</volume>(<issue>3</issue>):<fpage>e231204</fpage>. <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.1204</pub-id><pub-id pub-id-type="pmid">36862411</pub-id></citation></ref>
<ref id="B23"><label>23.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bovonratwet</surname><given-names>P</given-names></name><name><surname>Shen</surname><given-names>TS</given-names></name><name><surname>Islam</surname><given-names>W</given-names></name><name><surname>Ast</surname><given-names>MP</given-names></name><name><surname>Haas</surname><given-names>SB</given-names></name><name><surname>Su</surname><given-names>EP</given-names></name></person-group>. <article-title>Natural language processing of patient-experience comments after primary total knee arthroplasty</article-title>. <source>J Arthroplasty</source>. (<year>2021</year>) <volume>36</volume>(<issue>3</issue>):<fpage>927</fpage>&#x2013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1016/j.arth.2020.09.055</pub-id><pub-id pub-id-type="pmid">33127238</pub-id></citation></ref>
<ref id="B24"><label>24.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Humbert-Droz</surname><given-names>M</given-names></name><name><surname>Izadi</surname><given-names>Z</given-names></name><name><surname>Schmajuk</surname><given-names>G</given-names></name><name><surname>Gianfrancesco</surname><given-names>M</given-names></name><name><surname>Baker</surname><given-names>MC</given-names></name><name><surname>Yazdany</surname><given-names>J</given-names></name><etal/></person-group> <article-title>Development of a natural language processing system for extracting rheumatoid arthritis outcomes from clinical notes using the national rheumatology informatics system for effectiveness registry</article-title>. <source>Arthritis Care Res (Hoboken)</source>. (<year>2023</year>) <volume>75</volume>(<issue>3</issue>):<fpage>608</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1002/acr.24869</pub-id><pub-id pub-id-type="pmid">35157365</pub-id></citation></ref>
<ref id="B25"><label>25.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Assale</surname><given-names>M</given-names></name><name><surname>Dui</surname><given-names>LG</given-names></name><name><surname>Cina</surname><given-names>A</given-names></name><name><surname>Seveso</surname><given-names>A</given-names></name><name><surname>Cabitza</surname><given-names>F</given-names></name></person-group>. <article-title>The revival of the notes field: leveraging the unstructured content in electronic health records</article-title>. <source>Front Med (Lausanne)</source>. (<year>2019</year>) <volume>6</volume>:<fpage>66</fpage>. <pub-id pub-id-type="doi">10.3389/fmed.2019.00066</pub-id></citation></ref>
<ref id="B26"><label>26.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hanson</surname><given-names>JL</given-names></name><name><surname>Stephens</surname><given-names>MB</given-names></name><name><surname>Pangaro</surname><given-names>LN</given-names></name><name><surname>Gimbel</surname><given-names>RW</given-names></name></person-group>. <article-title>Quality of outpatient clinical notes: a stakeholder definition derived through qualitative research</article-title>. <source>BMC Health Serv Res</source>. (<year>2012</year>) <volume>12</volume>:<fpage>407</fpage>. <pub-id pub-id-type="doi">10.1186/1472-6963-12-407</pub-id><pub-id pub-id-type="pmid">23164470</pub-id></citation></ref>
<ref id="B27"><label>27.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Podder</surname><given-names>V</given-names></name><name><surname>Lew</surname><given-names>V</given-names></name><name><surname>Ghassemzadeh</surname><given-names>S</given-names></name></person-group>. <source>SOAP Notes</source>. <publisher-loc>Treasure Island, FL</publisher-loc>: <publisher-name>StatPearls Publishing</publisher-name> (<year>2021</year>).</citation></ref>
<ref id="B28"><label>28.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Hunter</surname><given-names>KM</given-names></name></person-group>. <source>Doctors&#x2019; Stories: The Narrative Structure of Medical Knowledge</source>. <publisher-loc>Princeton, N.J.</publisher-loc>: <publisher-name>Princeton Univ. Press</publisher-name> (<year>1993</year>).</citation></ref>
<ref id="B29"><label>29.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Raghupathi</surname><given-names>W</given-names></name><name><surname>Raghupathi</surname><given-names>V</given-names></name></person-group>. <article-title>Big data analytics in healthcare: promise and potential</article-title>. <source>Health Inf Sci Syst</source>. (<year>2014</year>) <volume>2</volume>:<fpage>3</fpage>. <pub-id pub-id-type="doi">10.1186/2047-2501-2-3</pub-id><pub-id pub-id-type="pmid">25825667</pub-id></citation></ref>
<ref id="B30"><label>30.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Resnik</surname><given-names>P</given-names></name><name><surname>Niv</surname><given-names>M</given-names></name><name><surname>Nossal</surname><given-names>M</given-names></name><name><surname>Kapit</surname><given-names>A</given-names></name><name><surname>Toren</surname><given-names>R</given-names></name></person-group>. <article-title>Communication of clinically relevant information in electronic health records: a comparison between structured data and unrestricted physician language</article-title>. <source>Perspect Health Inform Manag</source>. (<year>2008</year>) <volume>2008</volume>:<fpage>1</fpage>&#x2013;<lpage>10</lpage>.</citation></ref>
<ref id="B31"><label>31.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Obeid</surname><given-names>J</given-names></name><name><surname>Weeda</surname><given-names>E</given-names></name><name><surname>Matuskowitz</surname><given-names>A</given-names></name><name><surname>Gagnon</surname><given-names>K</given-names></name><name><surname>Crawford</surname><given-names>T</given-names></name><name><surname>Carr</surname><given-names>C</given-names></name><etal/></person-group> <article-title>Automated detection of altered mental status in emergency department clinical notes: a deep learning approach</article-title>. <source>BMC Med Inform Decis Mak</source>. (<year>2019</year>) <volume>19</volume>(<issue>1</issue>):<fpage>164</fpage>. <pub-id pub-id-type="doi">10.1186/s12911-019-0894-9</pub-id><pub-id pub-id-type="pmid">31426779</pub-id></citation></ref>
<ref id="B32"><label>32.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kreimeyer</surname><given-names>K</given-names></name><name><surname>Foster</surname><given-names>M</given-names></name><name><surname>Pandey</surname><given-names>A</given-names></name><name><surname>Arya</surname><given-names>N</given-names></name><name><surname>Halford</surname><given-names>G</given-names></name><name><surname>Jones</surname><given-names>SF</given-names></name><etal/></person-group> <article-title>Natural language processing systems for capturing and standardizing unstructured clinical information: a systematic review</article-title>. <source>J Biomed Inform</source>. (<year>2017</year>) <volume>73</volume>:<fpage>14</fpage>&#x2013;<lpage>29</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbi.2017.07.012</pub-id><pub-id pub-id-type="pmid">28729030</pub-id></citation></ref>
<ref id="B33"><label>33.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>Y</given-names></name><name><surname>Wang</surname><given-names>L</given-names></name><name><surname>Rastegar-Mojarad</surname><given-names>M</given-names></name><name><surname>Moon</surname><given-names>S</given-names></name><name><surname>Shen</surname><given-names>F</given-names></name><name><surname>Afzal</surname><given-names>N</given-names></name><etal/></person-group> <article-title>Clinical information extraction applications: a literature review</article-title>. <source>J Biomed Inform</source>. (<year>2018</year>) <volume>77</volume>:<fpage>34</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbi.2017.11.011</pub-id><pub-id pub-id-type="pmid">29162496</pub-id></citation></ref>
<ref id="B34"><label>34.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>AlShehri</surname><given-names>Y</given-names></name><name><surname>Sidhu</surname><given-names>A</given-names></name><name><surname>Lakshmanan</surname><given-names>LVS</given-names></name><name><surname>Lefaivre</surname><given-names>KA</given-names></name></person-group>. <article-title>Applications of natural language processing for automated clinical data analysis in orthopaedics</article-title>. <source>J Am Acad Orthop Surg</source>. (<year>2024</year>) <volume>32</volume>(<issue>10</issue>):<fpage>439</fpage>&#x2013;<lpage>46</lpage>. <pub-id pub-id-type="doi">10.5435/JAAOS-D-23-00839</pub-id><pub-id pub-id-type="pmid">38626429</pub-id></citation></ref>
<ref id="B35"><label>35.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sasanelli</surname><given-names>F</given-names></name><name><surname>Le</surname><given-names>KDR</given-names></name><name><surname>Tay</surname><given-names>SBP</given-names></name><name><surname>Tran</surname><given-names>P</given-names></name><name><surname>Verjans</surname><given-names>JW</given-names></name></person-group>. <article-title>Applications of natural language processing tools in orthopaedic surgery: a scoping review</article-title>. <source>Appl Sci</source>. (<year>2023</year>) <volume>13</volume>(<issue>20</issue>):<fpage>11586</fpage>. <pub-id pub-id-type="doi">10.3390/app132011586</pub-id></citation></ref>
<ref id="B36"><label>36.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thirukumaran</surname><given-names>CP</given-names></name><name><surname>Zaman</surname><given-names>A</given-names></name><name><surname>Rubery</surname><given-names>PT</given-names></name><name><surname>Calabria</surname><given-names>C</given-names></name><name><surname>Li</surname><given-names>Y</given-names></name><name><surname>Ricciardi</surname><given-names>BF</given-names></name><etal/></person-group> <article-title>Natural language processing for the identification of surgical site infections in orthopaedics</article-title>. <source>J Bone Joint Surg Am</source>. (<year>2019</year>) <volume>101</volume>(<issue>24</issue>):<fpage>2167</fpage>&#x2013;<lpage>74</lpage>. <pub-id pub-id-type="doi">10.2106/JBJS.19.00661</pub-id><pub-id pub-id-type="pmid">31596819</pub-id></citation></ref>
<ref id="B37"><label>37.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Varpio</surname><given-names>L</given-names></name><name><surname>Rashotte</surname><given-names>J</given-names></name><name><surname>Day</surname><given-names>K</given-names></name><name><surname>King</surname><given-names>J</given-names></name><name><surname>Kuziemsky</surname><given-names>C</given-names></name><name><surname>Parush</surname><given-names>A</given-names></name></person-group>. <article-title>The EHR and building the patient&#x2019;s story: a qualitative investigation of how EHR use obstructs a vital clinical activity</article-title>. <source>Int J Med Inf</source>. (<year>2015</year>) <volume>84</volume>(<issue>12</issue>):<fpage>1019</fpage>&#x2013;<lpage>28</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2015.09.004</pub-id><pub-id pub-id-type="pmid">26432683</pub-id></citation></ref>
<ref id="B38"><label>38.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Boag</surname><given-names>W</given-names></name><name><surname>Doss</surname><given-names>D</given-names></name><name><surname>Naumann</surname><given-names>T</given-names></name><name><surname>Szolovits</surname><given-names>P</given-names></name></person-group>. <article-title>What&#x2019;s in a note? Unpacking predictive value in clinical note representations</article-title>. <source>AMIA Jt Summits Transl Sci Proc</source>. (<year>2018</year>) <volume>2018</volume>:<fpage>26</fpage>&#x2013;<lpage>34</lpage>.</citation></ref>
<ref id="B39"><label>39.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vest</surname><given-names>JR</given-names></name><name><surname>Grannis</surname><given-names>SJ</given-names></name><name><surname>Haut</surname><given-names>DP</given-names></name><name><surname>Halverson</surname><given-names>PK</given-names></name><name><surname>Menachemi</surname><given-names>N</given-names></name></person-group>. <article-title>Using structured and unstructured data to identify patients&#x2019; need for services that address the social determinants of health</article-title>. <source>Int J Med Inform</source>. (<year>2017</year>) <volume>107</volume>:<fpage>101</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2017.09.008</pub-id><pub-id pub-id-type="pmid">29029685</pub-id></citation></ref>
<ref id="B40"><label>40.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carrell</surname><given-names>DS</given-names></name><name><surname>Schoen</surname><given-names>RE</given-names></name><name><surname>Leffler</surname><given-names>DA</given-names></name><name><surname>Morris</surname><given-names>M</given-names></name><name><surname>Rose</surname><given-names>S</given-names></name><name><surname>Baer</surname><given-names>A</given-names></name><etal/></person-group> <article-title>Challenges in adapting existing clinical natural language processing systems to multiple, diverse health care settings</article-title>. <source>J Am Med Inform Assoc</source>. (<year>2017</year>) <volume>24</volume>(<issue>5</issue>):<fpage>986</fpage>&#x2013;<lpage>91</lpage>. <pub-id pub-id-type="doi">10.1093/jamia/ocx039</pub-id><pub-id pub-id-type="pmid">28419261</pub-id></citation></ref>
<ref id="B41"><label>41.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bayley</surname><given-names>KB</given-names></name><name><surname>London</surname><given-names>MR</given-names></name><name><surname>Grunkemeier</surname><given-names>GL</given-names></name><name><surname>Lansky</surname><given-names>DJ</given-names></name></person-group>. <article-title>Measuring the success of treatment in patient terms</article-title>. <source>Med Care</source>. (<year>1995</year>) <volume>33</volume>(<issue>4 Suppl</issue>):<fpage>As226</fpage>&#x2013;<lpage>35</lpage>.<pub-id pub-id-type="pmid">7723451</pub-id></citation></ref>
<ref id="B42"><label>42.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Davey</surname><given-names>MS</given-names></name><name><surname>Hurley</surname><given-names>ET</given-names></name><name><surname>Anil</surname><given-names>U</given-names></name><name><surname>Condren</surname><given-names>S</given-names></name><name><surname>Kearney</surname><given-names>J</given-names></name><name><surname>O&#x0027;Tuile</surname><given-names>C</given-names></name><etal/></person-group> <article-title>Management options for proximal humerus fractures&#x2014;a systematic review &#x0026; network meta-analysis of randomized control trials</article-title>. <source>Injury</source>. (<year>2022</year>) <volume>53</volume>(<issue>2</issue>):<fpage>244</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1016/j.injury.2021.12.022</pub-id><pub-id pub-id-type="pmid">34974908</pub-id></citation></ref>
<ref id="B43"><label>43.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Patel</surname><given-names>AH</given-names></name><name><surname>Wilder</surname><given-names>JH</given-names></name><name><surname>Ofa</surname><given-names>SA</given-names></name><name><surname>Lee</surname><given-names>OC</given-names></name><name><surname>Savoie</surname><given-names>FH</given-names></name><name><surname>Brien</surname><given-names>O</given-names></name><etal/></person-group> <article-title>Trending a decade of proximal humerus fracture management in older adults</article-title>. <source>JSES International</source>. (<year>2022</year>) <volume>6</volume>(<issue>1</issue>):<fpage>137</fpage>&#x2013;<lpage>43</lpage>. <pub-id pub-id-type="doi">10.1016/j.jseint.2021.08.006</pub-id><pub-id pub-id-type="pmid">35141688</pub-id></citation></ref>
<ref id="B44"><label>44.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baker</surname><given-names>HP</given-names></name><name><surname>Gutbrod</surname><given-names>J</given-names></name><name><surname>Strelzow</surname><given-names>JA</given-names></name><name><surname>Maassen</surname><given-names>NH</given-names></name><name><surname>Shi</surname><given-names>L</given-names></name></person-group>. <article-title>Management of proximal humerus fractures in adults&#x2014;a scoping review</article-title>. <source>J Clin Med</source>. (<year>2022</year>) <volume>11</volume>(<issue>20</issue>):<fpage>6140</fpage>. <pub-id pub-id-type="doi">10.3390/jcm11206140</pub-id><pub-id pub-id-type="pmid">36294459</pub-id></citation></ref>
<ref id="B45"><label>45.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hao</surname><given-names>KA</given-names></name><name><surname>Patch</surname><given-names>DA</given-names></name><name><surname>Reed</surname><given-names>LA</given-names></name><name><surname>Spitler</surname><given-names>CA</given-names></name><name><surname>Horneff</surname><given-names>JG</given-names></name><name><surname>Ahn</surname><given-names>J</given-names></name><etal/></person-group> <article-title>Factors influencing surgical management of proximal humerus fractures: do shoulder and trauma surgeons differ?</article-title> <source>J Shoulder Elbow Surg</source>. (<year>2022</year>) <volume>31</volume>(<issue>6</issue>):<fpage>e259</fpage>&#x2013;<lpage>69</lpage>. <pub-id pub-id-type="doi">10.1016/j.jse.2021.11.016</pub-id><pub-id pub-id-type="pmid">34973423</pub-id></citation></ref>
<ref id="B46"><label>46.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kennedy</surname><given-names>AB</given-names></name><name><surname>Mitcham</surname><given-names>A</given-names></name><name><surname>Parris</surname><given-names>K</given-names></name><name><surname>Albertson</surname><given-names>F</given-names></name><name><surname>Sanchez Ferrer</surname><given-names>L</given-names></name><name><surname>O&#x0027;Boyle</surname><given-names>C</given-names></name><etal/></person-group> <article-title>Wonderings to research questions: engaging patients in long COVID research prioritization within a learning health system</article-title>. <source>Learn Health Syst</source>. (<year>2024</year>) <volume>8</volume>(<issue>S1</issue>):<fpage>e10410</fpage>. <pub-id pub-id-type="doi">10.1002/lrh2.10410</pub-id><pub-id pub-id-type="pmid">38883877</pub-id></citation></ref>
<ref id="B47"><label>47.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Natafgi</surname><given-names>N</given-names></name><name><surname>Parris</surname><given-names>K</given-names></name><name><surname>Walker</surname><given-names>E</given-names></name><name><surname>Gartner</surname><given-names>T</given-names></name><name><surname>Coffin</surname><given-names>J</given-names></name><name><surname>Mitcham</surname><given-names>A</given-names></name><etal/></person-group> <article-title>Through their eyes: using photovoice to capture the capacity-building journey of long COVID patient experts</article-title>. <source>Health Expect</source>. (<year>2024</year>) <volume>27</volume>(<issue>6</issue>):<fpage>e70094</fpage>. <pub-id pub-id-type="doi">10.1111/hex.70094</pub-id><pub-id pub-id-type="pmid">39529266</pub-id></citation></ref>
<ref id="B48"><label>48.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wright</surname><given-names>AA</given-names></name><name><surname>Hensley</surname><given-names>CP</given-names></name><name><surname>Gilbertson</surname><given-names>J</given-names></name><name><surname>Leland</surname><given-names>JM</given-names><suffix>III</suffix></name><name><surname>Jackson</surname><given-names>S</given-names></name></person-group>. <article-title>Defining patient acceptable symptom state thresholds for commonly used patient reported outcomes measures in general orthopedic practice</article-title>. <source>Man Ther</source>. (<year>2015</year>) <volume>20</volume>(<issue>6</issue>):<fpage>814</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1016/j.math.2015.03.011</pub-id><pub-id pub-id-type="pmid">25843266</pub-id></citation></ref>
<ref id="B49"><label>49.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Harris</surname><given-names>PA</given-names></name><name><surname>Taylor</surname><given-names>R</given-names></name><name><surname>Thielke</surname><given-names>R</given-names></name><name><surname>Payne</surname><given-names>J</given-names></name><name><surname>Gonzalez</surname><given-names>N</given-names></name><name><surname>Conde</surname><given-names>JG</given-names></name></person-group>. <article-title>Research electronic data capture (REDCap)&#x2013;a metadata-driven methodology and workflow process for providing translational research informatics support</article-title>. <source>J Biomed Inform</source>. (<year>2009</year>) <volume>42</volume>(<issue>2</issue>):<fpage>377</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbi.2008.08.010</pub-id><pub-id pub-id-type="pmid">18929686</pub-id></citation></ref>
<ref id="B50"><label>50.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Manning</surname><given-names>CD</given-names></name><name><surname>Sch&#x00FC;tze</surname><given-names>H</given-names></name><name><surname>Raghavan</surname><given-names>P</given-names></name></person-group>. <source>Introduction to Information Retrieval</source>. <publisher-loc>Cambridge, USA</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name> (<year>2008</year>).</citation></ref>
<ref id="B51"><label>51.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Ma</surname><given-names>Y</given-names></name><name><surname>Guo</surname><given-names>G</given-names></name></person-group>, editors. <source>Support Vector Machines Applications</source>. <publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2014</year>).</citation></ref>
<ref id="B52"><label>52.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Breiman</surname><given-names>L</given-names></name></person-group>. <article-title>Random forests</article-title>. <source>Mach Learn</source>. (<year>2001</year>) <volume>45</volume>(<issue>1</issue>):<fpage>5</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id></citation></ref>
<ref id="B53"><label>53.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Klug</surname><given-names>M</given-names></name><name><surname>Barash</surname><given-names>Y</given-names></name><name><surname>Bechler</surname><given-names>S</given-names></name><name><surname>Resheff</surname><given-names>YS</given-names></name><name><surname>Tron</surname><given-names>T</given-names></name><name><surname>Ironi</surname><given-names>A</given-names></name><etal/></person-group> <article-title>A gradient boosting machine learning model for predicting early mortality in the emergency department triage: devising a nine-point triage score</article-title>. <source>J Gen Intern Med</source>. (<year>2020</year>) <volume>35</volume>(<issue>1</issue>):<fpage>220</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1007/s11606-019-05512-7</pub-id><pub-id pub-id-type="pmid">31677104</pub-id></citation></ref>
<ref id="B54"><label>54.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Inoue</surname><given-names>T</given-names></name><name><surname>Ichikawa</surname><given-names>D</given-names></name><name><surname>Ueno</surname><given-names>T</given-names></name><name><surname>Cheong</surname><given-names>M</given-names></name><name><surname>Inoue</surname><given-names>T</given-names></name><name><surname>Whetstone</surname><given-names>WD</given-names></name><etal/></person-group> <article-title>XGBoost, a machine learning method, predicts neurological recovery in patients with cervical spinal cord injury</article-title>. <source>Neurotrauma Rep</source>. (<year>2020</year>) <volume>1</volume>(<issue>1</issue>):<fpage>8</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1089/neur.2020.0009</pub-id><pub-id pub-id-type="pmid">34223526</pub-id></citation></ref>
<ref id="B55"><label>55.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vaswani</surname><given-names>A</given-names></name><name><surname>Shazeer</surname><given-names>N</given-names></name><name><surname>Parmar</surname><given-names>N</given-names></name><name><surname>Uszkoreit</surname><given-names>J</given-names></name><name><surname>Jones</surname><given-names>L</given-names></name><name><surname>Gomez</surname><given-names>AN</given-names></name><etal/></person-group> <article-title>Attention is all you need</article-title>. In: <source>Proceedings of the 31st International Conference on Neural Information Processing Systems</source>. <publisher-loc>Red Hook, NY</publisher-loc>: <publisher-name>Curran Associates Inc.</publisher-name> (<year>2017</year>). p. <fpage>6000</fpage>&#x2013;<lpage>10</lpage>.</citation></ref>
<ref id="B56"><label>56.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Devlin</surname><given-names>J</given-names></name><name><surname>Chang</surname><given-names>MW</given-names></name><name><surname>Lee</surname><given-names>K</given-names></name><name><surname>Toutanova</surname><given-names>K</given-names></name></person-group>. <article-title>Bert: pre-training of deep bidirectional transformers for language understanding</article-title>. In: <person-group person-group-type="editor"><name><surname>Burstein</surname><given-names>J</given-names></name><name><surname>Doran</surname><given-names>C</given-names></name><name><surname>Solorio</surname><given-names>T</given-names></name></person-group>, editors. <source>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers)</source>. <publisher-loc>Minneapolis, MN</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name> (<year>2019</year>). p. <fpage>4171</fpage>&#x2013;<lpage>86</lpage>.</citation></ref>
<ref id="B57"><label>57.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname><given-names>J</given-names></name><name><surname>Yoon</surname><given-names>W</given-names></name><name><surname>Kim</surname><given-names>S</given-names></name><name><surname>Kim</surname><given-names>D</given-names></name><name><surname>Kim</surname><given-names>S</given-names></name><name><surname>So</surname><given-names>CH</given-names></name><etal/></person-group> <article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title>. <source>Bioinformatics</source>. (<year>2019</year>) <volume>36</volume>(<issue>4</issue>):<fpage>1234</fpage>&#x2013;<lpage>40</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id></citation></ref>
<ref id="B58"><label>58.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alsentzer</surname><given-names>E</given-names></name><name><surname>Murphy</surname><given-names>JR</given-names></name><name><surname>Boag</surname><given-names>W</given-names></name><name><surname>Weng</surname><given-names>WH</given-names></name><name><surname>Jin</surname><given-names>D</given-names></name><name><surname>Naumann</surname><given-names>T</given-names></name><etal/></person-group> <article-title>Publicly available clinical BERT embeddings</article-title>. <comment><italic>arXiv</italic> [Preprint]. <italic>arXiv:1904.03323</italic></comment> (<year>2019</year>). <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1904.03323">https://arxiv.org/abs/1904.03323</ext-link> (Accessed December 3, 2023)</comment>.</citation></ref>
<ref id="B59"><label>59.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Johnson</surname><given-names>AEW</given-names></name><name><surname>Pollard</surname><given-names>TJ</given-names></name><name><surname>Shen</surname><given-names>L</given-names></name><name><surname>Lehman</surname><given-names>L-w</given-names></name><name><surname>Feng</surname><given-names>M</given-names></name><name><surname>Ghassemi</surname><given-names>M</given-names></name><etal/></person-group> <article-title>MIMIC-III, a freely accessible critical care database</article-title>. <source>Sci Data</source>. (<year>2016</year>) <volume>3</volume>(<issue>1</issue>):<fpage>160035</fpage>. <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id><pub-id pub-id-type="pmid">27219127</pub-id></citation></ref>
<ref id="B60"><label>60.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>Y</given-names></name><name><surname>Wallace</surname><given-names>B</given-names></name></person-group>. <article-title>A sensitivity analysis of (and practitioners&#x0027; guide to) convolutional neural networks for sentence classification</article-title>. <comment><italic>arXiv</italic> [Preprint]. <italic>arXiv:1510.03820</italic></comment> (<year>2015</year>). <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1510.03820">https://arxiv.org/abs/1510.03820</ext-link> (Accessed December 3, 2023)</comment>.</citation></ref>
<ref id="B61"><label>61.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jacovi</surname><given-names>A</given-names></name><name><surname>Shalom</surname><given-names>OS</given-names></name><name><surname>Goldberg</surname><given-names>Y</given-names></name></person-group>. <article-title>Understanding convolutional neural networks for text classification</article-title>. <comment><italic>arXiv</italic> [Preprint]. <italic>arXiv:1809.08037</italic></comment> (<year>2018</year>). <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1809.08037">https://arxiv.org/abs/1809.08037</ext-link> (Accessed December 3, 2023)</comment>.</citation></ref>
<ref id="B62"><label>62.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rios</surname><given-names>A</given-names></name><name><surname>Kavuluru</surname><given-names>R</given-names></name></person-group>. <article-title>Convolutional neural networks for biomedical text classification: application in indexing biomedical articles</article-title>. <source>ACM BCB</source>. (<year>2015</year>) <volume>2015</volume>:<fpage>258</fpage>&#x2013;<lpage>67</lpage>. <pub-id pub-id-type="doi">10.1145/2808719.2808746</pub-id><pub-id pub-id-type="pmid">28736769</pub-id></citation></ref>
<ref id="B63"><label>63.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Landis</surname><given-names>JR</given-names></name><name><surname>Koch</surname><given-names>GG</given-names></name></person-group>. <article-title>The measurement of observer agreement for categorical data</article-title>. <source>Biometrics</source>. (<year>1977</year>) <volume>33</volume>(<issue>1</issue>):<fpage>159</fpage>&#x2013;<lpage>74</lpage>.<pub-id pub-id-type="pmid">843571</pub-id></citation></ref>
<ref id="B64"><label>64.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tonner</surname><given-names>C</given-names></name><name><surname>Schmajuk</surname><given-names>G</given-names></name><name><surname>Yazdany</surname><given-names>J</given-names></name></person-group>. <article-title>A new era of quality measurement in rheumatology: electronic clinical quality measures and national registries</article-title>. <source>Curr Opin Rheumatol</source>. (<year>2017</year>) <volume>29</volume>(<issue>2</issue>):<fpage>131</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1097/bor.0000000000000364</pub-id><pub-id pub-id-type="pmid">27941392</pub-id></citation></ref>
<ref id="B65"><label>65.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Allada</surname><given-names>AK</given-names></name><name><surname>Wang</surname><given-names>Y</given-names></name><name><surname>Jindal</surname><given-names>V</given-names></name><name><surname>Babee</surname><given-names>M</given-names></name><name><surname>Tizhoosh</surname><given-names>HR</given-names></name><name><surname>Crowley</surname><given-names>M</given-names></name></person-group>. <article-title>Analysis of language embeddings for classification of unstructured pathology reports</article-title>. <conf-name>Annu Int Conf IEEE Eng Med Biol Soc</conf-name>. (<year>2021</year>) <volume>2021</volume>:<fpage>2378</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1109/EMBC46164.2021.9630347</pub-id></citation></ref>
<ref id="B66"><label>66.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Velupillai</surname><given-names>S</given-names></name><name><surname>Suominen</surname><given-names>H</given-names></name><name><surname>Liakata</surname><given-names>M</given-names></name><name><surname>Roberts</surname><given-names>A</given-names></name><name><surname>Shah</surname><given-names>AD</given-names></name><name><surname>Morley</surname><given-names>K</given-names></name><etal/></person-group> <article-title>Using clinical natural language processing for health outcomes research: overview and actionable suggestions for future advances</article-title>. <source>J Biomed Inform</source>. (<year>2018</year>) <volume>88</volume>:<fpage>11</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbi.2018.10.005</pub-id><pub-id pub-id-type="pmid">30368002</pub-id></citation></ref>
<ref id="B67"><label>67.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sneeuw</surname><given-names>KC</given-names></name><name><surname>Sprangers</surname><given-names>MA</given-names></name><name><surname>Aaronson</surname><given-names>NK</given-names></name></person-group>. <article-title>The role of health care providers and significant others in evaluating the quality of life of patients with chronic disease</article-title>. <source>J Clin Epidemiol</source>. (<year>2002</year>) <volume>55</volume>(<issue>11</issue>):<fpage>1130</fpage>&#x2013;<lpage>43</lpage>. <pub-id pub-id-type="doi">10.1016/S0895-4356(02)00479-1</pub-id><pub-id pub-id-type="pmid">12507678</pub-id></citation></ref>
<ref id="B68"><label>68.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Field</surname><given-names>D</given-names></name><name><surname>Douglas</surname><given-names>C</given-names></name><name><surname>Jagger</surname><given-names>C</given-names></name><name><surname>Dand</surname><given-names>P</given-names></name></person-group>. <article-title>Terminal illness: views of patients and their lay carers</article-title>. <source>Palliat Med</source>. (<year>1995</year>) <volume>9</volume>(<issue>1</issue>):<fpage>45</fpage>&#x2013;<lpage>54</lpage>. <pub-id pub-id-type="doi">10.1177/026921639500900107</pub-id><pub-id pub-id-type="pmid">7719517</pub-id></citation></ref>
<ref id="B69"><label>69.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jones</surname><given-names>JM</given-names></name><name><surname>McPherson</surname><given-names>CJ</given-names></name><name><surname>Zimmermann</surname><given-names>C</given-names></name><name><surname>Rodin</surname><given-names>G</given-names></name><name><surname>Le</surname><given-names>LW</given-names></name><name><surname>Cohen</surname><given-names>SR</given-names></name></person-group>. <article-title>Assessing agreement between terminally ill cancer patients&#x2019; reports of their quality of life and family caregiver and palliative care physician proxy ratings</article-title>. <source>J Pain Symptom Manage</source>. (<year>2011</year>) <volume>42</volume>(<issue>3</issue>):<fpage>354</fpage>&#x2013;<lpage>65</lpage>. <pub-id pub-id-type="doi">10.1016/j.jpainsymman.2010.11.018</pub-id><pub-id pub-id-type="pmid">21454041</pub-id></citation></ref>
<ref id="B70"><label>70.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname><given-names>JS</given-names></name><name><surname>Keener</surname><given-names>JD</given-names></name><name><surname>Yamaguchi</surname><given-names>K</given-names></name><name><surname>Chen</surname><given-names>J</given-names></name><name><surname>Stobbs-Cucchi</surname><given-names>G</given-names></name><name><surname>Patton</surname><given-names>R</given-names></name><etal/></person-group> <article-title>Reliability of patient self-assessment of shoulder range of motion and strength after shoulder arthroplasty</article-title>. <source>J Shoulder Elbow Surg</source>. (<year>2015</year>) <volume>24</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1016/j.jse.2014.08.025</pub-id><pub-id pub-id-type="pmid">25440517</pub-id></citation></ref>
<ref id="B71"><label>71.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Loshchilov</surname><given-names>I</given-names></name><name><surname>Hutter</surname><given-names>F</given-names></name></person-group>. <article-title>Decoupled weight decay regularization</article-title>. <comment><italic>arXiv</italic> [Preprint]. <italic>arXiv:1711.05101</italic></comment> (<year>2017</year>). <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1711.05101">https://arxiv.org/abs/1711.05101</ext-link> (Accessed January 8, 2024)</comment>.<pub-id pub-id-type="pmid">26426070</pub-id></citation></ref></ref-list>
</back>
</article>