<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Surg.</journal-id>
<journal-title>Frontiers in Surgery</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Surg.</abbrev-journal-title>
<issn pub-type="epub">2296-875X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fsurg.2023.1271775</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Surgery</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Natural language processing for the automated detection of intra-operative elements in lumbar spine surgery</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name><surname>Biswas</surname><given-names>Sayan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref>
<xref ref-type="author-notes" rid="an1"><sup>&#x2020;</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/2362586/overview"/><role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/><role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/><role content-type="https://credit.niso.org/contributor-roles/methodology/"/><role content-type="https://credit.niso.org/contributor-roles/supervision/"/><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author" equal-contrib="yes"><name><surname>McMenemy</surname><given-names>Lareyna</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="an1"><sup>&#x2020;</sup></xref><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/></contrib>
<contrib contrib-type="author"><name><surname>Sarkar</surname><given-names>Ved</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/2406065/overview" /><role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/><role content-type="https://credit.niso.org/contributor-roles/software/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>MacArthur</surname><given-names>Joshua</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref><role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Snowdon</surname><given-names>Ella</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Tetlow</surname><given-names>Callum</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/2398764/overview" /><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/methodology/"/><role content-type="https://credit.niso.org/contributor-roles/supervision/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>George</surname><given-names>K. Joshi</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref></contrib>
</contrib-group>
<aff id="aff1"><label><sup>1</sup></label><institution>Faculty of Biology, Medicine and Health, University of Manchester</institution>, <addr-line>Manchester</addr-line>, <country>United Kingdom</country></aff>
<aff id="aff2"><label><sup>2</sup></label><institution>College of Letters and Sciences, University of California</institution>, <addr-line>Berkeley, CA</addr-line>, <country>United States</country></aff>
<aff id="aff3"><label><sup>3</sup></label><institution>Division of Data Science, The Northern Care Alliance NHS Group</institution>, <addr-line>Manchester</addr-line>, <country>United Kingdom</country></aff>
<aff id="aff4"><label><sup>4</sup></label><institution>Department of Neurosurgery, Manchester Centre for Clinical Neurosciences, Salford Royal Hospital</institution>, <addr-line>Manchester</addr-line>, <country>United Kingdom</country></aff>
<author-notes>
<fn fn-type="edited-by"><p><bold>Edited by:</bold> Mohammed Ali Alvi, University Health Network (UHN), Canada</p></fn>
<fn fn-type="edited-by"><p><bold>Reviewed by:</bold> Alessandro Boaro, University of Verona, Italy</p>
<p>Redi Rahmani, Barrow Neurological Institute (BNI), United States</p></fn>
<corresp id="cor1"><label>&#x002A;</label><bold>Correspondence:</bold> Sayan Biswas <email>sayan.biswas@nca.nhs.uk</email></corresp>
<fn fn-type="equal" id="an1"><label><sup>&#x2020;</sup></label><p>These authors have contributed equally to this work and share first authorship</p></fn>
<fn fn-type="other" id="fn001"><p><bold>Abbreviations</bold> AUC, area under the receiver-operating curve; CI, confidence intervals; CPT, current procedural terminology; DCA, decision curve analysis; ICD, international statistical classification of diseases; NLP, natural language processing; PPV, positive predictive value; TRIPOD, transparent reporting of multivariable prediction models for individual prognosis or diagnosis; XGBoost, extreme gradient boosting.</p></fn>
</author-notes>
<pub-date pub-type="epub"><day>18</day><month>12</month><year>2023</year></pub-date>
<pub-date pub-type="collection"><year>2023</year></pub-date>
<volume>10</volume><elocation-id>1271775</elocation-id>
<history>
<date date-type="received"><day>02</day><month>08</month><year>2023</year></date>
<date date-type="accepted"><day>27</day><month>11</month><year>2023</year></date>
</history>
<permissions>
<copyright-statement>&#x00A9; 2023 Biswas, McMenemy, Sarkar, MacArthur, Snowdon, Tetlow and George.</copyright-statement>
<copyright-year>2023</copyright-year><copyright-holder>Biswas, McMenemy, Sarkar, MacArthur, Snowdon, Tetlow and George</copyright-holder><license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec><title>Background</title>
<p>The aim of this study was to develop natural language processing (NLP) algorithms to conduct automated identification of incidental durotomy, wound drains, and the use of sutures or skin clips for wound closure, in free text operative notes of patients following lumbar surgery.</p>
</sec>
<sec><title>Methods</title>
<p>A single-centre retrospective case series analysis was conducted between January 2015 and June 2022, analysing operative notes of patients aged &#x003E;18 years who underwent a primary lumbar discectomy and/or decompression at any lumbar level. Extreme gradient-boosting NLP algorithms were developed and assessed on five performance metrics: accuracy, area under receiver-operating curve (AUC), positive predictive value (PPV), specificity, and Brier score.</p>
</sec>
<sec><title>Results</title>
<p>A total of 942 patients were used in the training set and 235 patients, in the testing set. The average age of the cohort was 53.900&#x2009;&#x00B1;&#x2009;16.153 years, with a female predominance of 616 patients (52.3&#x0025;). The models achieved an aggregate accuracy of &#x003E;91&#x0025;, a specificity of &#x003E;91&#x0025;, a PPV of &#x003E;84&#x0025;, an AUC of &#x003E;0.933, and a Brier score loss of &#x2264;0.082. The decision curve analysis also revealed that these NLP algorithms possessed great clinical net benefit at all possible threshold probabilities. Global and local model interpretation analyses further highlighted relevant clinically useful features (words) important in classifying the presence of each entity appropriately.</p>
</sec>
<sec><title>Conclusions</title>
<p>These NLP algorithms can help monitor surgical performance and complications in an automated fashion by identifying and classifying the presence of various intra-operative elements in lumbar spine surgery.</p>
</sec>
</abstract>
<kwd-group>
<kwd>clips</kwd>
<kwd>dural tears</kwd>
<kwd>natural language processing</kwd>
<kwd>sutures</kwd>
<kwd>spine surgery</kwd>
<kwd>wound drains</kwd>
</kwd-group>
<contract-sponsor id="cn001">The authors declare that no financial support was received for the research, authorship, and/or publication of this paper.</contract-sponsor>
<counts>
<fig-count count="5"/>
<table-count count="3"/><equation-count count="0"/><ref-count count="45"/><page-count count="0"/><word-count count="0"/></counts><custom-meta-wrap><custom-meta><meta-name>section-at-acceptance</meta-name><meta-value>Neurosurgery</meta-value></custom-meta></custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro"><label>1.</label><title>Introduction</title>
<p>Administrative, billing, and coding tasks are a major source of financial and economic burden on healthcare systems worldwide (<xref ref-type="bibr" rid="B1">1</xref>). With the increase in healthcare and labour costs in recent years, major health systems are shifting towards minimising financial expenditure while maximising patient care. A key component in this process is optimising the clinical coding pipeline by reducing the burden on labour with limited manual review and intervention. The clinical coding process involves transforming medical records, usually presented as free text written by clinicians, into structured codes using the standardised Current Procedural Terminology (CPT) and the International Statistical Classification of Diseases (ICD) codes. The purpose of such clinical coding is to characterise the use of hospital services, document patient outcomes, and quantify clinical and surgical practices to allow for optimal financial reimbursement and to inform healthcare service planning and policy (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B3">3</xref>).</p>
<p>Natural language processing (NLP) is a domain of machine learning that focuses on the analysis of structured and unstructured free text. NLP techniques are well suited for clinical coding due to their ability to analyse free text in real time with great precision. In the United Kingdom, the General Medical Council states that maintaining accurate and detailed clinical documentation is essential across all specialties for good medical practice (<xref ref-type="bibr" rid="B4">4</xref>), in addition to providing information for research, audits, and medicolegal records (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>). The current epidemic of defensive practice due to fear of medicolegal repercussions has had an extensive impact on neurosurgical documentation practices, resulting in more detailed documentation of procedures (<xref ref-type="bibr" rid="B7">7</xref>). Despite guidelines being available for the documentation of operative notes (<xref ref-type="bibr" rid="B8">8</xref>), many studies have demonstrated the inadequate quality of operative notes with much salient information missing, including the nature of the surgery, indication of surgery, estimated blood loss, incidence of complications, and postoperative instructions (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B9">9</xref>&#x2013;<xref ref-type="bibr" rid="B11">11</xref>). Such non-standardised documentation can lead to greater manual review times, making the extraction of relevant information more labour-intensive. The creation of accurate NLP algorithms trained on a large number of heterogeneous documents can be used to supplement the current clinical coding process, reducing the need for extensive and tedious manual reviews.</p>
<p>Spine surgery comprises the majority of operative cases in neurological surgery. Incidental durotomy, lumbar drains, and type of skin closure (sutures or clips) are important elements included in operative notes and are associated with patient outcomes, and therefore accurate documentation is vital to inform best clinical practice (<xref ref-type="bibr" rid="B12">12</xref>&#x2013;<xref ref-type="bibr" rid="B16">16</xref>). At present, CPT and ICD-10 codes are used to identify incidental durotomies and &#x201C;dural tears&#x201D; within operative notes. However, these modalities have been shown to lack sensitivity, resulting in the underreporting of these complications (<xref ref-type="bibr" rid="B17">17</xref>&#x2013;<xref ref-type="bibr" rid="B19">19</xref>). To the best of our knowledge, no such codes exist for the identification of the use of drains or wound closure technique used. Hence, the aim of this study is to develop NLP algorithms to conduct automated surveillance for identification of incidental durotomy, wound drains, and the use of sutures or skin clips for wound closure, in free text operative notes of patients following lumbar surgery. Towards this, in this study we attempted to evaluate if NLP techniques could be harnessed to analyse operative notes to detect the three important elements of spine surgery: incidental durotomy, the use of wound drains, and type of skin closure (suture or clips).</p>
</sec>
<sec id="s2" sec-type="methods"><label>2.</label><title>Materials and methods</title>
<sec id="s2a"><label>2.1.</label><title>Guidelines</title>
<p>The following guidelines were followed in this study: the <italic>Journal of Medical Internet Research</italic> (JMIR) Guidelines for Developing and Reporting Machine Learning Predictive Models in Biomedical Research, and the Transparent Reporting of Multivariable Prediction Models for Individual Prognosis or Diagnosis (TRIPOD) checklist (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B21">21</xref>).</p>
</sec>
<sec id="s2b"><label>2.2.</label><title>Data source and outcome measure</title>
<p>A single tertiary neurosurgical centre retrospective case series analysis was conducted for all patients who underwent lumbar spine surgery between January 2015 and June 2022. The inclusion criteria for this study were as follows: (1) patient age more than or equal to 18 years, (2) patient underwent a primary lumbar discectomy and/or decompression at any lumbar level, and (3) availability of index surgery operation notes in our electronic health records. The exclusion criteria included any patients with incomplete data and patients who underwent primary lumbar discectomy and/or fusion. The hospital&#x0027;s electronic patient records were examined and a total of 1,177 patients were identified. Each patient&#x0027;s operation note was then blinded and extracted in an anonymised manner. Our study was approved by the local hospital&#x0027;s institutional review board because of the retrospective and anonymised operative note data collection method. The study was registered as a health improvement project with the requirement for patient consent being waived. All methods were conducted in accordance with local and national guidelines and regulations.</p>
<p>Along with the operation notes, the age (continuous) and gender of the patient (male or female) were also collected as independent variables. There were three primary outcomes for each operation note: (1) the presence of intra-operative durotomies (binary outcome), (2) the placement of wound drains (binary outcome), and (3) the use of clips or sutures for skin closure (binary outcome). The terms durotomies and dural tears are used interchangeably in this paper. Each patient&#x0027;s operation note was reviewed and annotated by blinded researchers (LM and SB) who were not involved in the care of these patients. The results of each outcome category were then verified by the senior author.</p>
</sec>
<sec id="s2c"><label>2.3.</label><title>Data pre-processing</title>
<p>The data acquisition, pre-processing, model development, and evaluation pipeline have been highlighted in <xref ref-type="fig" rid="F1">Figure&#x00A0;1</xref>. The dataset was initially cleaned with a custom data-cleaning function that consisted of the removal of special characters retrieved from the Natural Language Toolkit (NLTK) such as &#x201C;@/&#x007B;&#x0024;&#x0023;&#x0025;&#x0026;&#x201D; and stopwords including &#x201C;<italic>and</italic>&#x201D;, &#x201C;<italic>or</italic>&#x201D;, and &#x201C;the&#x201D;. These words do not carry significant meaning or information in text analysis tasks, hence their removal helps to de-noise the text data resulting in the better efficiency and performance of NLP models. Stemming and lemmatisation are two common techniques used in the data-cleaning function, both of which aim to normalise words by reducing them to their base or root forms. Stemming achieves this by removing any suffixes at the end of a word, while lemmatisation is the process of reducing a word to its base or dictionary form (known as the lemma) while taking into account the context and part of speech of the word.</p>
<fig id="F1" position="float"><label>Figure 1</label>
<caption><p>Data acquisition, processing, analysis, and visualisation pipeline. DB, database.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fsurg-10-1271775-g001.tif"/>
</fig>
<p>Lastly, the CountVectorizer library function was used to pre-process the cleaned data. By default, CountVectorizer uses the &#x201C;term frequency&#x201D; weighting for single tokenisation, which means it represents each word by the number of times it appears in a document. This results in a document-term matrix where each element represents the frequency of a particular word in a specific document. The resulting matrix is then used as the input to various machine learning algorithms such as clustering, classification, and topic modelling. By representing text data in a numerical format, the CountVectorizer enables machine learning (ML) algorithms to process and analyse textual data, which would otherwise be difficult due to the unstructured nature of natural language.</p>
</sec>
<sec id="s2d"><label>2.4.</label><title>Model development</title>
<p>An 80:20 training&#x2013;testing split was carried out on the total cohort of 1,177 patients, with 942 patients in the training set and 235 patients in the testing set. The datasets were stratified for the outcome variables to account for class imbalances. An extreme gradient-boosting (XGBoost) NLP classifier was developed to predict each outcome category. XGBoost was selected as the classifier of choice owing to a number of factors: (1) its ability to handle high-dimensional feature spaces such as word to vector embeddings used in NLP, (2) the ability to handle and adjust for sparse and imbalanced datasets using weighted loss functions and subsampling, (3) its faster computational run time and scalability, and (4) explicit feature importance calculation for each input attribute (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B22">22</xref>). Three individual models were created for identifying each outcome category, and the outputs from the models were concatenated to produce a multilabel ensemble output with the predicted probabilities for each outcome. The three ML models will be referred to as the dural tear, drains, and clips vs. sutures models in this paper. An iterative process termed Grid Search was used to optimise the model hyperparameters. In grid search, a predefined set of hyperparameter values is defined, and the model is trained and evaluated on all possible combinations of these values to achieve the highest level of accuracy.</p>
<p>The models were trained on fivefold stratified K-fold cross-validation with five repeats on the training dataset. The training and testing datasets were stratified by each of the outcome categories to standardise the class imbalances within our outcome variables and provide us with the best overall performance results for the models. The performance of the models were evaluated via five performance metrics on the training and testing sets: accuracy, precision/positive predictive value (PPV), specificity, area under the receiver-operating curve (AUC)/discrimination, and the Brier score loss. All metrics were bootstrapped with 1,000 resamples to derive the associated 95&#x0025; confidence intervals (CIs). Each model was then calibrated on the testing set. Calibration refers to how well a model&#x0027;s predicted probabilities align with the true observed probabilities in the study population. This is evaluated using a calibration curve, which is ideally a 45&#x00B0; straight line starting from the origin, with a slope of 1 (indicating the spread of the model&#x0027;s estimated probabilities over the observed probabilities), and an intercept of 0 (indicating how much the model tends to over- or underestimate the true probability). In this study, the preferred method of calibration was Platt scaling or sigmoid binned calibration, which involved dividing the probability range into 10 bins and evaluating the shape of the calibration curve, as well as its slope, intercept, and the Brier score loss metric. In addition, the decision curve analysis (DCA) was used to evaluate and plot the clinical benefit of using the NLP algorithms to predict the presence of each outcome variable over a wide range of predicted threshold probabilities. The DCA illustrates the net benefit defined as the number of true positives detected for each outcome class when using the NLP algorithms on individual patient operation notes.</p>
<p>A model-specific global feature importance analysis was conducted on the trained models via retrieval of each model&#x0027;s relative feature weights that were averaged across all training folds. Furthermore, the Local Interpretable Model-agnostic Explanation analysis was performed to predict and highlight the important features on an individual patient operation note level.</p>
</sec>
<sec id="s2e"><label>2.5.</label><title>Statistical analysis</title>
<p>All statistical analyses were conducted using IBM SPSS software (Statistical Package for the Social Science; SPSS Inc., Chicago, IL, USA) Version 25 for Mac, Microsoft Excel (Office 365, Microsoft, Seattle, WA, USA), and the R coding language (R Foundation for Statistical Computing, Vienna, Austria). Histogram plots and the Kolmogorov&#x2013;Smirnov test were utilised for tests of normality for the continuous variables. The chi-squared tests were used to compare all categorical variables, and the independent samples <italic>t</italic>-test was used to compare the means of the continuous variables. Temporal trend analysis with a linear line of best fit was conducted for all variables, within our retrospective observation time period. A <italic>p</italic>-value &#x003C;0.05 was considered statistically significant.</p>
</sec>
</sec>
<sec id="s3" sec-type="results"><label>3.</label><title>Results</title>
<sec id="s3a"><label>3.1.</label><title>Cohort demographics</title>
<p>A total of 1,177 patients were included in the study, with 942 patients in the training set and 235 patients in the testing set. <xref ref-type="table" rid="T1">Table&#x00A0;1</xref> demonstrates the total cohort demographics. The average age of the cohort was 53.900&#x2009;&#x00B1;&#x2009;16.153 years, with a female predominance of 616 patients (52.3&#x0025;). The rates of intra-operative durotomy and the use of wounds drains were 9.9&#x0025; (117/1,177) and 31.6&#x0025; (373/1,177), respectively. Overall, the use of sutures [710 (60.3&#x0025;)] was more common for skin closure compared with the use of metal surgical clips [458 (38.9&#x0025;)]. The inter-variable comparative analysis (<xref ref-type="table" rid="T2">Table&#x00A0;2</xref>) demonstrated a significant relationship between increasing patient age and the use of sutures (<italic>p-</italic>value&#x2009;&#x003D;&#x2009;0.001). We also noted that with an ageing population, the operative age of our patients significantly increased over our observation period (<italic>p-</italic>value&#x2009;&#x003D;&#x2009;0.013). There was also a statistically significant relationship between the use of sutures for skin closure in cases with intra-operative dural tears and wound drains (<italic>p-</italic>value&#x2009;&#x003C;&#x2009;0.001). However, there was no statistically significant relationship between the use of wound drains and the presence of intra-operative dural tears (<italic>p-</italic>value&#x2009;&#x003D;&#x2009;0.554).</p>
<table-wrap id="T1" position="float"><label>Table 1</label>
<caption><p>Cohort demographics of the total patient cohort.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left"/>
<th valign="top" align="center">Total cohort (<italic>n</italic>&#x2009;&#x003D;&#x2009;1,177)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Age</td>
<td valign="top" align="center">53.900&#x2009;&#x00B1;&#x2009;16.153</td>
</tr>
<tr>
<td valign="top" align="left" colspan="2">Sex</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Female</td>
<td valign="top" align="center">616 (52.3&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Male</td>
<td valign="top" align="center">561 (47.7&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="2">Drain(s)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="top" align="center">373 (31.6&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;No</td>
<td valign="top" align="center">801 (67.8&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="2">Closure</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Clips</td>
<td valign="top" align="center">458 (38.9&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Sutures</td>
<td valign="top" align="center">710 (60.3&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="2">Dural tear(s)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="top" align="center">117 (9.9&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;No</td>
<td valign="top" align="center">1,060 (90.1&#x0025;)</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T2" position="float"><label>Table 2</label>
<caption><p>Inter-variable statistical correlation analysis using <italic>t</italic>-tests for continuous variables and Chi-square tests for categorical variables.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left" rowspan="2"/>
<th valign="top" align="center" colspan="6"><italic>p</italic>-value</th>
</tr>
<tr>
<th valign="top" align="center">Age</th>
<th valign="top" align="center">Sex</th>
<th valign="top" align="center">Drains</th>
<th valign="top" align="center">Closure</th>
<th valign="top" align="center">Dural tear(s)</th>
<th valign="top" align="center">Year of surgery</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Age</td>
<td valign="top" align="center"/>
<td valign="top" align="center">0.137</td>
<td valign="top" align="center">0.283</td>
<td valign="top" align="center">0.001<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
<td valign="top" align="center">0.501</td>
<td valign="top" align="center">0.013<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
</tr>
<tr>
<td valign="top" align="left" colspan="7">Sex</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Female</td>
<td valign="top" align="center" rowspan="2">0.137</td>
<td valign="top" align="center" rowspan="2"/>
<td valign="top" align="center" rowspan="2">0.278</td>
<td valign="top" align="center" rowspan="2">0.294</td>
<td valign="top" align="center" rowspan="2">0.217</td>
<td valign="top" align="center" rowspan="2">0.322</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Male</td>
</tr>
<tr>
<td valign="top" align="left" colspan="7">Drain(s)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="top" align="center" rowspan="2">0.283</td>
<td valign="top" align="center" rowspan="2">0.278</td>
<td valign="top" align="center" rowspan="2"/>
<td valign="top" align="center" rowspan="2">&#x003C;0.001<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
<td valign="top" align="center" rowspan="2">0.554</td>
<td valign="top" align="center" rowspan="2">0.906</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;No</td>
</tr>
<tr>
<td valign="top" align="left" colspan="7">Closure</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Clips</td>
<td valign="top" align="center" rowspan="2">0.001<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
<td valign="top" align="center" rowspan="2">0.294</td>
<td valign="top" align="center" rowspan="2">&#x003C;0.001<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
<td valign="top" align="center" rowspan="2"/>
<td valign="top" align="center" rowspan="2">&#x003C;0.001<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
<td valign="top" align="center" rowspan="2">0.017<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Sutures</td>
</tr>
<tr>
<td valign="top" align="left" colspan="7">Dural tear(s)</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;Yes</td>
<td valign="top" align="center" rowspan="2">0.501</td>
<td valign="top" align="center" rowspan="2">0.217</td>
<td valign="top" align="center" rowspan="2">0.554</td>
<td valign="top" align="center" rowspan="2">&#x003C;0.001<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
<td valign="top" align="center" rowspan="2"/>
<td valign="top" align="center" rowspan="2">0.853</td>
</tr>
<tr>
<td valign="top" align="left">&#x2003;No</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn1"><label><sup>a</sup></label><p>Statistically significant <italic>p</italic>-value.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3b"><label>3.2.</label><title>Temporal trend analysis</title>
<p>The Mann&#x2013;Kendall test was used to analyse the temporal trends of the variables across our observation time period as shown in Supplementary Figure S1. During the study period, the total number of lumbar discectomies and/or decompressions decreased significantly from 220 surgeries in 2015 to 56 in the first half of 2022 (&#x2212;112 estimated in a year) (tau&#x2009;&#x003D;&#x2009;&#x2212;0.929, <italic>p-</italic>value&#x2009;&#x003D;&#x2009;0.002). This decline was observed in all the years with the exception of 2019, which saw an increase of one operation from the previous year. It was noted that there was also a decrease in all spinal procedures post COVID-19, which may account for the decrease. The frequency of intra-operative durotomies/dural tears did decrease over the study period; however, no statistical significance was observed (tau&#x2009;&#x003D;&#x2009;&#x2212;0.286, <italic>p-</italic>value&#x2009;&#x003D;&#x2009;0.386), with rates ranging from 5.8&#x0025; to 14.2&#x0025;. The frequency of intra-operative placement of wound drains also statistically significantly increased over the study period, rising from 18.6&#x0025; in 2015 to 41.1&#x0025; in 2022 (tau&#x2009;&#x003D;&#x2009;0.643, <italic>p-</italic>value&#x2009;&#x003D;&#x2009;0.035). The preferred method of skin closure also changed over the study period, demonstrating a preference for closure with sutures in later years (tau&#x2009;&#x003D;&#x2009;0.5, <italic>p-</italic>value&#x2009;&#x003D;&#x2009;0.108) with a rise from 54&#x0025; in 2015 to 75&#x0025; in 2022. We observed an exact yet complementary decrease in the use of surgical clips for skin closure over the years (tau&#x2009;&#x003D;&#x2009;&#x2212;0.5, <italic>p-</italic>value&#x2009;&#x003D;&#x2009;0.108).</p>
</sec>
<sec id="s3c"><label>3.3.</label><title>Model performance</title>
<p><xref ref-type="table" rid="T3">Table&#x00A0;3</xref> provides the performance metrics for the three ML models on the testing dataset. The dural tears model achieved an accuracy of 91.7615 (95&#x0025; CI: 88.636&#x2013;94.602), a PPV of 84.211&#x0025; (95&#x0025; CI: 80.667&#x2013;90.000), a specificity of 99.032&#x0025; (95&#x0025; CI: 96.959&#x2013;99.750), and an AUC of 0.946 (95&#x0025; CI: 0.917&#x2013;0.970). The drains model achieved an accuracy of 94.894&#x0025; (95&#x0025; CI: 92.330&#x2013;97.160), a PPV of 88.696&#x0025; (95&#x0025; CI: 82.308&#x2013;94.000), a specificity of 94.694&#x0025; (95&#x0025; CI: 90.886&#x2013;97.025), and an AUC of 0.950 (95&#x0025; CI: 0.923&#x2013;0.973). The clips vs. sutures model achieved an accuracy of 93.750&#x0025; (95&#x0025; CI: 91.193&#x2013;96.307), a PPV of 94.495&#x0025; (95&#x0025; CI: 91.379&#x2013;97.260), a specificity of 91.177&#x0025; (95&#x0025; CI: 84.770&#x2013;95.153), and an AUC of 0.933 (95&#x0025; CI: 0.923&#x2013;0.973). <xref ref-type="fig" rid="F2">Figure&#x00A0;2</xref> shows the calibration curves for each of the models. The dural tears model had a propensity to underpredict the presence of a dural tear, with a Brier score loss of 0.082 (95&#x0025; CI: 0.054&#x2013;0.114), an intercept of 0.91 (95&#x0025; CI: 0.46&#x2013;1.36), and a slope of 0.99 (95&#x0025; CI: 0.76&#x2013;1.23). The drains model demonstrated excellent calibration across all predicted probabilities with a Brier score loss of 0.051 (95&#x0025; CI: 0.028&#x2013;0.076), an intercept of &#x2212;0.71 (95&#x0025; CI: &#x2212;1.31 to &#x2212;0.12), and a slope of 0.75 (95&#x0025; CI: 0.60&#x2013;0.91). The clips vs. sutures model demonstrated a tendency to overpredict the use of sutures for skin closure, with a Brier score loss of 0.063 (95&#x0025; CI: 0.037&#x2013;0.088), an intercept of &#x2212;0.01 (95&#x0025; CI: &#x2212;0.61&#x2013;0.60), and a slope of 0.65 (95&#x0025; CI: 0.53&#x2013;0.77). Lastly, the decision curve analysis on the testing set revealed that all NLP algorithms ensured greater clinical net benefit at all possible threshold probabilities relative to the default decisions of changes made for all or none patients (<xref ref-type="fig" rid="F3">Figure&#x00A0;3</xref>).</p>
<table-wrap id="T3" position="float"><label>Table 3</label>
<caption><p>Performance metrics of the machine learning model on the testing set with 95&#x0025; confidence intervals.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="center">Accuracy (&#x0025;)</th>
<th valign="top" align="center">Precision/PPV (&#x0025;)</th>
<th valign="top" align="center">Specificity (&#x0025;)</th>
<th valign="top" align="center">AUC</th>
<th valign="top" align="center">Brier score loss</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="6">Testing set (<italic>n</italic>&#x2009;&#x003D;&#x2009;235)</td>
</tr>
<tr>
<td valign="top" align="left">Dural tears</td>
<td valign="top" align="center">91.761 (88.636&#x2013;94.602)</td>
<td valign="top" align="center">84.211 (80.667&#x2013;90.000)</td>
<td valign="top" align="center">99.032 (96.959&#x2013;99.750)</td>
<td valign="top" align="center">0.946 (0.917&#x2013;0.970)</td>
<td valign="top" align="center">0.082 (0.054&#x2013;0.114)</td>
</tr>
<tr>
<td valign="top" align="left">Drains</td>
<td valign="top" align="center">94.894 (92.330&#x2013;97.160)</td>
<td valign="top" align="center">88.696 (82.308&#x2013;94.000)</td>
<td valign="top" align="center">94.694 (90.886&#x2013;97.025)</td>
<td valign="top" align="center">0.950 (0.923&#x2013;0.973)</td>
<td valign="top" align="center">0.051 (0.028&#x2013;0.076)</td>
</tr>
<tr>
<td valign="top" align="left">Clips vs. sutures</td>
<td valign="top" align="center">93.750 (91.193&#x2013;96.307)</td>
<td valign="top" align="center">94.495 (91.379&#x2013;97.260)</td>
<td valign="top" align="center">91.177 (84.770&#x2013;95.153)</td>
<td valign="top" align="center">0.933 (0.923&#x2013;0.973)</td>
<td valign="top" align="center">0.063 (0.037&#x2013;0.088)</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F2" position="float"><label>Figure 2</label>
<caption><p>Calibration curves of the natural language processing models for identifying (<bold>A</bold>) dural tears, (<bold>B</bold>) wound drains, and (<bold>C</bold>) clips vs. sutures, in the testing set (<italic>n</italic>&#x2009;&#x003D;&#x2009;235).</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fsurg-10-1271775-g002.tif"/>
</fig>
<fig id="F3" position="float"><label>Figure 3</label>
<caption><p>Decision curve analyses comparing expected clinical net benefit of the three models: (<bold>A</bold>) dural tears, (<bold>B</bold>) wound drains, and (<bold>C</bold>) clips vs. sutures, on the testing set.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fsurg-10-1271775-g003.tif"/>
</fig>
</sec>
<sec id="s3d"><label>3.4.</label><title>Model explainability</title>
<p>The global feature importance calculations for the NLP algorithms are presented in <xref ref-type="fig" rid="F4">Figure&#x00A0;4</xref>. These explanations highlight that for identification of an intra-operative durotomy, the five most meaningful features (words) are: &#x201C;repair,&#x201D; &#x201C;intradural,&#x201D; &#x201C;dural,&#x201D; &#x201C;patch,&#x201D; and &#x201C;Valsalva.&#x201D; The five most important features (words) for detecting the intra-operative placement of a lumbar drain are: &#x201C;drain,&#x201D; &#x201C;fascial,&#x201D; &#x201C;scoliosis,&#x201D; &#x201C;clotting,&#x201D; and &#x201C;incision.&#x201D; Similarly, for detecting whether surgical clips or traditional sutures were utilised for skin closure, the following five words were the most important: &#x201C;clip,&#x201D; &#x201C;staple,&#x201D; &#x201C;warmer,&#x201D; &#x201C;lamina,&#x201D; and &#x201C;clamp.&#x201D; In addition, the local feature importance analysis for an example patient level operation note demonstrates that the dural tear model is able to identify the five most important clinically meaningful features to detect the presence of an intra-operative dural tear (<xref ref-type="fig" rid="F5">Figure&#x00A0;5</xref>). Interestingly, the local feature importance analysis for the drains and clips vs. sutures model demonstrated that the algorithm primarily searched only for the words &#x201C;drain&#x201D; and &#x201C;clip,&#x201D; respectively, to make the prediction, with the other aforementioned features possessing very little impact on the outcome.</p>
<fig id="F4" position="float"><label>Figure 4</label>
<caption><p>Global feature importance values for the NLP algorithms: (<bold>A</bold>) dural tears, (<bold>B</bold>) wound drains, and (<bold>C</bold>) clips vs. sutures.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fsurg-10-1271775-g004.tif"/>
</fig>
<fig id="F5" position="float"><label>Figure 5</label>
<caption><p>Local feature importance analysis for detecting dural tears in an example individual patient operation note as generated by the NLP algorithm.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fsurg-10-1271775-g005.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion"><label>4.</label><title>Discussion</title>
<p>This study analysed the trends in the use of various intra-operative elements in spine surgery and developed NLP algorithms capable of reliably identifying these elements in operative notes. The automated identification of these elements can facilitate more efficient clinical coding and billing processes, help optimise hospital quality improvement and safety efforts, assist clinicians in auditing surgical practices, and guide overall resource allocation. This study demonstrates that our NLP algorithms are capable of reliably and accurately identifying the placement of intra-operative wound drains, the presence of incidental dural tears, and whether surgical clips or sutures were utilised for skin closure. This is the first ever study from a country with a public healthcare system that has demonstrated the feasibility of using automated NLP systems in operative notes to potentially guide both surgical practices and resource allocation.</p>
<p>The use of NLP techniques in spine surgery has seen a rise in the recent years and is projected to rapidly grow in the future (<xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B24">24</xref>). The ability of NLP to perform precise automated surveillance of operative notes, to answer clinically relevant questions, serves to reduce the burden of time-intensive and error-prone reviews by clinical coders (<xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B26">26</xref>). The delays in clinical coding within the National Health Service (NHS) impose a significant burden, with the potential for funding to be blocked if coding is not completed within a prerequisite timeframe (<xref ref-type="bibr" rid="B27">27</xref>). The average accuracy of this coding has been reported at approximately 83&#x0025;, with large inter-study variability (<xref ref-type="bibr" rid="B28">28</xref>). Such problems exist in majority of healthcare systems worldwide and necessitate the development of automated techniques capable of facilitating these burdensome manual record review processes. Within this realm, Zaidat et al. have already developed an XLNet model capable of automatically generating CPT billing codes from operative notes for three specific surgical procedures: anterior cervical discectomy and fusion (ACDF), posterior cervical discectomy and fusion (PCDF), and cervical disc arthroplasty (CDA) (<xref ref-type="bibr" rid="B2">2</xref>). Such models have the potential to greatly reduce manual review/input, minimise errors in the coding process, and promote standardisation. Most recently, Shost et al. have also demonstrated a model capable of reliably identifying the type of spinal surgery performed via analysis of patient consent forms (<xref ref-type="bibr" rid="B29">29</xref>). The ability to rapidly classify surgical practices can be beneficial to both hospitals and the practicing surgeons. This will help track surgical volume, surgery-specific patient outcomes, and also provide trainees with a method of tracking individual surgical experience. In addition, NLP algorithms have also demonstrated predictive value in classifying lumbar spine imaging findings and in determining the need for surgical intervention in patients with low back pain via analysis of radiological and clinical reports (<xref ref-type="bibr" rid="B30">30</xref>). These examples highlight the importance of NLP techniques in improving the provision of patient care and demonstrate the clinical utility of such models in enhancing hospital and surgical practices.</p>
<p>Our NLP algorithms were developed to identify the presence of three important intra-operative factors that play a role in guiding the resource allocation and surgical practices of a neurosurgical department. In this study, the prevalence of incidental durotomy was 9.9&#x0025;, in line with the recent literature on lumbar surgery (<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B32">32</xref>). Our model demonstrated adequate discrimination and performance in identifying intra-operative dural tears and highlighted the use of clinically relevant features (words) to make its predictions. Previous studies by Karhade et al. have also been successful in the identification of incidental durotomy with an accuracy of 99&#x0025;, surpassing the performance of CPT and ICD-10 codes, which demonstrated an accuracy of only 64&#x0025; (<xref ref-type="bibr" rid="B18">18</xref>). Interestingly, however, the feature importance in their NLP algorithm showed different features compared with ours, further underscoring the potential variability in NLP algorithm performance across different cohorts that are geographically separated, and highlighting the need for broader validation studies (<xref ref-type="bibr" rid="B17">17</xref>). The importance of reliably identifying cases of intra-operative incidental durotomy is highlighted by evidence suggesting that patients with durotomies tend to have increased operative durations and inpatient length of stay (LOS) (<xref ref-type="bibr" rid="B33">33</xref>). Thus, accurate depiction of the rates of incidental durotomy can aid postoperative patient counselling, quantify surgical complication rates, and help track surgical performance.</p>
<p>For the wound drains model, our study demonstrated an accuracy of almost 95&#x0025;. Previous studies have concluded that postoperative drains are currently being overused in spinal surgery, potentially imposing an increased risk of unnecessary complications, while not lending substantial benefit (<xref ref-type="bibr" rid="B34">34</xref>). Most notably, reports have suggested an elevated risk of surgical site infections (SSI) (<xref ref-type="bibr" rid="B35">35</xref>, <xref ref-type="bibr" rid="B36">36</xref>), although this has been refuted by other papers (<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B37">37</xref>&#x2013;<xref ref-type="bibr" rid="B39">39</xref>). Ho et al. interestingly report that both the absence of a wound drain and increased drainage when drains are used indicate an increased risk of delayed infection after posterior spine surgery (<xref ref-type="bibr" rid="B36">36</xref>). Walid et al. additionally found that the use of postoperative drains was linked to increased post-haemorrhagic anaemia, and a subsequent requirement of allogenic blood transfusions (<xref ref-type="bibr" rid="B40">40</xref>), which may impose greater costs to the healthcare system. Adogwa et al. have also demonstrated that patients with postoperative drains have a significantly longer LOS compared with patients with no drains (<xref ref-type="bibr" rid="B37">37</xref>). The combination of such factors highlights the importance of tracking and quantifying the use of drains in spine surgery, and therefore the development of our NLP algorithm will allow for its automated and reliable detection. The future application of this algorithm in tracking wound drain use and the associated SSI rates remains to be investigated.</p>
<p>Further, our clips vs. suture model demonstrated an accuracy of &#x003E;93&#x0025; accuracy, and our temporal trend analysis showed a preference for using sutures for wound closure. Various studies have concluded that suturing is more efficient when compared with the use of clips for good wound closure, resulting in lower rates of separation, prevention of SSI, and ultimately shorter hospital LOS (<xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B42">42</xref>). Contrastingly, postoperative analysis of visual analogue pain scores comparing the use of clips to non-absorbable sutures have also demonstrated a significantly quicker and pain-free experience for patients with stapled wounds (<xref ref-type="bibr" rid="B43">43</xref>). From an economic perspective as well, studies have demonstrated that staples/clips are less expensive than sutures and that the financial gain appears to increase as laceration length increases (<xref ref-type="bibr" rid="B44">44</xref>). However, conflicting literature exists on the impact of sutures and clips on patients postoperatively (<xref ref-type="bibr" rid="B22">22</xref>), with the need for future robust randomised control trials to further investigate their effects. Nevertheless, such single-use surgical items are the largest contributors to the surgical carbon footprint and hence precise quantification of such use can guide both financial and environmental practices (<xref ref-type="bibr" rid="B45">45</xref>). Therefore, such automated NLP techniques can facilitate accurate data collection and analysis of the use of clips and sutures in neurosurgery. Nevertheless, the utility of this NLP algorithm in identifying and predicting postoperative LOS, risk of SSI, and the estimated carbon footprint after a surgery remains to be explored in a future study.</p>
<sec id="s4a"><label>4.1.</label><title>Limitations</title>
<p>Despite these results, the study has several limitations. First, this was a retrospective analysis at a single centre and therefore the development and testing of the NLP algorithms was geographically limited to a specific region. This raises questions about the algorithms&#x2019; generalisability and their performance in diverse linguistic and clinical contexts. Furthermore, the surgeons affiliated with the healthcare entities in the study likely share practices that influence the specific terminology used to document the various intra-operative characteristics, which could bias the results. Hence, future prospective and external validation of the algorithms needs to be performed to validate the clinical utility of the algorithms. In addition, there are other approaches that can be utilised to adapt our general model to geographically distinct regions. Geographically customisable models can be implemented via techniques such as federated learning and transfer learning. Federated learning enables the collaborative training of models across multiple centres without data sharing, preserving both privacy and centre-specific relationships and trends in the data. Transfer learning further facilitates rapid fine-tuning, which can efficiently adapt a base model to new regions by learning from small local datasets, boosting model performance and reliability. Secondly, though these models are able to reliably identify the outcomes of interest, a further manual review by clinical coders will still be required to exclude any cases of false positives or false negatives. Thus, the need for manual review will still exist, though with a considerably lower level of burden. Hence, multicentre, linguistically different validation studies in hospitals with varying coding/billing practices are required to determine the reliability of these models. Lastly, with the advent of state-of-the-art large language models such as Bidirectional Encoder Representations from Transformers and Generative Pre-trained Transformer models, the need for manual annotation of unstructured, free text data may exponentially reduce. These models are capable of independently performing named entity recognition and can understand the contextual nuances of each outcome of interest. For example, these models would be able to interpret the reason/context for using a drain, or the reason for a durotomy. Thus, in the future the goal would be to develop such models capable of functioning independently without the need for any manual annotation or review.</p>
</sec>
</sec>
<sec id="s5" sec-type="conclusions"><label>5.</label><title>Conclusion</title>
<p>In conclusion, this study evaluated the feasibility and reliability of NLP algorithms in determining the presence of three intra-operative elements in lumbar spine surgery. We demonstrate that these NLP models possess great discriminative ability and accuracy in predicting the presence of wound drains, incidental dural tears, and the use of clips or sutures for wound closure. These models can help automate the clinical coding process, help optimise hospital quality improvement, and monitor surgical performance and practices. This is the first ever study from a country with a primarily public healthcare system that has demonstrated the feasibility of using automated NLP systems in operative notes to potentially guide both surgical practices and resource allocation.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability"><title>Data availability statement</title>
<p>The original contributions presented in this study are included in the article/<xref ref-type="sec" rid="s100">supplementary materials</xref> and further inquires should be directed to the corresponding author.</p>
</sec>
<sec id="s7" sec-type="ethics-statement"><title>Ethics statement</title>
<p>The studies involving humans were approved by Northern Care Alliance Research and Innovation Team. The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation was not required from the participants or the participants&#x2019; legal guardians/next of kin in accordance with the national legislation and institutional requirements.</p>
</sec>
<sec id="s8" sec-type="author-contributions"><title>Author contributions</title>
<p>SB: Conceptualization, Formal analysis, Methodology, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. LM: Data curation, Formal analysis, Writing &#x2013; original draft. VS: Formal analysis, Software, Writing &#x2013; review &#x0026; editing. JM: Conceptualization, Writing &#x2013; review &#x0026; editing. ES: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. CT: Data curation, Methodology, Supervision, Writing &#x2013; review &#x0026; editing. KG: Methodology, Supervision, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec id="s9" sec-type="funding-information"><title>Funding</title>
<p>The authors declare that no financial support was received for the research, authorship, and/or publication of this paper.</p>
</sec>
<ack><title>Acknowledgments</title>
<p>The authors wish to acknowledge the Department of Neurosurgery at Salford Royal Hospital for providing the data.</p>
</ack>
<sec id="s10" sec-type="COI-statement"><title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="disclaimer"><title>Publisher&#x0027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s100" sec-type="supplementary-material"><title>Supplementary material</title>
<p>The Supplementary Material for this paper can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fsurg.2023.1271775/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fsurg.2023.1271775/full&#x0023;supplementary-material</ext-link></p>
<supplementary-material id="SD1" content-type="local-data">
<media mimetype="application" mime-subtype="pdf" xlink:href="Image1.pdf"/>
</supplementary-material>
</sec>
<ref-list><title>References</title>
<ref id="B1"><label>1.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chernew</surname><given-names>M</given-names></name><name><surname>Mintz</surname><given-names>H</given-names></name></person-group>. <article-title>Administrative expenses in the US health care system: why so high?</article-title> <source>JAMA</source>. (<year>2021</year>) <volume>326</volume>(<issue>17</issue>):<fpage>1679</fpage>&#x2013;<lpage>80</lpage>. <pub-id pub-id-type="doi">10.1001/jama.2021.17318</pub-id><pub-id pub-id-type="pmid">34668530</pub-id></citation></ref>
<ref id="B2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zaidat</surname><given-names>B</given-names></name><name><surname>Tang</surname><given-names>J</given-names></name><name><surname>Arvind</surname><given-names>V</given-names></name><name><surname>Geng</surname><given-names>EA</given-names></name><name><surname>Cho</surname><given-names>B</given-names></name><name><surname>Duey</surname><given-names>AH</given-names></name><etal/></person-group> <article-title>Can a novel natural language processing model and artificial intelligence automatically generate billing codes from spine surgical operative notes?</article-title> <source>Global Spine J</source>. (<year>2023</year>):<fpage>21925682231164936</fpage>. <pub-id pub-id-type="doi">10.1177/21925682231164935</pub-id>. [Epub ahead of print]</citation></ref>
<ref id="B3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dong</surname><given-names>H</given-names></name><name><surname>Falis</surname><given-names>M</given-names></name><name><surname>Whiteley</surname><given-names>W</given-names></name><name><surname>Alex</surname><given-names>B</given-names></name><name><surname>Matterson</surname><given-names>J</given-names></name><name><surname>Ji</surname><given-names>S</given-names></name><etal/></person-group> <article-title>Automated clinical coding: what, why, and where we are?</article-title> <source>NPJ Digit Med</source>. (<year>2022</year>) <volume>5</volume>(<issue>1</issue>):<fpage>159</fpage>. <pub-id pub-id-type="doi">10.1038/s41746-022-00705-7</pub-id><pub-id pub-id-type="pmid">36273236</pub-id></citation></ref>
<ref id="B4"><label>4.</label><citation citation-type="other"><collab>GMC</collab>. <comment><italic>Good medical practice</italic> (2013). Available at</comment>: <ext-link ext-link-type="uri" xlink:href="https://www.gmc-uk.org/ethical-guidance/ethical-guidance-for-doctors/good-medical-practice">https://www.gmc-uk.org/ethical-guidance/ethical-guidance-for-doctors/good-medical-practice</ext-link> (accessed July 19, 2023).</citation></ref>
<ref id="B5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hamza</surname><given-names>A</given-names></name><name><surname>Abdalrahim</surname><given-names>H</given-names></name><name><surname>Idris</surname><given-names>S</given-names></name><name><surname>Ahmed</surname><given-names>O</given-names></name></person-group>. <article-title>Evaluating the operative notes of patients undergoing surgery at Omdurman Teaching Hospital, Sudan</article-title>. <source>Sch J App Med Sci</source>. (<year>2013</year>) <volume>1</volume>(<issue>6</issue>):<fpage>668</fpage>&#x2013;<lpage>72</lpage>. <pub-id pub-id-type="doi">10.36347/sjams.2013.v01i06.003</pub-id></citation></ref>
<ref id="B6"><label>6.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rogers</surname><given-names>A</given-names></name><name><surname>Bunting</surname><given-names>M</given-names></name><name><surname>Atherstone</surname><given-names>A</given-names></name></person-group>. <article-title>The quality of operative notes at a general surgery unit</article-title>. <source>S Afr Med J</source>. (<year>2008</year>) <volume>98</volume>(<issue>9</issue>):<fpage>726</fpage>&#x2013;<lpage>8</lpage>.<pub-id pub-id-type="pmid">19113057</pub-id></citation></ref>
<ref id="B7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gadjradj</surname><given-names>PS</given-names></name><name><surname>Ghobrial</surname><given-names>JB</given-names></name><name><surname>Harhangi</surname><given-names>BS</given-names></name></person-group>. <article-title>Experiences of neurological surgeons with malpractice lawsuits</article-title>. <source>Neurosurg Focus</source>. (<year>2020</year>) <volume>49</volume>(<issue>5</issue>):<fpage>E3</fpage>. <pub-id pub-id-type="doi">10.3171/2020.8.FOCUS20250</pub-id><pub-id pub-id-type="pmid">33130609</pub-id></citation></ref>
<ref id="B8"><label>8.</label><citation citation-type="other"><collab>RCS</collab>. <comment><italic>Good surgical practice</italic> (2019). Available at</comment>: <ext-link ext-link-type="uri" xlink:href="https://www.rcseng.ac.uk/standards-and-research/gsp/">https://www.rcseng.ac.uk/standards-and-research/gsp/</ext-link> (accessed July 19, 2023).</citation></ref>
<ref id="B9"><label>9.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lefter</surname><given-names>LP</given-names></name><name><surname>Walker</surname><given-names>SR</given-names></name><name><surname>Dewhurst</surname><given-names>F</given-names></name><name><surname>Turner</surname><given-names>RWL</given-names></name></person-group>. <article-title>An audit of operative notes: facts and ways to improve</article-title>. <source>ANZ J Surg</source>. (<year>2008</year>) <volume>78</volume>(<issue>9</issue>):<fpage>800</fpage>&#x2013;<lpage>2</lpage>. <pub-id pub-id-type="doi">10.1111/j.1445-2197.2008.04654.x</pub-id><pub-id pub-id-type="pmid">18844913</pub-id></citation></ref>
<ref id="B10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Malik</surname><given-names>S</given-names></name><name><surname>Nogaro</surname><given-names>M</given-names></name><name><surname>Shenoy</surname><given-names>R</given-names></name><name><surname>Mitchell</surname><given-names>P</given-names></name></person-group>. <article-title>Improving trauma operation notes at an emerging trauma unit in the regional trauma network</article-title>. <source>Bull R Coll Surg Engl</source>. (<year>2013</year>) <volume>95</volume>(<issue>6</issue>):<fpage>1</fpage>&#x2013;<lpage>3</lpage>. <pub-id pub-id-type="doi">10.1308/003588413X13643054410386</pub-id></citation></ref>
<ref id="B11"><label>11.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nyamulani</surname><given-names>N</given-names></name><name><surname>Mulwafu</surname><given-names>W</given-names></name></person-group>. <article-title>The quality of hand-written operative notes in a surgical unit at Queen Elizabeth central hospital (QECH), Malawi: a prospective completed audit loop study</article-title>. <source>Malawi Med J</source>. (<year>2018</year>) <volume>30</volume>(<issue>2</issue>):<fpage>86</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.4314/mmj.v30i2.6</pub-id><pub-id pub-id-type="pmid">30627334</pub-id></citation></ref>
<ref id="B12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nandyala</surname><given-names>SV</given-names></name><name><surname>Elboghdady</surname><given-names>IM</given-names></name><name><surname>Marquez-Lara</surname><given-names>A</given-names></name><name><surname>Noureldin</surname><given-names>MNB</given-names></name><name><surname>Sankaranarayanan</surname><given-names>S</given-names></name><name><surname>Singh</surname><given-names>K</given-names></name></person-group>. <article-title>Cost analysis of incidental durotomy in spine surgery</article-title>. <source>Spine (Phila Pa 1976)</source>. (<year>2014</year>) <volume>39</volume>(<issue>17</issue>):<fpage>E1042</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1097/BRS.0000000000000425</pub-id><pub-id pub-id-type="pmid">24859577</pub-id></citation></ref>
<ref id="B13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saxler</surname><given-names>G</given-names></name><name><surname>Kr&#x00E4;mer</surname><given-names>J</given-names></name><name><surname>Barden</surname><given-names>B</given-names></name><name><surname>Kurt</surname><given-names>A</given-names></name><name><surname>Pf&#x00F6;rtner</surname><given-names>J</given-names></name><name><surname>Bernsmann</surname><given-names>K</given-names></name></person-group>. <article-title>The long-term clinical sequelae of incidental durotomy in lumbar disc surgery</article-title>. <source>Spine (Phila Pa 1976)</source>. (<year>2005</year>) <volume>30</volume>(<issue>20</issue>):<fpage>2298</fpage>&#x2013;<lpage>302</lpage>. <pub-id pub-id-type="doi">10.1097/01.brs.0000182131.44670.f7</pub-id><pub-id pub-id-type="pmid">16227893</pub-id></citation></ref>
<ref id="B14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Str&#x00F6;mqvist</surname><given-names>F</given-names></name><name><surname>Sigmundsson</surname><given-names>FG</given-names></name><name><surname>Str&#x00F6;mqvist</surname><given-names>B</given-names></name><name><surname>J&#x00F6;nsson</surname><given-names>B</given-names></name><name><surname>Karlsson</surname><given-names>MK</given-names></name></person-group>. <article-title>Incidental durotomy in degenerative lumbar spine surgery&#x2014;a register study of 64,431 operations</article-title>. <source>Spine J</source>. (<year>2019</year>) <volume>19</volume>(<issue>4</issue>):<fpage>624</fpage>&#x2013;<lpage>30</lpage>. <pub-id pub-id-type="doi">10.1016/j.spinee.2018.08.012</pub-id></citation></ref>
<ref id="B15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kanayama</surname><given-names>M</given-names></name><name><surname>Oha</surname><given-names>F</given-names></name><name><surname>Togawa</surname><given-names>D</given-names></name><name><surname>Shigenobu</surname><given-names>K</given-names></name><name><surname>Hashimoto</surname><given-names>T</given-names></name></person-group>. <article-title>Is closed-suction drainage necessary for single-level lumbar decompression?: review of 560 cases</article-title>. <source>Clin Orthop Relat Res</source>. (<year>2010</year>) <volume>468</volume>(<issue>10</issue>):<fpage>2690</fpage>&#x2013;<lpage>4</lpage>. <pub-id pub-id-type="doi">10.1007/s11999-010-1235-6</pub-id><pub-id pub-id-type="pmid">20091386</pub-id></citation></ref>
<ref id="B16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yilmaz</surname><given-names>E</given-names></name><name><surname>Blecher</surname><given-names>R</given-names></name><name><surname>Moisi</surname><given-names>M</given-names></name><name><surname>Ankush</surname><given-names>C</given-names></name><name><surname>O&#x2019;Lynnger</surname><given-names>TM</given-names></name><name><surname>Abdul-Jabbar</surname><given-names>A</given-names></name><etal/></person-group> <article-title>Is there an optimal wound closure technique for major posterior spine surgery? A systematic review</article-title>. <source>Global Spine J</source>. (<year>2018</year>) <volume>8</volume>(<issue>5</issue>):<fpage>535</fpage>&#x2013;<lpage>44</lpage>. <pub-id pub-id-type="doi">10.1177/2192568218774323</pub-id><pub-id pub-id-type="pmid">30258761</pub-id></citation></ref>
<ref id="B17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Karhade</surname><given-names>AV</given-names></name><name><surname>Oosterhoff</surname><given-names>JHF</given-names></name><name><surname>Groot</surname><given-names>OQ</given-names></name><name><surname>Agaronnik</surname><given-names>N</given-names></name><name><surname>Ehresman</surname><given-names>J</given-names></name><name><surname>Bongers</surname><given-names>MER</given-names></name><etal/></person-group> <article-title>Can we geographically validate a natural language processing algorithm for automated detection of incidental durotomy across three independent cohorts from two continents?</article-title> <source>Clin Orthop Relat Res</source>. (<year>2022</year>) <volume>480</volume>(<issue>9</issue>):<fpage>1766</fpage>&#x2013;<lpage>75</lpage>. <pub-id pub-id-type="doi">10.1097/CORR.0000000000002200</pub-id><pub-id pub-id-type="pmid">35412473</pub-id></citation></ref>
<ref id="B18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Karhade</surname><given-names>A</given-names></name><name><surname>Bongers</surname><given-names>M</given-names></name><name><surname>Groot</surname><given-names>O</given-names></name><name><surname>Kazarian</surname><given-names>E</given-names></name><name><surname>Cha</surname><given-names>T</given-names></name><name><surname>Fogel</surname><given-names>H</given-names></name><etal/></person-group> <article-title>Natural language processing for automated detection of incidental durotomy</article-title>. <source>Spine J</source>. (<year>2020</year>) <volume>20</volume>(<issue>5</issue>):<fpage>695</fpage>&#x2013;<lpage>700</lpage>. <pub-id pub-id-type="doi">10.1016/j.spinee.2019.12.006</pub-id><pub-id pub-id-type="pmid">31877390</pub-id></citation></ref>
<ref id="B19"><label>19.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ehresman</surname><given-names>J</given-names></name><name><surname>Pennington</surname><given-names>Z</given-names></name><name><surname>Karhade</surname><given-names>A</given-names></name><name><surname>Huq</surname><given-names>S</given-names></name><name><surname>Medikonda</surname><given-names>R</given-names></name><name><surname>Schilling</surname><given-names>A</given-names></name><etal/></person-group> <article-title>Incidental durotomy: predictive risk model and external validation of natural language process identification algorithm</article-title>. <source>J Neurosurg Spine</source>. (<year>2020</year>) <volume>33</volume>(<issue>3</issue>):<fpage>342</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.3171/2020.2.SPINE20127</pub-id></citation></ref>
<ref id="B20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Collins</surname><given-names>GS</given-names></name><name><surname>Reitsma</surname><given-names>JB</given-names></name><name><surname>Altman</surname><given-names>DG</given-names></name><name><surname>Moons</surname><given-names>K</given-names></name></person-group>. <article-title>Transparent reporting of a multivariable prediction model for individual prognosis or diagnosis (TRIPOD): the TRIPOD statement</article-title>. <source>BMC Med</source>. (<year>2015</year>) <volume>13</volume>(<issue>1</issue>):<fpage>1</fpage>. <pub-id pub-id-type="doi">10.1186/s12916-014-0241-z</pub-id><pub-id pub-id-type="pmid">25563062</pub-id></citation></ref>
<ref id="B21"><label>21.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname><given-names>W</given-names></name><name><surname>Phung</surname><given-names>D</given-names></name><name><surname>Tran</surname><given-names>T</given-names></name><name><surname>Gupta</surname><given-names>S</given-names></name><name><surname>Rana</surname><given-names>S</given-names></name><name><surname>Karmakar</surname><given-names>C</given-names></name><etal/></person-group> <article-title>Guidelines for developing and reporting machine learning predictive models in biomedical research: a multidisciplinary view</article-title>. <source>J Med Internet Res</source>. (<year>2016</year>) <volume>18</volume>(<issue>12</issue>):<fpage>e323</fpage>. <pub-id pub-id-type="doi">10.2196/jmir.5870</pub-id><pub-id pub-id-type="pmid">27986644</pub-id></citation></ref>
<ref id="B22"><label>22.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Selvadurai</surname><given-names>D</given-names></name><name><surname>Wildin</surname><given-names>C</given-names></name><name><surname>Treharne</surname><given-names>G</given-names></name><name><surname>Choksy</surname><given-names>SA</given-names></name><name><surname>Heywood</surname><given-names>MM</given-names></name><name><surname>Nicholson</surname><given-names>ML</given-names></name></person-group>. <article-title>Randomised trial of subcuticular suture versus metal clips for wound closure after thyroid and parathyroid surgery</article-title>. <source>Ann R Coll Surg Engl</source>. (<year>1997</year>) <volume>79</volume>(<issue>4</issue>):<fpage>303</fpage>&#x2013;<lpage>6</lpage>.<pub-id pub-id-type="pmid">9244079</pub-id></citation></ref>
<ref id="B23"><label>23.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname><given-names>BB</given-names></name><name><surname>Huang</surname><given-names>J</given-names></name><name><surname>Swong</surname><given-names>KN</given-names></name></person-group>. <article-title>Natural language processing in spine surgery: a systematic review of applications, bias, and reporting transparency</article-title>. <source>World Neurosurg</source>. (<year>2022</year>) <volume>167</volume>:<fpage>156</fpage>&#x2013;<lpage>64.e6</lpage>. <pub-id pub-id-type="doi">10.1016/j.wneu.2022.08.109</pub-id><pub-id pub-id-type="pmid">36049723</pub-id></citation></ref>
<ref id="B24"><label>24.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Agaronnik</surname><given-names>ND</given-names></name><name><surname>Kwok</surname><given-names>A</given-names></name><name><surname>Schoenfeld</surname><given-names>AJ</given-names></name><name><surname>Lindvall</surname><given-names>C</given-names></name></person-group>. <article-title>Natural language processing for automated surveillance of intraoperative neuromonitoring in spine surgery</article-title>. <source>J Clin Neurosci</source>. (<year>2022</year>) <volume>97</volume>:<fpage>121</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1016/j.jocn.2022.01.015</pub-id><pub-id pub-id-type="pmid">35093791</pub-id></citation></ref>
<ref id="B25"><label>25.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bacco</surname><given-names>L</given-names></name><name><surname>Russo</surname><given-names>F</given-names></name><name><surname>Ambrosio</surname><given-names>L</given-names></name><name><surname>D&#x2019;Antoni</surname><given-names>F</given-names></name><name><surname>Vollero</surname><given-names>L</given-names></name><name><surname>Vadal&#x00E0;</surname><given-names>G</given-names></name><etal/></person-group> <article-title>Natural language processing in low back pain and spine diseases: a systematic review</article-title>. <source>Front Surg</source>. (<year>2022</year>) <volume>9</volume>:<fpage>957085</fpage>. <pub-id pub-id-type="doi">10.3389/fsurg.2022.957085</pub-id><pub-id pub-id-type="pmid">35910476</pub-id></citation></ref>
<ref id="B26"><label>26.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Groot</surname><given-names>O</given-names></name><name><surname>Ogink</surname><given-names>P</given-names></name><name><surname>Oosterhoff</surname><given-names>J</given-names></name><name><surname>Beam</surname><given-names>A</given-names></name></person-group>. <article-title>Natural language processing and its role in spine surgery: a narrative review of potentials and challenges</article-title>. <source>Semin Spine Surg</source>. (<year>2021</year>) <volume>33</volume>(<issue>1</issue>):<fpage>100877</fpage>. <pub-id pub-id-type="doi">10.1016/j.semss.2021.100877</pub-id></citation></ref>
<ref id="B27"><label>27.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alonso</surname><given-names>V</given-names></name><name><surname>Santos</surname><given-names>JV</given-names></name><name><surname>Pinto</surname><given-names>M</given-names></name><name><surname>Ferreira</surname><given-names>J</given-names></name><name><surname>Lema</surname><given-names>I</given-names></name><name><surname>Lopes</surname><given-names>F</given-names></name><etal/></person-group> <article-title>Problems and barriers during the process of clinical coding: a focus group study of Coders&#x2019; perceptions</article-title>. <source>J Med Syst</source>. (<year>2020</year>) <volume>44</volume>(<issue>3</issue>):<fpage>62</fpage>. <pub-id pub-id-type="doi">10.1007/s10916-020-1532-x</pub-id><pub-id pub-id-type="pmid">32036459</pub-id></citation></ref>
<ref id="B28"><label>28.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Burns</surname><given-names>EM</given-names></name><name><surname>Rigby</surname><given-names>E</given-names></name><name><surname>Mamidanna</surname><given-names>R</given-names></name><name><surname>Bottle</surname><given-names>A</given-names></name><name><surname>Aylin</surname><given-names>P</given-names></name><name><surname>Ziprin</surname><given-names>P</given-names></name><etal/></person-group> <article-title>Systematic review of discharge coding accuracy</article-title>. <source>J Public Health (Oxf)</source>. (<year>2012</year>) <volume>34</volume>(<issue>1</issue>):<fpage>138</fpage>&#x2013;<lpage>48</lpage>. <pub-id pub-id-type="doi">10.1093/pubmed/fdr054</pub-id><pub-id pub-id-type="pmid">21795302</pub-id></citation></ref>
<ref id="B29"><label>29.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shost</surname><given-names>MD</given-names></name><name><surname>Meade</surname><given-names>SM</given-names></name><name><surname>Steinmetz</surname><given-names>MP</given-names></name><name><surname>Mroz</surname><given-names>TE</given-names></name><name><surname>Habboub</surname><given-names>G</given-names></name></person-group>. <article-title>Surgical classification using natural language processing of informed consent forms in spine surgery</article-title>. <source>Neurosurg Focus</source>. (<year>2023</year>) <volume>54</volume>(<issue>6</issue>):<fpage>E10</fpage>. <pub-id pub-id-type="doi">10.3171/2023.3.FOCUS2371</pub-id><pub-id pub-id-type="pmid">37283446</pub-id></citation></ref>
<ref id="B30"><label>30.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krebs</surname><given-names>B</given-names></name><name><surname>Nataraj</surname><given-names>A</given-names></name><name><surname>McCabe</surname><given-names>E</given-names></name><name><surname>Clark</surname><given-names>S</given-names></name><name><surname>Sufiyan</surname><given-names>Z</given-names></name><name><surname>Yamamoto</surname><given-names>SS</given-names></name><etal/></person-group> <article-title>Developing a triage predictive model for access to a spinal surgeon using clinical variables and natural language processing of radiology reports</article-title>. <source>Eur Spine J</source>. (<year>2023</year>) <volume>32</volume>(<issue>1</issue>):<fpage>181</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1007/s00586-023-07552-4</pub-id><pub-id pub-id-type="pmid">36374335</pub-id></citation></ref>
<ref id="B31"><label>31.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mueller</surname><given-names>KB</given-names></name><name><surname>Garrett</surname><given-names>CT</given-names></name><name><surname>Kane</surname><given-names>S</given-names></name><name><surname>Sandhu</surname><given-names>FA</given-names></name><name><surname>Voyadzis</surname><given-names>JM</given-names></name></person-group>. <article-title>Incidental durotomy following surgery for degenerative lumbar disease and the impact of minimally invasive surgical technique on the rate and need for surgical revision: a case series</article-title>. <source>Oper Neurosurg (Hagerstown)</source>. (<year>2021</year>) <volume>21</volume>(<issue>5</issue>):<fpage>351</fpage>&#x2013;<lpage>5</lpage>. <pub-id pub-id-type="doi">10.1093/ons/opab282</pub-id><pub-id pub-id-type="pmid">34460926</pub-id></citation></ref>
<ref id="B32"><label>32.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Albayar</surname><given-names>A</given-names></name><name><surname>Spadola</surname><given-names>M</given-names></name><name><surname>Blue</surname><given-names>R</given-names></name><name><surname>Saylany</surname><given-names>A</given-names></name><name><surname>Dagli</surname><given-names>MM</given-names></name><name><surname>Santangelo</surname><given-names>G</given-names></name><etal/></person-group> <article-title>Incidental durotomy repair in lumbar spine surgery: institutional experience and review of literature</article-title>. <source>Global Spine J</source>. (<year>2022</year>):<fpage>21925682221141370</fpage>. <pub-id pub-id-type="doi">10.1177/21925682221141368</pub-id>. [Epub ahead of print]</citation></ref>
<ref id="B33"><label>33.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Desai</surname><given-names>A</given-names></name><name><surname>Ball</surname><given-names>PA</given-names></name><name><surname>Bekelis</surname><given-names>K</given-names></name><name><surname>Lurie</surname><given-names>J</given-names></name><name><surname>Mirza</surname><given-names>SK</given-names></name><name><surname>Tosteson</surname><given-names>TD</given-names></name><etal/></person-group> <article-title>SPORT: does incidental durotomy affect longterm outcomes in cases of spinal stenosis?</article-title> <source>Neurosurgery</source>. (<year>2015</year>) <volume>76 Suppl 1</volume>(<issue>01</issue>):<fpage>S57</fpage>&#x2013;<lpage>63</lpage>; <comment>discussion S63</comment>. <pub-id pub-id-type="doi">10.1227/01.neu.0000462078.58454.f4</pub-id><pub-id pub-id-type="pmid">25692369</pub-id></citation></ref>
<ref id="B34"><label>34.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Reier</surname><given-names>L</given-names></name><name><surname>Fowler</surname><given-names>JB</given-names></name><name><surname>Arshad</surname><given-names>M</given-names></name><name><surname>Siddiqi</surname><given-names>J</given-names></name></person-group>. <article-title>Drains in spine surgery for degenerative disc diseases: a literature review to determine its usage</article-title>. <source>Cureus</source>. (<year>2022</year>) <volume>14</volume>(<issue>3</issue>):<fpage>312</fpage>&#x2013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.7759/cureus.23129</pub-id></citation></ref>
<ref id="B35"><label>35.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mirzai</surname><given-names>H</given-names></name><name><surname>Eminoglu</surname><given-names>M</given-names></name><name><surname>Orguc</surname><given-names>S</given-names></name></person-group>. <article-title>Are drains useful for lumbar disc surgery? A prospective, randomized clinical study</article-title>. <source>J Spinal Disord Tech</source>. (<year>2006</year>) <volume>19</volume>(<issue>3</issue>):<fpage>171</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1097/01.bsd.0000190560.20872.a7</pub-id><pub-id pub-id-type="pmid">16770213</pub-id></citation></ref>
<ref id="B36"><label>36.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ho</surname><given-names>C</given-names></name><name><surname>Sucato</surname><given-names>DJ</given-names></name><name><surname>Richards</surname><given-names>BS</given-names></name></person-group>. <article-title>Risk factors for the development of delayed infections following posterior spinal fusion and instrumentation in adolescent idiopathic scoliosis patients</article-title>. <source>Spine (Phila Pa 1976)</source>. (<year>2007</year>) <volume>32</volume>(<issue>20</issue>):<fpage>2272</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1097/BRS.0b013e31814b1c0b</pub-id><pub-id pub-id-type="pmid">17873822</pub-id></citation></ref>
<ref id="B37"><label>37.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Adogwa</surname><given-names>O</given-names></name><name><surname>Elsamadicy</surname><given-names>AA</given-names></name><name><surname>Sergesketter</surname><given-names>AR</given-names></name><name><surname>Shammas</surname><given-names>RL</given-names></name><name><surname>Vatsia</surname><given-names>S</given-names></name><name><surname>Vuong</surname><given-names>VD</given-names></name><etal/></person-group> <article-title>Post-operative drain use in patients undergoing decompression and fusion: incidence of complications and symptomatic hematoma</article-title>. <source>J Spine Surg</source>. (<year>2018</year>) <volume>4</volume>(<issue>2</issue>):<fpage>220</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.21037/jss.2018.05.09</pub-id><pub-id pub-id-type="pmid">30069510</pub-id></citation></ref>
<ref id="B38"><label>38.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Brown</surname><given-names>MD</given-names></name><name><surname>Brookfield</surname><given-names>KFW</given-names></name></person-group>. <article-title>A randomized study of closed wound suction drainage for extensive lumbar spine surgery</article-title>. <source>Spine (Phila Pa 1976)</source>. (<year>2004</year>) <volume>29</volume>(<issue>10</issue>):<fpage>1066</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1097/00007632-200405150-00003</pub-id><pub-id pub-id-type="pmid">15131430</pub-id></citation></ref>
<ref id="B39"><label>39.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Choi</surname><given-names>HS</given-names></name><name><surname>Lee</surname><given-names>SG</given-names></name><name><surname>Kim</surname><given-names>WK</given-names></name><name><surname>Son</surname><given-names>S</given-names></name><name><surname>Jeong</surname><given-names>TS</given-names></name></person-group>. <article-title>Is surgical drain useful for lumbar disc surgery?</article-title> <source>Korean J Spine</source>. (<year>2016</year>) <volume>13</volume>(<issue>1</issue>):<fpage>20</fpage>&#x2013;<lpage>3</lpage>. <pub-id pub-id-type="doi">10.14245/kjs.2016.13.1.20</pub-id><pub-id pub-id-type="pmid">27123026</pub-id></citation></ref>
<ref id="B40"><label>40.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Walid</surname><given-names>MS</given-names></name><name><surname>Abbara</surname><given-names>M</given-names></name><name><surname>Tolaymat</surname><given-names>A</given-names></name><name><surname>Davis</surname><given-names>JR</given-names></name><name><surname>Waits</surname><given-names>KD</given-names></name><name><surname>Robinson</surname><given-names>JS</given-names></name><etal/></person-group> <article-title>The role of drains in lumbar spine fusion</article-title>. <source>World Neurosurg</source>. (<year>2012</year>) <volume>77</volume>(<issue>3&#x2013;4</issue>):<fpage>564</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1016/j.wneu.2011.05.058</pub-id><pub-id pub-id-type="pmid">22120372</pub-id></citation></ref>
<ref id="B41"><label>41.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zaman</surname><given-names>S</given-names></name><name><surname>Mohamedahmed</surname><given-names>AYY</given-names></name><name><surname>Peterknecht</surname><given-names>E</given-names></name><name><surname>Zakaria</surname><given-names>RM</given-names></name><name><surname>Mohamedahmed</surname><given-names>SYY</given-names></name><name><surname>Hajibandeh</surname><given-names>S</given-names></name><etal/></person-group> <article-title>Sutures versus clips for skin closure following caesarean section: a systematic review, meta-analysis and trial sequential analysis of randomised controlled trials</article-title>. <source>Langenbecks Arch Surg</source>. (<year>2022</year>) <volume>407</volume>(<issue>1</issue>):<fpage>37</fpage>&#x2013;<lpage>50</lpage>. <pub-id pub-id-type="doi">10.1007/s00423-021-02239-0</pub-id><pub-id pub-id-type="pmid">34232372</pub-id></citation></ref>
<ref id="B42"><label>42.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mostofi</surname><given-names>K</given-names></name><name><surname>Peyravi</surname><given-names>M</given-names></name><name><surname>Shirbacheh</surname><given-names>A</given-names></name><name><surname>Shirbache</surname><given-names>K</given-names></name></person-group>. <article-title>A comparison between different suture techniques in lumbar spine surgery</article-title>. <source>Int Wound J</source>. (<year>2023</year>) <volume>20</volume>(<issue>2</issue>):<fpage>296</fpage>&#x2013;<lpage>301</lpage>. <pub-id pub-id-type="doi">10.1111/iwj.13875</pub-id><pub-id pub-id-type="pmid">36317419</pub-id></citation></ref>
<ref id="B43"><label>43.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Meiring</surname><given-names>L</given-names></name><name><surname>Cilliers</surname><given-names>K</given-names></name><name><surname>Barry</surname><given-names>R</given-names></name><name><surname>Nel</surname><given-names>CJ</given-names></name></person-group>. <article-title>A comparison of a disposable skin stapler and nylon sutures for wound closure</article-title>. <source>S Afr Med J</source>. (<year>1982</year>) <volume>62</volume>(<issue>11</issue>):<fpage>371</fpage>&#x2013;<lpage>2</lpage>.<pub-id pub-id-type="pmid">7112304</pub-id></citation></ref>
<ref id="B44"><label>44.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Orlinsky</surname><given-names>M</given-names></name><name><surname>Goldberg</surname><given-names>RM</given-names></name><name><surname>Chan</surname><given-names>L</given-names></name><name><surname>Puertos</surname><given-names>A</given-names></name><name><surname>Slajer</surname><given-names>HL</given-names></name></person-group>. <article-title>Cost analysis of stapling versus suturing for skin closure</article-title>. <source>Am J Emerg Med</source>. (<year>1995</year>) <volume>13</volume>(<issue>1</issue>):<fpage>77</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1016/0735-6757(95)90248-1</pub-id><pub-id pub-id-type="pmid">7832962</pub-id></citation></ref>
<ref id="B45"><label>45.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rizan</surname><given-names>C</given-names></name><name><surname>Lillywhite</surname><given-names>R</given-names></name><name><surname>Reed</surname><given-names>M</given-names></name><name><surname>Bhutta</surname><given-names>MF</given-names></name></person-group>. <article-title>The carbon footprint of products used in five common surgical operations: identifying contributing products and processes</article-title>. <source>J R Soc Med</source>. (<year>2023</year>) <volume>116</volume>(<issue>6</issue>):<fpage>1410768231166135</fpage>. <pub-id pub-id-type="doi">10.1177/01410768231166135</pub-id></citation></ref></ref-list>
</back>
</article>