<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<?covid-19-tdm?>
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Med.</journal-id>
<journal-title>Frontiers in Medicine</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Med.</abbrev-journal-title>
<issn pub-type="epub">2296-858X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmed.2022.846525</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Medicine</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Machine-Learning Approaches for Predicting the Need of Oxygen Therapy in Early-Stage COVID-19 in Japan: Multicenter Retrospective Observational Study</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Yamanaka</surname> <given-names>Syunsuke</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/599651/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Morikawa</surname> <given-names>Koji</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Azuma</surname> <given-names>Hiroyuki</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Yamanaka</surname> <given-names>Maki</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Shimada</surname> <given-names>Yoshimitsu</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Wada</surname> <given-names>Toru</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Matano</surname> <given-names>Hideyuki</given-names></name>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Yamada</surname> <given-names>Naoki</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Yamamura</surname> <given-names>Osamu</given-names></name>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1407486/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Hayashi</surname> <given-names>Hiroyuki</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Emergency Medicine and General Internal Medicine, University of Fukui Hospital</institution>, <addr-line>Fukui</addr-line>, <country>Japan</country></aff>
<aff id="aff2"><sup>2</sup><institution>Connect Inc.</institution>, <addr-line>Tokyo</addr-line>, <country>Japan</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Emergency Medicine, Fukui Prefectural Hospital</institution>, <addr-line>Fukui</addr-line>, <country>Japan</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Emergency Medicine, Tannan Regional Medical Center</institution>, <addr-line>Sabae</addr-line>, <country>Japan</country></aff>
<aff id="aff5"><sup>5</sup><institution>Department of Emergency Medicine, Japanese Red Cross Fukui Hospital</institution>, <addr-line>Fukui</addr-line>, <country>Japan</country></aff>
<aff id="aff6"><sup>6</sup><institution>Department of Emergency Medicine, Sugita Genpaku Memorial Obama Municipal Hospital</institution>, <addr-line>Obama</addr-line>, <country>Japan</country></aff>
<aff id="aff7"><sup>7</sup><institution>Department of Emergency Medicine, Fukui-ken Saiseikai Hospital</institution>, <addr-line>Fukui</addr-line>, <country>Japan</country></aff>
<aff id="aff8"><sup>8</sup><institution>Department of Community Medicine, Faculty of Medicine, University of Fukui Hospital</institution>, <addr-line>Fukui</addr-line>, <country>Japan</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Longxiang Su, Peking Union Medical College Hospital (CAMS), China</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Carmen Silvia Valente Barbas, University of S&#x000E3;o Paulo, Brazil; Zisis Kozlakidis, International Agency for Research on Cancer (IARC), France</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Syunsuke Yamanaka <email>yamanakasyunsuke&#x00040;yahoo.co.jp</email></corresp>
<fn fn-type="other" id="fn001"><p>This article was submitted to Infectious Diseases - Surveillance, Prevention and Treatment, a section of the journal Frontiers in Medicine</p></fn></author-notes>
<pub-date pub-type="epub">
<day>23</day>
<month>02</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>9</volume>
<elocation-id>846525</elocation-id>
<history>
<date date-type="received">
<day>31</day>
<month>12</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>27</day>
<month>01</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2022 Yamanaka, Morikawa, Azuma, Yamanaka, Shimada, Wada, Matano, Yamada, Yamamura and Hayashi.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Yamanaka, Morikawa, Azuma, Yamanaka, Shimada, Wada, Matano, Yamada, Yamamura and Hayashi</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Early prediction of oxygen therapy in patients with coronavirus disease 2019 (COVID-19) is vital for triage. Several machine-learning prognostic models for COVID-19 are currently available. However, external validation of these models has rarely been performed. Therefore, most reported predictive performance is optimistic and has a high risk of bias. This study aimed to develop and validate a model that predicts oxygen therapy needs in the early stages of COVID-19 using a sizable multicenter dataset.</p></sec>
<sec>
<title>Methods</title>
<p>This multicenter retrospective study included consecutive COVID-19 hospitalized patients confirmed by a reverse transcription chain reaction in 11 medical institutions in Fukui, Japan. We developed and validated seven machine-learning models (e.g., penalized logistic regression model) using routinely collected data (e.g., demographics, simple blood test). The primary outcome was the need for oxygen therapy (&#x02265;1 L/min or SpO<sub>2</sub> &#x02264; 94%) during hospitalization. C-statistics, calibration slope, and association measures (e.g., sensitivity) evaluated the performance of the model using the test set (randomly selected 20% of data for internal validation). Among these seven models, the machine-learning model that showed the best performance was re-evaluated using an external dataset. We compared the model performances using the A-DROP criteria (modified version of CURB-65) as a conventional method.</p></sec>
<sec>
<title>Results</title>
<p>Of the 396 patients with COVID-19 for the model development, 102 patients (26%) required oxygen therapy during hospitalization. For internal validation, machine-learning models, except for the <italic>k</italic>-point nearest neighbor, had a higher discrimination ability than the A-DORP criteria (<italic>P</italic> &#x0003C; 0.01). The XGboost had the highest c-statistic in the internal validation (0.92 vs. 0.69 in A-DROP criteria; <italic>P</italic> &#x0003C; 0.001). For the external validation with 728 temporal independent datasets (106 patients [15%] required oxygen therapy), the XG boost model had a higher c-statistic (0.88 vs. 0.69 in A-DROP criteria; <italic>P</italic> &#x0003C; 0.001).</p></sec>
<sec>
<title>Conclusions</title>
<p>Machine-learning models demonstrated a more significant performance in predicting the need for oxygen therapy in the early stages of COVID-19.</p></sec></abstract>
<kwd-group>
<kwd>COVID-19</kwd>
<kwd>machine learning</kwd>
<kwd>prognostic model</kwd>
<kwd>medical triage</kwd>
<kwd>multicenter</kwd>
<kwd>PROBAST</kwd>
<kwd>TRIPOD</kwd>
</kwd-group>
<counts>
<fig-count count="2"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="33"/>
<page-count count="8"/>
<word-count count="5908"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>The novel coronavirus disease 2019 (COVID-19), first reported in the Hubei province of the People&#x00027;s Republic of China in December 2019, has led to an urgent threat to global health. Many countries faced an emergency crisis despite the significant public and private efforts to delay disease spread (<xref ref-type="bibr" rid="B1">1</xref>). The exponential increase in COVID-19 incidence has led to a significant demand for medical services, resulting in a shortage of medical resources (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B3">3</xref>). Since, it is challenging to hospitalize all patients with COVID-19 in most countries, careful observation outside the hospital is standard for asymptomatic patients and patients with mild symptoms (<xref ref-type="bibr" rid="B4">4</xref>). However, some asymptomatic or patients with mild symptoms of COVID-19 at the first medical visit develop severe pneumonia during observation (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>). Although, there is no definitive antiviral medication against COVID-19, medications, such as oxygen therapy, antiviral medication, steroids, and supportive care, have become the standard of care and have been effective (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B8">8</xref>). As a result, preventable deaths occur because of the lack of adequate prediction of patient prognosis at the first medical visit and close follow-up (<xref ref-type="bibr" rid="B9">9</xref>). Some of them could have been saved if the need for oxygen therapy had been correctly predicted on the first visit (<xref ref-type="bibr" rid="B10">10</xref>). Therefore, accurate medical triage for asymptomatic patients and patients with mild symptoms in the early stage of COVID-19 is essential to decrease the incidence of death and allocate limited medical resources appropriately during the observation period (<xref ref-type="bibr" rid="B11">11</xref>). In previous studies, artificial intelligence, such as machine learning, has shown better predictive capabilities than traditional statistical methods (<xref ref-type="bibr" rid="B12">12</xref>). However, most published models have not been externally validated with calibration plots, resulting in a high risk of bias (<xref ref-type="bibr" rid="B13">13</xref>&#x02013;<xref ref-type="bibr" rid="B15">15</xref>). In addition, few studies have included most patients who were hospitalized, even if the patients were asymptomatic, and have observed their progress in detail. Therefore, the performance of the reported models might be optimistic and highly biased (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B16">16</xref>).</p>
<p>Moreover, many studies did not include a follow-up period after the end of the study. However, the need for oxygen demand and outcome may have been underestimated because the outcome of these patients may have occurred after the end of the study. With the effort for the quality required by the PROBAST (prediction model risk of bias assessment tool) guidelines and TRIPOD (transparent reporting of a multivariable prediction model for individual prognosis or diagnosis) reporting guidelines (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B17">17</xref>), this study aimed to develop and validate a prognostic machine-learning model that accurately predicts the need for oxygen therapy in the early stages of COVID-19 using external datasets from multiple institutions and to compare its predictive performance with traditional approaches, such as the A-DROP criteria (consisting of age of &#x02265;70 years in men or &#x02265;75 years in women, blood urea nitrogen of &#x02265;21 mg/dL or dehydration, oxyhemoglobin saturation measured by pulse oximetry of &#x02264; 90% or partial oxygen pressure in the arterial blood of &#x02264; 60 mmHg, confusion, and systolic blood pressure of &#x02264; 90 mmHg) (<xref ref-type="bibr" rid="B18">18</xref>).</p></sec>
<sec sec-type="materials and methods" id="s2">
<title>Materials and Methods</title>
<sec>
<title>Study Design, Source of Data, Participants Selection, and Follow Up</title>
<p>This multicenter retrospective cohort study analyzed patients with COVID-19 in 11 academic and community hospitals in different geographic regions across Fukui, Japan. The 11 medical institutions included two level-I and eight level-II equivalent trauma centers and a temporal medical institution. The mean annual hospitalizations are 160,000 and 90,000 in two level-I and seven level-II-equivalent trauma centers, respectively. <xref ref-type="supplementary-material" rid="SM1">Supplementary Table 1</xref> and <xref ref-type="supplementary-material" rid="SM3">Supplementary Figure 1</xref> show the size, location, and number of full-time physicians, hospital beds, annual outpatients, annual patients transported by ambulances, and annual hospitalized patients. The ethics review board of the University of Fukui Hospital and each participating medical institution approved the present study (approval number in the University of Fukui Hospital: 20200120). In addition, the waiver of informed consent before data collection was approved by the institutional review board of each participating medical institution. All procedures were performed according to the principles of the Declaration of Helsinki.</p>
<p>We retrospectively studied all consecutive patients with COVID-19 confirmed by reverse transcription-polymerase chain reaction (RT-PCR) using a pharyngeal swab test for model development and internal validation admitted to participating medical facilities. Since, the number of patients with COVID-19 in Fukui during the study period was relatively small, most patients diagnosed with COVID-19 were hospitalized and few were kept at home (&#x0003C;5% of all patients with COVID-19 in Fukui). We lent pulse oximeters to home care patients, instructed them on how to take measurements, and followed up with daily phone calls to check their condition. In this study, there were only a small number of patients who were initially to have mild disease and were followed up at home; hence, we could collect data closer to the actual situation.</p>
<p>We obtained electronic medical dataon the early stage of COVID-19 in patients admitted to 10 medical institutions (except the Ota Hospital) from July 1, 2020 to March 31, 2021 to develop prediction models and perform internal validation. This study defines medical data regarding the early stage of COVID-19 as data within 48 h of PCR confirmation or initial diagnosis. After admission to the hospital, antivirals, corticosteroids, and herbal medicines were administered by the attending physician according to the standardized methods of each medical institution.</p>
<p>In addition, for temporal and external validation, we retrospectively examined all consecutive patients with COVID-19 admitted to the University of Fukui Hospital, Fukui Prefectural Hospital, Japanese Red Cross Fukui Hospital, Fukui-ken Saiseikai Hospital, and Ota Hospital from April 1, 2021 to September 30, 2021.</p>
<p>Exclusion criteria were patients aged &#x0003C;17 years and pregnant patients. The present study aimed to develop and validate a machine-learning model to identify COVID-19 patients who are mildly ill at the time of initial diagnosis and who require oxygen therapy during the course of their illness. We also excluded patients with transcutaneous oxygen saturation (SpO<sub>2</sub>) &#x0003C;95%, patients receiving oxygen therapy (&#x0003E;1 L O<sub>2</sub>/min) before admission, and patients with no recorded SpO<sub>2</sub> at the time of initial diagnosis.</p>
<p>We performed a post-discharge telephone follow-up survey on all patients 2&#x02013;4 weeks after discharge to determine if any patient&#x00027;s condition worsened after discharge.</p>
</sec>
<sec>
<title>Outcomes</title>
<p>The outcome of interest was oxygen therapy, which indicates disease progression. Oxygen therapy was administered between the time of diagnosis by PCR-positive confirmation of COVID-19 and the time of discharge from the hospital after negative confirmation by PCR. Oxygen therapy was defined as follows: (1) SpO<sub>2</sub> was &#x02264; 94% at least once during hospitalization; (2) at least one oxygen administration of 1 L/min or more during hospitalization; (3) admission to the ICU; (4) intubation; and (5) discharge due to death. Therefore, patients who met these conditions were considered to have needed oxygen therapy.</p>
</sec>
<sec>
<title>Data Collection and Predictors of Machine-Learning Models</title>
<p>From the electronic medical records of 11 medical institutions, we extracted the following routine data in the early stages of COVID-19: patient demographics [age, sex, smoking history, alcohol, height, body weight, body mass index, and comorbidities (myocardinal infarction, cognitive heart failure, peripheral vascular disease, cerebrovascular disease, chronic obstructive pulmonary disease, bronchial asthma, chronic kidney disease, hypertension, diabetes mellites, and malignancy)], symptoms (fever, fatigue, sore throat, headache, rhinorrhea, arthralgia, diarrhea, loss of smell, dyspnea, muscle ache, loss of taste, disturbance of consciousness, and conjunctival hyperemia), vital signs (systolic and diastolic blood pressure and oxygen saturation), Glasgow coma scale, complete blood count (white blood cells, lymphocytes, and platelets), coagulation profile (prothrombin time, activated partial thromboplastin time, fibrinogen, and d-dimer), biochemistry (sodium, potassium, albumin, blood urea nitrogen, creatinine, lactate dehydrogenase, aspartate aminotransferase, and alanine aminotransferase), c-reactive protein, and X-ray examination (chest X-ray or chest computed tomography). Radiology specialists or internal medicine specialists reviewed all X-ray examinations and classified them into three categories: bilateral pneumonia, unilateral pneumonia, and no pneumonia. We also recorded the medications and treatment plans after admission and outcomes.</p>
</sec>
<sec>
<title>Statistical Analysis</title>
<p>We performed summary statistics to describe the characteristics of the patients and the patient&#x00027;s clinical course. After multiple imputations using random forests (<xref ref-type="bibr" rid="B19">19</xref>) (<xref ref-type="supplementary-material" rid="SM2">Supplementary Table 2</xref> shows the missing rate for predictors), we preprocessed predictors, including one-shot encoding (i.e., creation of dummy variables), normalization, and standardization. In the training set (80% random sample) with all available predictors, six machine-learning models were developed: (1) penalized logistic regression (<xref ref-type="bibr" rid="B20">20</xref>), (2) random forest (<xref ref-type="bibr" rid="B21">21</xref>), (3) support vector machine (<xref ref-type="bibr" rid="B22">22</xref>), (4) <italic>k</italic>-point nearest neighbor (<xref ref-type="bibr" rid="B23">23</xref>), (5) XG boost (<xref ref-type="bibr" rid="B24">24</xref>), and (6) multilayer perceptron (<xref ref-type="bibr" rid="B25">25</xref>) for each outcome. In addition, we selected one machine-learning model that achieved the highest prediction performance among the six models. With the best performance model, we calculated the importance of the variables that improved the c-statistics and selected the top eight variables that improved the model performance for future practical usability. Another reason we developed the model with eight variables was to meet the PROBAST standard, which requires a large data set with at least 10 events per candidate variable for model development and at least 100 events for external validation (<xref ref-type="bibr" rid="B16">16</xref>). We performed stratified three-fold cross-validation to determine the optimal hyperparameters with the highest c-statistic [i.e., the area under the receiver operating characteristic (ROC) curve]. We used the A-DROP criteria, which is a modified version of CURB-65 as the reference model (<xref ref-type="bibr" rid="B26">26</xref>).</p>
<p>We measured the performance of the reference model (the A-DROP criteria) and each machine-learning model on the test set (the remaining 20% random sample) for internal validation. We estimated the c-statistics for each model and examined the relevant metrics as follows: sensitivity, specificity, positive and negative predictive values, and positive and negative likelihood ratios. Based on the ROC curve from the Youden method, we determined the threshold for perspective prediction results (cutoff) to determine the best performance model (<xref ref-type="bibr" rid="B27">27</xref>). We also examined the calibration plots of the best-performing model for the outcome.</p>
<p>For temporal external validation, we collected electronic medical record information from five hospitals. Of all the available variables, we extracted the top eight variables with missing values of 20% or less and contributed the most to improving the c-statistics using the filter method (<xref ref-type="bibr" rid="B28">28</xref>). We also demonstrated the c-statistics for the best machine-learning model with the eight variables and examined the relevant metrics (i.e., sensitivity), calibration plots, slope, intercepts, and coefficient of determination using temporal independent variable datasets.</p>
<p>A two-sided <italic>P</italic>-value of &#x0003C;0.05 was considered statistically significant. Data were analyzed using Python (version 3.7.3) and R (version 3.6.2).</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec>
<title>Patient Characteristics</title>
<p>A total of 489 patients with COVID-19 admitted to one of the 11 participating medical institutions were recorded for model development and internal validation during the 9-month study period. Of these, we excluded 28 patients aged &#x0003C;18 years, 14 patients with no SpO<sub>2</sub> data at the first visit, and 51 patients who required oxygen administration of &#x0003E;1 L or SpO<sub>2</sub> of &#x0003C;95% at the time of admission. The remaining 396 patients were included in the analytic cohort for model development.</p>
<p>For external validation, 855 patients were admitted to one of the five participating medical institutions during the 4 months. Of these, we excluded 90 patients under the age of 18 and 37 patients who required oxygen at the time of admission. The remaining 728 patients were included in the analytic cohort for external validation.</p>
<p>Patient characteristics on the admission of patients with COVID-19 are shown in <xref ref-type="table" rid="T1">Table 1</xref>. <xref ref-type="table" rid="T2">Table 2</xref> shows the patients&#x00027; vital signs, laboratory findings, X-rays on admission, and outcomes.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Characteristics of the patient on the admission of the patients with COVID-19.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Variables</bold></th>
<th valign="top" align="left"><bold>Model developing</bold></th>
<th valign="top" align="left"><bold>External validation</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Age, median (IQR), year</td>
<td valign="top" align="left">54 (34&#x02013;70)</td>
<td valign="top" align="left">42 (27&#x02013;53)</td>
</tr>
<tr>
<td valign="top" align="left">Female</td>
<td valign="top" align="left">192 (48)</td>
<td valign="top" align="left">326 (45)</td>
</tr>
<tr>
<td valign="top" align="left">Smoking history<xref ref-type="table-fn" rid="TN1"><sup>&#x0002A;</sup></xref></td>
<td valign="top" align="left">116 (32)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Drinking alcohol<xref ref-type="table-fn" rid="TN2"><sup>&#x0002A;&#x0002A;</sup></xref></td>
<td valign="top" align="left">123 (52)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Height, median (IQR), cm</td>
<td valign="top" align="left">164 (157&#x02013;171)</td>
<td valign="top" align="left">165 (158&#x02013;173)</td>
</tr>
<tr>
<td valign="top" align="left">Body weight, median (IQR), kg</td>
<td valign="top" align="left">61 (52&#x02013;72)</td>
<td valign="top" align="left">62 (53&#x02013;73)</td>
</tr>
<tr>
<td valign="top" align="left">Body mass index, median (IQR), kg/m<sup>2</sup></td>
<td valign="top" align="left">23 (20&#x02013;25)</td>
<td valign="top" align="left">23 (20&#x02013;25)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3"><bold>Comorbidities</bold></td>
</tr>
<tr>
<td valign="top" align="left">Any comorbidity</td>
<td valign="top" align="left">193 (49)</td>
<td valign="top" align="left">170 (24)</td>
</tr>
<tr>
<td valign="top" align="left">Cardiovascular all</td>
<td valign="top" align="left">32 (9)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Myocardial infarction</td>
<td valign="top" align="left">16 (4)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Congestive heart failure</td>
<td valign="top" align="left">5 (1)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Peripheral vascular disease</td>
<td valign="top" align="left">3 (1)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Cerebrovascular disease</td>
<td valign="top" align="left">16 (4)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Chronic Obstructive Pulmonary Disease (COPD)</td>
<td valign="top" align="left">5 (1)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Bronchial asthma</td>
<td valign="top" align="left">16 (4)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Chronic lung disease (excluding COPD)</td>
<td valign="top" align="left">4 (1)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Chronic kidney disease (CKD)</td>
<td valign="top" align="left">9 (3)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Hypertension</td>
<td valign="top" align="left">117 (30)</td>
<td valign="top" align="left">90 (12)</td>
</tr>
<tr>
<td valign="top" align="left">Hyperlipidemia</td>
<td valign="top" align="left">48 (13)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Diabetes mellites</td>
<td valign="top" align="left">52 (14)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Malignancy</td>
<td valign="top" align="left">15 (4)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3"><bold>Symptoms</bold></td>
</tr>
<tr>
<td valign="top" align="left">Any symptoms</td>
<td valign="top" align="left">298 (75)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Fever (37.0 to 38.0&#x000B0;C)</td>
<td valign="top" align="left">190 (53)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Fever (38.0&#x000B0;C or more)</td>
<td valign="top" align="left">47 (13)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Malaise or fatigue</td>
<td valign="top" align="left">110 (31)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Sore throat</td>
<td valign="top" align="left">92 (26)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Headache</td>
<td valign="top" align="left">60 (17)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Rhinorrhea</td>
<td valign="top" align="left">71 (20)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Arthralgia</td>
<td valign="top" align="left">37 (10)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Diarrhea</td>
<td valign="top" align="left">9 (3)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Loss of smell</td>
<td valign="top" align="left">45 (13)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Dyspnea</td>
<td valign="top" align="left">15 (4)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Muscle ache</td>
<td valign="top" align="left">37 (31)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Loss of taste</td>
<td valign="top" align="left">39 (11)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Disturbance of consciousness</td>
<td valign="top" align="left">2 (1)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Conjunctival hyperemia</td>
<td valign="top" align="left">1 (0)</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Period from onset of symptom to PCR positive (IQR) (days)</td>
<td valign="top" align="left">3 (1&#x02013;6)</td>
<td valign="top" align="left">3 (1&#x02013;6)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>Data are shown as no (%) otherwise is specified</italic>.</p>
<p><italic>Cardiovascular diseases include congestive heart failure, unstable angina pectoris, atrial fibrillation, and hypertension. Respiratory diseases include bronchial asthma, chronic obstructive pulmonary disease (COPD), tuberculosis, pleuritis, and pneumonia. Malignancy includes colonic cancer, spinal tumor, brain tumor, prostate cancer, oral cancer, and malignant lymphoma</italic>.</p>
<p><italic>CKD, chronic kidney disease; GERD, gastroesophageal reflux disease; PCR, polymerase chain reaction</italic>.</p>
<fn id="TN1">
<label>&#x0002A;</label>
<p><italic>Smoking history includes patients who are currently smoking or smoking in the past</italic>.</p></fn>
<fn id="TN2">
<label>&#x0002A;&#x0002A;</label>
<p><italic>Drinking alcohol includes patients who drink daily or occasionally</italic>.</p></fn>
</table-wrap-foot>
</table-wrap>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Blood pressure, percutaneous oxygen saturation, laboratory findings, X-ray on admission, and outcome of the patients with COVID-19.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Variables</bold></th>
<th valign="top" align="center"><bold>Model developing</bold></th>
<th valign="top" align="center"><bold>External validation</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="3"><bold>Blood pressure</bold></td>
</tr>
<tr>
<td valign="top" align="left">Systolic blood pressure (mmHg)</td>
<td valign="top" align="center">126 (115&#x02013;139)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Diastolic blood pressure (mmHg)</td>
<td valign="top" align="center">83 (75&#x02013;91)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Saturation of percutaneous oxygen (%)</td>
<td valign="top" align="center">97 (96&#x02013;98)</td>
<td valign="top" align="center">98 (97&#x02013;98)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3"><bold>Complete blood count</bold></td>
</tr>
<tr>
<td valign="top" align="left">White blood cells (&#x000D7;103/&#x003BC;L)</td>
<td valign="top" align="center">46 (37&#x02013;56)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Lymphocytes (%)</td>
<td valign="top" align="center">25 (20&#x02013;34)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Platelets (&#x000D7;104/&#x003BC;L)</td>
<td valign="top" align="center">10 (16&#x02013;25)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3"><bold>Coagulation profile</bold></td>
</tr>
<tr>
<td valign="top" align="left">Prothrombin time (seconds)</td>
<td valign="top" align="center">11 (10&#x02013;12)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Activated partial thromboplastin time (seconds)</td>
<td valign="top" align="center">32 (30&#x02013;35)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Fibrinogen (mg/dl)</td>
<td valign="top" align="center">329 (247&#x02013;428)</td>
<td valign="top" align="center">343 (290&#x02013;404)</td>
</tr>
<tr>
<td valign="top" align="left">D-dimer (&#x003BC;g/ml)</td>
<td valign="top" align="center">0.8 (0.5&#x02013;1.1)</td>
<td valign="top" align="center">0.7 (0.51&#x02013;0.9)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3"><bold>Biochemistry</bold></td>
</tr>
<tr>
<td valign="top" align="left">Na (mEq/l)</td>
<td valign="top" align="center">140 (138&#x02013;141)</td>
<td valign="top" align="center">141 (140&#x02013;151)</td>
</tr>
<tr>
<td valign="top" align="left">K (mEq/l)</td>
<td valign="top" align="center">4 (3.8&#x02013;4.2)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Albumin (g/dl)</td>
<td valign="top" align="center">4.2 (3.9&#x02013;4.5)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Blood urea nitrogen (mg/dl)</td>
<td valign="top" align="center">12.6 (10.0&#x02013;15.3)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Creatinine (mg/dl)</td>
<td valign="top" align="center">0.78 (0.66&#x02013;0.95)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Lactate dehydrogenase (U/l)</td>
<td valign="top" align="center">194 (168&#x02013;235)</td>
<td/>
</tr>
<tr>
<td valign="top" align="left">Aspartate aminotransferase (U/l)</td>
<td valign="top" align="center">24 (20&#x02013;33)</td>
<td valign="top" align="center">23 (19&#x02013;32)</td>
</tr>
<tr>
<td valign="top" align="left">Alanine aminotransferase (U/I)</td>
<td valign="top" align="center">21 (14&#x02013;35)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3"><bold>Serum</bold></td>
</tr>
<tr>
<td valign="top" align="left">C-reactive protein (mg/dl)</td>
<td valign="top" align="center">0.45 (0.12&#x02013;1.59)</td>
<td valign="top" align="center">0.44 (0.14&#x02013;1.39)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">X-ray (pneumonia)</td>
</tr>
<tr>
<td valign="top" align="left">Non</td>
<td valign="top" align="center">170 (43)</td>
<td valign="top" align="center">382 (52)</td>
</tr>
<tr>
<td valign="top" align="left">Unilateral</td>
<td valign="top" align="center">42 (11)</td>
<td valign="top" align="center">78 (11)</td>
</tr>
<tr>
<td valign="top" align="left">Bilateral</td>
<td valign="top" align="center">106 (33)</td>
<td valign="top" align="center">244 (35)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3"><bold>Outcome</bold></td>
</tr>
<tr>
<td valign="top" align="left">A-DROP (&#x02265;1)</td>
<td valign="top" align="center">99 (25)</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Oxygen needs</td>
<td valign="top" align="center">102 (26)</td>
<td valign="top" align="center">106 (15)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>A-DROP, Age-dehydration-respiration-orientation-blood-pressure criteria</italic>.</p>
</table-wrap-foot>
</table-wrap>
<p>The median age was 54 years [interquartile range (IQR), 34&#x02013;70], and 48% of the participants were female. Overall, 102 (26%) and 106 (15%) patients needed oxygen therapy for model dataset development and external validation, respectively. A post-discharge telephone follow-up survey was performed on all patients 2&#x02013;4 weeks after discharge (&#x02265;95% capture rate), and no patients were readmitted.</p>
</sec>
<sec>
<title>Prediction Performance With all Available Variables and Important Variables</title>
<p><xref ref-type="table" rid="T3">Table 3</xref> summarizes the prediction performance of the A-DROP criteria (reference) and eight machine-learning models. Compared with the A-DROP criteria, the discrimination performance of the machine-learning models was significantly greater (<italic>P</italic> &#x0003C; 0.05), except for the <italic>k</italic>-point nearest-neighbor model. Among the six machine-learning models using all available variables, the XG boost had the highest c-statistic (0.89; 95% confidence interval [CI], 0.79&#x02013;0.96), with a sensitivity of 0.83 (95% CI, 075&#x02013;0.91), specificity of 0.90 (95% CI, 0.84&#x02013;0.96), the positive predictive value of 0.71 (95% CI, 0.61&#x02013;0.81), and the negative predictive value of 0.95 (95% CI, 0.90&#x02013;0.99). With the filter method for variable selection, we selected the eight important variables as follows: hypertension, age, any comorbidity, aspartate aminotransferase, lactate dehydrogenase, SpO<sub>2</sub> at the first visit, pneumonia, and C-reactive protein.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>The ability of eight machine-learning models and A-DROP as the risk stratification tool.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Models</bold></th>
<th valign="top" align="center"><bold>C-statistic</bold></th>
<th valign="top" align="center"><bold><italic>P</italic>-value</bold></th>
<th valign="top" align="center"><bold>Sensitivity</bold></th>
<th valign="top" align="center"><bold>Specificity</bold></th>
<th valign="top" align="center"><bold>PPV (95% CI)</bold></th>
<th valign="top" align="center"><bold>NPV (95% CI)</bold></th>
<th valign="top" align="center"><bold>PLR (95% CI)</bold></th>
<th valign="top" align="center"><bold>NLR (95% CI)</bold></th>
</tr>
<tr>
<th/>
<th valign="top" align="center"><bold>(95% CI)</bold></th>
<th/>
<th valign="top" align="center"><bold>(95% CI)</bold></th>
<th valign="top" align="center"><bold>(95% CI)</bold></th>
<th/>
<th/>
<th/>
<th/>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">A-DROP criteria &#x02265;1 (Reference)</td>
<td valign="top" align="center">0.69 (0.62&#x02013;0.75)</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">0.54 (0.48&#x02013;0.59)</td>
<td valign="top" align="center">0.83 (0.79&#x02013;0.87)</td>
<td valign="top" align="center">0.54 (0.48&#x02013;0.59)</td>
<td valign="top" align="center">0.83 (0.79&#x02013;0.87)</td>
<td valign="top" align="center">3.08 (2.24&#x02013;4.25)</td>
<td valign="top" align="center">0.56 (0.41&#x02013;0.77)</td>
</tr>
<tr>
<td valign="top" align="left">Penalized logistic regression</td>
<td valign="top" align="center">0.85 (0.75&#x02013;0.95)</td>
<td valign="top" align="center">0.01</td>
<td valign="top" align="center">0.79 (0.70&#x02013;0.88)</td>
<td valign="top" align="center">0.73 (0.64&#x02013;0.82)</td>
<td valign="top" align="center">0.56 (0.45&#x02013;0.66)</td>
<td valign="top" align="center">0.89 (0.82&#x02013;0.95)</td>
<td valign="top" align="center">2.96 (1.83&#x02013;4.77)</td>
<td valign="top" align="center">0.28 (0.18&#x02013;0.46)</td>
</tr>
<tr>
<td valign="top" align="left">Random forest</td>
<td valign="top" align="center">0.88 (0.78&#x02013;0.97)</td>
<td valign="top" align="center">&#x0003C;0.01</td>
<td valign="top" align="center">0.79 (0.70&#x02013;0.73)</td>
<td valign="top" align="center">0.96 (0.93&#x02013;1.00)</td>
<td valign="top" align="center">0.90 (0.84&#x02013;0.96)</td>
<td valign="top" align="center">0.92 (0.85&#x02013;0.97)</td>
<td valign="top" align="center">22.17 (5.60&#x02013;7.38)</td>
<td valign="top" align="center">0.22 (0.05&#x02013;0.86)</td>
</tr>
<tr>
<td valign="top" align="left">SVM</td>
<td valign="top" align="center">0.83 (0.73&#x02013;0.94)</td>
<td valign="top" align="center">0.03</td>
<td valign="top" align="center">0.75 (0.65&#x02013;0.84)</td>
<td valign="top" align="center">0.80 (0.71&#x02013;0.89)</td>
<td valign="top" align="center">0.62 (0.51&#x02013;0.75)</td>
<td valign="top" align="center">0.88 (0.81&#x02013;0.95)</td>
<td valign="top" align="center">3.82 (2.14&#x02013;6.81)</td>
<td valign="top" align="center">0.31 (0.17&#x02013;0.55)</td>
</tr>
<tr>
<td valign="top" align="left">KNN</td>
<td valign="top" align="center">0.78 (0.66&#x02013;0.91)</td>
<td valign="top" align="center">0.23</td>
<td valign="top" align="center">0.25 (0.16&#x02013;0.35)</td>
<td valign="top" align="center">0.98 (0.95&#x02013;1.00)</td>
<td valign="top" align="center">0.86 (0.78&#x02013;0.93)</td>
<td valign="top" align="center">0.75 (0.66&#x02013;0.85)</td>
<td valign="top" align="center">14.01 (1.78&#x02013;110)</td>
<td valign="top" align="center">0.76 (0.10&#x02013;6.01)</td>
</tr>
<tr>
<td valign="top" align="left">XG boost</td>
<td valign="top" align="center">0.89 (0.79&#x02013;0.96)</td>
<td valign="top" align="center">&#x0003C;0.01</td>
<td valign="top" align="center">0.83 (0.75&#x02013;0.91)</td>
<td valign="top" align="center">0.90 (0.84&#x02013;0.96)</td>
<td valign="top" align="center">0.71 (0.61&#x02013;0.81)</td>
<td valign="top" align="center">0.95 (0.90&#x02013;0.99)</td>
<td valign="top" align="center">8.61 (3.92&#x02013;18.9)</td>
<td valign="top" align="center">0.18 (0.08&#x02013;0.41)</td>
</tr>
<tr>
<td valign="top" align="left">MLP</td>
<td valign="top" align="center">0.86 (0.76&#x02013;0.96)</td>
<td valign="top" align="center">&#x0003C;0.01</td>
<td valign="top" align="center">0.54 (0.44&#x02013;0.65)</td>
<td valign="top" align="center">0.95 (0.89&#x02013;0.99)</td>
<td valign="top" align="center">0.81 (0.72&#x02013;0.90)</td>
<td valign="top" align="center">0.83 (0.74&#x02013;0.91)</td>
<td valign="top" align="center">10.11 (3.17&#x02013;32.8)</td>
<td valign="top" align="center">0.48 (0.15&#x02013;1.55)</td>
</tr>
<tr>
<td valign="top" align="left">XG boost with eight features (Internal validation)</td>
<td valign="top" align="center">0.92 (0.86&#x02013;0.98)</td>
<td valign="top" align="center">&#x0003C;0.001</td>
<td valign="top" align="center">0.94 (0.89&#x02013;0.99)</td>
<td valign="top" align="center">0.69 (0.59&#x02013;0.79)</td>
<td valign="top" align="center">0.47 (0.36&#x02013;0.59)</td>
<td valign="top" align="center">0.98 (0.94&#x02013;1.00)</td>
<td valign="top" align="center">3.08 (2.08&#x02013;4.56)</td>
<td valign="top" align="center">0.08 (0.05&#x02013;0.12)</td>
</tr>
<tr>
<td valign="top" align="left">XG boost with eight features (External validation)</td>
<td valign="top" align="center">0.88 (0.81&#x02013;0.95)</td>
<td valign="top" align="center">&#x0003C;0.001</td>
<td valign="top" align="center">0.64 (0.55&#x02013;0.71)</td>
<td valign="top" align="center">0.93 (0.88&#x02013;0.97)</td>
<td valign="top" align="center">0.61 (0.53&#x02013;0.68)</td>
<td valign="top" align="center">0.93 (0.89&#x02013;0.97)</td>
<td valign="top" align="center">8.77 (4.34&#x02013;17.7)</td>
<td valign="top" align="center">0.39 (0.19&#x02013;0.79)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>A-DROP criteria, age-dehydration-respiration-orientation-blood-pressure criteria</italic>.</p>
<p><italic>CI, confidence interval; PPV, positive predictive value; NPV, negative predictive value; PLR, positive likelihood ratio; NLR, negative likelihood ratio; KNN, K-point nearest neighbor; MLPerceptron, multilayer perceptron; XG boost, extreme gradient boosting</italic>.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>Prediction Performance and Feature Importance With Eight Variables</title>
<p>The prediction performance of the XG boost model using the eight variables is presented in <xref ref-type="table" rid="T3">Table 3</xref>. Compared with the A-DROP criteria, the discrimination performance of the XG boost models using the top eight essential variables was significantly greater (<italic>P</italic> &#x0003C; 0.001).</p>
<p>For internal validation, compared to the six machine-learning models using all available variables, the XG boost model using the eight variables had the highest c-statistic (0.92; 95% CI, 0.86&#x02013;0.98 vs. 0.69 in A-DROP criteria; <italic>P</italic> &#x0003C; 0.001), with a sensitivity of 0.94 (95% CI, 0.89&#x02013;0.99), specificity of 0.69 (95% CI, 0.59&#x02013;0.79), the positive predictive value of 0.47 (95% CI, 0.36&#x02013;0.59), and negative predictive value of 0.98 (95% CI, 0.94&#x02013;1.00).</p>
<p>For external validation using an independent data set of 728 patients, compared to the A-DROP criteria, the XG boost using the eight variables had a higher c-statistic (0.88; 95% CI, 0.81&#x02013;0.95 vs. 0.69 in A-DROP criteria; <italic>P</italic> &#x0003C; 0.001; <xref ref-type="fig" rid="F1">Figure 1</xref>), with a sensitivity of 0.64 (95% CI, 0.55&#x02013;0.71), specificity of 0.93 (95% CI, 0.88&#x02013;0.97), positive predictive value of 0.61 (95% CI, 0.53&#x02013;0.68), positive predictive value of 0.93 (95% CI, 0.89&#x02013;0.97]. SpO<sub>2</sub> at the first visit was the most important feature, followed by age, lactate dehydrogenase, and aspartate aminotransferase levels (<xref ref-type="table" rid="T4">Table 4</xref>).</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>C-statistic of XG Boost model with eight variables in external validation.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-09-846525-g0001.tif"/>
</fig>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Feature importance of XGboost with eight variables.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Variables</bold></th>
<th valign="top" align="center"><bold>Feature importance</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">SpO<sub>2</sub> at the first visit</td>
<td valign="top" align="center">0.26135576</td>
</tr>
<tr>
<td valign="top" align="left">Age</td>
<td valign="top" align="center">0.26132179</td>
</tr>
<tr>
<td valign="top" align="left">Lactate dehydrogenase</td>
<td valign="top" align="center">0.16435097</td>
</tr>
<tr>
<td valign="top" align="left">Aminotransferase</td>
<td valign="top" align="center">0.15464792</td>
</tr>
<tr>
<td valign="top" align="left">Any comorbidity</td>
<td valign="top" align="center">0.124125525</td>
</tr>
<tr>
<td valign="top" align="left">C-reactive protein</td>
<td valign="top" align="center">0.06478236</td>
</tr>
<tr>
<td valign="top" align="left">Hypertension</td>
<td valign="top" align="center">0.062515706</td>
</tr>
<tr>
<td valign="top" align="left">Pneumonia</td>
<td valign="top" align="center">&#x0003C;0.01</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>SpO<sub>2</sub>, transcutaneous oxygen saturation</italic>.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>Calibration Plot</title>
<p><xref ref-type="fig" rid="F2">Figure 2</xref> shows the calibration plots of the XG boost models using the eight variables for predicting outcomes for external validation. A positive relationship was observed between the predicted and actual risks in the calibration plots. The slope, intercept, and coefficient of determination of the calibration were 1.132, &#x02212;0.202, and 0.949 for external validation, respectively. The model-predicted probability for external validation almost matched the observed probabilities.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>XG boost model calibration plot in external validation.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-09-846525-g0002.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>In this study, we analyzed multicenter, retrospective data from 1,124 patients (396 for model development and internal validation, 728 for external validation) with COVID-19 and applied machine-learning models to predict oxygen therapy during the course of the infection. Specifically, most machine-learning models showed better discriminative performance than the traditional approach (i.e., the A-DROP criteria). In addition, these machine-learning models achieve a high negative predictive value in predicting outcomes, which may help us perform safer triage. To the best of our knowledge, this is the first study to investigate the performance of modern machine-learning models in predicting the need for oxygen therapy in early stage COVID-19 using a large multicenter dataset in Japan with the PROBAST standard.</p>
<p>It is challenging to admit all patients with COVID-19 in the current pandemic due to a lack of medical resources. The WHO guidelines recommend home treatment for patients with mild COVID-19 symptoms (<xref ref-type="bibr" rid="B29">29</xref>). Hence, the importance of accurate prediction for oxygen needs in the early state of COVID-19 has been emphasized, and many machine learning-based prognostic models have been developed (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>). However, most of their reported prediction ability may be optimistic because of the poorly reported study that did not follow PROBAST and the lack of external validation (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B16">16</xref>). In addition, since these studies have looked only at hospitalized patients and not at patients considered mildly ill in the early stages of COVID-19 who were kept home without careful observation, these studies do not comprise consecutive patient data, resulting in significant selection bias (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B30">30</xref>). The present study examined consecutive patients admitted to 11 participating medical institutions, and few patients were kept home. We followed the PROBAST standard, which recommends an extensive data set with at least 10 events per candidate variable for model development and at least 100 events for external validation to reduce bias (<xref ref-type="bibr" rid="B31">31</xref>).</p>
<p>The XG boost model with the eight variables validated by an external dataset in the present study shows a negative predictive value of 0.93 (95% CI, 0.89&#x02013;0.97). The model could contribute to a safer selection of low-risk patients at the initial diagnosis of COVID-19 and their safe management in home care under careful observation. In addition, accurate early prediction of oxygen requirements has several important implications in medical practice. For example, early identification of the potential risk of severe disease allows healthcare providers to develop individualized and optimal management strategies, prepare for hospitalization, and plan more careful follow-up.</p>
<p>Although the machine-learning models achieved significant predictive power, their performance remained imperfect. This can be explained, at least in part, by the limited number of predictors (e.g., the experience of healthcare professionals) and measurement errors in the data.</p>
<p>Furthermore, the A-DROP criterion is presumed to be simpler and easier to use. Although it is known that there is a trade-off between concise models, such as the A-DROP or CURB-65 criteria, the use of modern machine-learning models has the advantages in the era of health information technology, such as web-based applications, automated data entry through speech recognition, natural language processing, continuous model refinement through sequential extraction of electronic medical records, and reinforcement learning (<xref ref-type="bibr" rid="B32">32</xref>, <xref ref-type="bibr" rid="B33">33</xref>). Our findings and the recent advent of machine-learning approaches collectively support cautious optimism that machine learning may enhance the clinician&#x00027;s ability as an assistive technology in predicting patient outcomes in the early stage of COVID-19. We have already implemented this model as a web-based application and plan to triage future COVID-19 patients in Fukui Prefecture.</p>
<p>This study has several limitations. First, the current model is designed to predict disease progression to the stage in which oxygen therapy is required. Hence, the present study did not attempt to predict progression to a more severe stage requiring intubation or extracorporeal membrane oxygenation. However, external validation of this study showed that four people were intubated and three of them died, but the model determined that all of them were severely ill without any omissions. Second, although the current study was conducted with a geographically diverse patient population in Fukui Prefecture, our model may not generalize to other practice settings. Therefore, this model needs to be revalidated in other parts of Japan and outside Japan. The model should be validated in other countries outside Japan. Third, the AI model should be validated repeatedly with the new COVID19 variant. Generally, every AI model should be evaluated frequently with a new dataset to maintain its prediction performance. However, we developed the AI model mainly from the alpha variant of COVID19, and the AI model performed well in external validation that primarily consisted of the delta variant. In other words, the AI model can correctly predict the severity of COVID19 even when the model predicts patients with new COVID19 variants. The AI model predicts the severity using the human body&#x00027;s reaction, such as CRP, not using the virus itself. Therefore, we assume if the patient&#x00027;s response to a new variant of COVID19 is correctly reflected in blood data and radiographs, the AI model may accurately predict the patient&#x00027;s severity. Finally, machine-learning models have a common limitation in terms of interpretability.</p>
<p>In conclusion, based on multicenter retrospective data from 1,124 patients, we developed machine-learning models to predict the need for oxygen therapy during the course of COVID-19 at its early stages. We found that, compared to conventional approaches such as the A-DROP criteria, the machine-learning models had a higher ability to predict oxygen therapy.</p>
</sec>
<sec sec-type="data-availability" id="s5">
<title>Data Availability Statement</title>
<p>The datasets presented in this article are not readily available because we did not get permission to provide the dataset to publishers at each ethics review board of the participating hospital. Requests to access the datasets should be directed to Syunsuke Yamanaka, <email>yamanakasyunsuke&#x00040;yahoo.co.jp</email>.</p>
</sec>
<sec id="s6">
<title>Ethics Statement</title>
<p>The studies involving human participants were reviewed and approved by the Ethics Review Board of the University of Fukui Hospital. Written informed consent for participation was not required for this study in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec id="s7">
<title>Author Contributions</title>
<p>SY, HA, MY, YS, TW, HM, NY OY, and HH: contributed to the conception, design of the study, and organizing the database. SY and KM: performed the statistical analysis. SY: wrote the first draft of the manuscript. All authors contributed to manuscript revision, read, and approved the submitted version.</p>
</sec>
<sec sec-type="funding-information" id="s8">
<title>Funding</title>
<p>This study was financially supported by the health prevention division of the Fukui Prefecture.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>KM was employed by Connect Inc. The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x00027;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<ack><p>The authors acknowledge Hiroyuki Suto, MD, Ph.D. (Fukui Katsuyama General Hospital) and Manabu Kimura, MD (Nakamura Hospital) at the study hospitals for their assistance with this project.</p>
</ack>
<sec sec-type="supplementary-material" id="s10">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmed.2022.846525/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmed.2022.846525/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_2.DOCX" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Presentation_1.pptx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Arabi</surname> <given-names>YM</given-names></name> <name><surname>Murthy</surname> <given-names>S</given-names></name> <name><surname>Webb</surname> <given-names>S</given-names></name></person-group>. <article-title>COVID-19: a novel coronavirus and a novel challenge for critical care</article-title>. <source>Intensive Care Med</source>. (<year>2020</year>) <volume>46</volume>:<fpage>833</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1007/s00134-020-05955-1</pub-id><pub-id pub-id-type="pmid">32189010</pub-id></citation></ref>
<ref id="B2">
<label>2.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grasselli</surname> <given-names>G</given-names></name> <name><surname>Pesenti</surname> <given-names>A</given-names></name> <name><surname>Cecconi</surname> <given-names>M</given-names></name></person-group>. <article-title>Critical care utilization for the COVID-19 outbreak in Lombardy, Italy: early experience and forecast during an emergency response</article-title>. <source>JAMA.</source> (<year>2020</year>) <volume>323</volume>:<fpage>1545</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1001/jama.2020.4031</pub-id><pub-id pub-id-type="pmid">32167538</pub-id></citation></ref>
<ref id="B3">
<label>3.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Remuzzi</surname> <given-names>A</given-names></name> <name><surname>Remuzzi</surname> <given-names>G</given-names></name></person-group>. <article-title>COVID-19 and Italy: what next?</article-title> <source>Lancet</source>. (<year>2020</year>) <volume>395</volume>:<fpage>1225</fpage>&#x02013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(20)30627-9</pub-id><pub-id pub-id-type="pmid">32178769</pub-id></citation></ref>
<ref id="B4">
<label>4.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gao</surname> <given-names>Z</given-names></name> <name><surname>Xu</surname> <given-names>Y</given-names></name> <name><surname>Sun</surname> <given-names>C</given-names></name> <name><surname>Wang</surname> <given-names>X</given-names></name> <name><surname>Guo</surname> <given-names>Y</given-names></name> <name><surname>Qiu</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>A systematic review of asymptomatic infections with COVID-19</article-title>. <source>J Microbiol Immunol Infect</source>. (<year>2021</year>) <volume>54</volume>:<fpage>12</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmii.2020.05.001</pub-id><pub-id pub-id-type="pmid">32425996</pub-id></citation></ref>
<ref id="B5">
<label>5.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tabata</surname> <given-names>S</given-names></name> <name><surname>Imai</surname> <given-names>K</given-names></name> <name><surname>Kawano</surname> <given-names>S</given-names></name> <name><surname>Ikeda</surname> <given-names>M</given-names></name> <name><surname>Kodama</surname> <given-names>T</given-names></name> <name><surname>Miyoshi</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>Clinical characteristics of COVID-19 in 104 people with SARS-CoV-2 infection on the Diamond Princess cruise ship: a retrospective analysis</article-title>. <source>Lancet Infect Dis</source>. (<year>2020</year>) <volume>20</volume>:<fpage>1043</fpage>&#x02013;<lpage>50</lpage>. <pub-id pub-id-type="doi">10.1016/S1473-3099(20)30482-5</pub-id><pub-id pub-id-type="pmid">32539988</pub-id></citation></ref>
<ref id="B6">
<label>6.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>F</given-names></name> <name><surname>Yu</surname> <given-names>T</given-names></name> <name><surname>Du</surname> <given-names>R</given-names></name> <name><surname>Fan</surname> <given-names>G</given-names></name> <name><surname>Liu</surname> <given-names>Y</given-names></name> <name><surname>Liu</surname> <given-names>Z</given-names></name> <etal/></person-group>. <article-title>Clinical course and risk factors for mortality of adult inpatients with COVID-19 in Wuhan, China: a retrospective cohort study</article-title>. <source>Lancet</source>. (<year>2020</year>) <volume>395</volume>:<fpage>1054</fpage>&#x02013;<lpage>62</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(20)30566-3</pub-id><pub-id pub-id-type="pmid">32171076</pub-id></citation></ref>
<ref id="B7">
<label>7.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cui</surname> <given-names>Y</given-names></name> <name><surname>Sun</surname> <given-names>Y</given-names></name> <name><surname>Sun</surname> <given-names>J</given-names></name> <name><surname>Liang</surname> <given-names>H</given-names></name> <name><surname>Ding</surname> <given-names>X</given-names></name> <name><surname>Sun</surname> <given-names>X</given-names></name> <etal/></person-group>. <article-title>Efficacy and safety of corticosteroid use in coronavirus disease 2019 (COVID-19): a systematic review and meta-analysis</article-title>. <source>Infect Dis Ther</source>. (<year>2021</year>) <volume>10</volume>:<fpage>2447</fpage>&#x02013;<lpage>63</lpage>. <pub-id pub-id-type="doi">10.1007/s40121-021-00518-3</pub-id><pub-id pub-id-type="pmid">34389970</pub-id></citation></ref>
<ref id="B8">
<label>8.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nangaku</surname> <given-names>M</given-names></name> <name><surname>Kadowaki</surname> <given-names>T</given-names></name> <name><surname>Yotsuyanagi</surname> <given-names>H</given-names></name> <name><surname>Ohmagari</surname> <given-names>N</given-names></name> <name><surname>Egi</surname> <given-names>M</given-names></name> <name><surname>Sasaki</surname> <given-names>J</given-names></name> <etal/></person-group>. <article-title>The Japanese Medical Science Federation COVID-19 Expert Opinion English Version</article-title>. <source>JMA J</source>. (<year>2021</year>) <volume>4</volume>:<fpage>148</fpage>&#x02013;<lpage>62</lpage>. <pub-id pub-id-type="doi">10.31662/jmaj.2021-0002</pub-id><pub-id pub-id-type="pmid">33997449</pub-id></citation></ref>
<ref id="B9">
<label>9.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Branas</surname> <given-names>CC</given-names></name> <name><surname>Rundle</surname> <given-names>A</given-names></name> <name><surname>Pei</surname> <given-names>S</given-names></name> <name><surname>Yang</surname> <given-names>W</given-names></name> <name><surname>Carr</surname> <given-names>BG</given-names></name> <name><surname>Sims</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Flattening the curve before it flattens us: hospital critical care capacity limits and mortality from novel coronavirus (SARS-CoV2) cases in US counties</article-title>. <source>medRxiv</source>. (<year>2020</year>). <pub-id pub-id-type="doi">10.1101/2020.04.01.20049759</pub-id></citation>
</ref>
<ref id="B10">
<label>10.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sanders</surname> <given-names>JM</given-names></name> <name><surname>Monogue</surname> <given-names>ML</given-names></name> <name><surname>Jodlowski</surname> <given-names>TZ</given-names></name> <name><surname>Cutrell</surname> <given-names>JB</given-names></name></person-group>. <article-title>Pharmacologic treatments for coronavirus disease 2019 (COVID-19): a review</article-title>. <source>JAMA.</source> (<year>2020</year>) <volume>323</volume>:<fpage>1824</fpage>&#x02013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.1001/jama.2020.6019</pub-id><pub-id pub-id-type="pmid">32282022</pub-id></citation></ref>
<ref id="B11">
<label>11.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>YH</given-names></name> <name><surname>Hong</surname> <given-names>CM</given-names></name> <name><surname>Kim</surname> <given-names>DH</given-names></name> <name><surname>Lee</surname> <given-names>TH</given-names></name> <name><surname>Lee</surname> <given-names>J</given-names></name></person-group>. <article-title>Clinical course of asymptomatic and mildly symptomatic patients with coronavirus disease admitted to community treatment centers, South Korea</article-title>. <source>Emerg Infect Dis</source>. (<year>2020</year>) <volume>26</volume>:<fpage>2346</fpage>&#x02013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.3201/eid2610.201620</pub-id><pub-id pub-id-type="pmid">32568662</pub-id></citation></ref>
<ref id="B12">
<label>12.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shamsoddin</surname> <given-names>E</given-names></name></person-group>. <article-title>Can medical practitioners rely on prediction models for COVID-19? A systematic review</article-title>. <source>Evid Based Dent.</source> (<year>2020</year>) <volume>21</volume>:<fpage>84</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1038/s41432-020-0115-5</pub-id><pub-id pub-id-type="pmid">32978532</pub-id></citation></ref>
<ref id="B13">
<label>13.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wolff</surname> <given-names>RF</given-names></name> <name><surname>Moons</surname> <given-names>KGM</given-names></name> <name><surname>Riley</surname> <given-names>RD</given-names></name> <name><surname>Whiting</surname> <given-names>PF</given-names></name> <name><surname>Westwood</surname> <given-names>M</given-names></name> <name><surname>Collins</surname> <given-names>GS</given-names></name> <etal/></person-group>. <article-title>PROBAST: a tool to assess the risk of bias and applicability of prediction model studies</article-title>. <source>Ann Intern Med</source>. (<year>2019</year>) <volume>170</volume>:<fpage>51</fpage>&#x02013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.7326/M18-1376</pub-id><pub-id pub-id-type="pmid">30596876</pub-id></citation></ref>
<ref id="B14">
<label>14.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Najafabadi</surname> <given-names>ZAH</given-names></name> <name><surname>Ramspek</surname> <given-names>CL</given-names></name> <name><surname>Dekker</surname> <given-names>FW</given-names></name> <name><surname>Heus</surname> <given-names>P</given-names></name> <name><surname>Hooft</surname> <given-names>L</given-names></name> <name><surname>Moons</surname> <given-names>KGM</given-names></name> <etal/></person-group>. <article-title>TRIPOD statement: a preliminary pre-post analysis of reporting and methods of prediction models</article-title>. <source>BMJ Open</source>. (<year>2020</year>) <volume>10</volume>:<fpage>e041537</fpage>. <pub-id pub-id-type="doi">10.1136/bmjopen-2020-041537</pub-id><pub-id pub-id-type="pmid">32948578</pub-id></citation></ref>
<ref id="B15">
<label>15.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Collins</surname> <given-names>GS</given-names></name> <name><surname>Reitsma</surname> <given-names>JB</given-names></name> <name><surname>Altman</surname> <given-names>DG</given-names></name> <name><surname>Moons</surname> <given-names>KG</given-names></name></person-group>. <article-title>Transparent reporting of a multivariable prediction model for individual prognosis or diagnosis (TRIPOD): the TRIPOD statement</article-title>. <source>BMJ</source>. (<year>2015</year>) <volume>350</volume>:<fpage>g7594</fpage>. <pub-id pub-id-type="doi">10.1136/bmj.g7594</pub-id><pub-id pub-id-type="pmid">25627261</pub-id></citation></ref>
<ref id="B16">
<label>16.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wynants</surname> <given-names>L</given-names></name> <name><surname>Van Calster</surname> <given-names>B</given-names></name> <name><surname>Collins</surname> <given-names>GS</given-names></name> <name><surname>Riley</surname> <given-names>RD</given-names></name> <name><surname>Heinze</surname> <given-names>G</given-names></name> <name><surname>Schuit</surname> <given-names>E</given-names></name> <etal/></person-group>. <article-title>Prediction models for diagnosis prognosis of covid-19: systematic review critical appraisal</article-title>. <source>BMJ</source>. (<year>2020</year>) <volume>369</volume>:<fpage>m1328</fpage>. <pub-id pub-id-type="doi">10.1136/bmj.m1328</pub-id><pub-id pub-id-type="pmid">32265220</pub-id></citation></ref>
<ref id="B17">
<label>17.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moons</surname> <given-names>KG</given-names></name> <name><surname>Altman</surname> <given-names>DG</given-names></name> <name><surname>Reitsma</surname> <given-names>JB</given-names></name> <name><surname>Ioannidis</surname> <given-names>JP</given-names></name> <name><surname>Macaskill</surname> <given-names>P</given-names></name> <name><surname>Steyerberg</surname> <given-names>EW</given-names></name> <etal/></person-group>. <article-title>Transparent reporting of a multivariable prediction model for individual prognosis or diagnosis (TRIPOD): explanation and elaboration</article-title>. <source>Ann Intern Med</source>. (<year>2015</year>) <volume>162</volume>:<fpage>W1</fpage>&#x02013;<lpage>W73</lpage>. <pub-id pub-id-type="doi">10.7326/M14-0698</pub-id><pub-id pub-id-type="pmid">25560730</pub-id></citation></ref>
<ref id="B18">
<label>18.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Miyashita</surname> <given-names>N</given-names></name> <name><surname>Matsushima</surname> <given-names>T</given-names></name> <name><surname>Oka</surname> <given-names>M</given-names></name></person-group>. <article-title>The JRS guidelines for the management of community-acquired pneumonia in adults: an update and new recommendations</article-title>. <source>Intern Med</source>. (<year>2006</year>) <volume>45</volume>:<fpage>419</fpage>&#x02013;<lpage>28</lpage>. <pub-id pub-id-type="doi">10.2169/internalmedicine.45.1691</pub-id><pub-id pub-id-type="pmid">16679695</pub-id></citation></ref>
<ref id="B19">
<label>19.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stekhoven</surname> <given-names>DJ</given-names></name></person-group>. <source>Nonparametric Missing Value Imputation Using Random Forest.</source> R package version 1.4 (<year>2012</year>).<pub-id pub-id-type="pmid">32380076</pub-id></citation></ref>
<ref id="B20">
<label>20.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Warton</surname> <given-names>DI</given-names></name></person-group>. <article-title>Penalized normal likelihood and ridge regularization of correlation and covariance matrices</article-title>. <source>J Am Stat Assoc.</source> (<year>2008</year>) <volume>103</volume>:<fpage>340</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1198/016214508000000021</pub-id></citation>
</ref>
<ref id="B21">
<label>21.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Svetnik</surname> <given-names>V</given-names></name> <name><surname>Liaw</surname> <given-names>A</given-names></name> <name><surname>Tong</surname> <given-names>C</given-names></name> <name><surname>Culberson</surname> <given-names>JC</given-names></name> <name><surname>Sheridan</surname> <given-names>RP</given-names></name> <name><surname>Feuston</surname> <given-names>BP</given-names></name></person-group>. <article-title>Random forest: a classification and regression tool for compound classification and QSAR modeling</article-title>. <source>J Chem Inf Comput Sci.</source> (<year>2003</year>) <volume>43</volume>:<fpage>1947</fpage>&#x02013;<lpage>58</lpage>. <pub-id pub-id-type="doi">10.1021/ci034160g</pub-id><pub-id pub-id-type="pmid">14632445</pub-id></citation></ref>
<ref id="B22">
<label>22.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Suykens</surname> <given-names>JA</given-names></name> <name><surname>Vandewalle</surname> <given-names>J</given-names></name></person-group>. <article-title>Least squares support vector machine classifiers</article-title>. <source>Neural Process Lett</source>. (<year>1999</year>) <volume>9</volume>:<fpage>293</fpage>&#x02013;<lpage>300</lpage>. <pub-id pub-id-type="doi">10.1023/A:1018628609742</pub-id><pub-id pub-id-type="pmid">11972910</pub-id></citation></ref>
<ref id="B23">
<label>23.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bay</surname> <given-names>SD</given-names></name></person-group>. <article-title>Nearest neighbor classification from multiple feature subsets</article-title>. <source>Intell Data Anal</source>. (<year>1999</year>) <volume>3</volume>:<fpage>191</fpage>&#x02013;<lpage>209</lpage>. <pub-id pub-id-type="doi">10.1016/S1088-467X(99)00018-9</pub-id></citation>
</ref>
<ref id="B24">
<label>24.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>T</given-names></name> <name><surname>He</surname> <given-names>T</given-names></name> <name><surname>Benesty</surname> <given-names>M</given-names></name> <name><surname>Khotilovich</surname> <given-names>V</given-names></name> <name><surname>Tang</surname> <given-names>Y</given-names></name></person-group>. <source>Xgboost: Extreme Gradient Boosting</source>. R package version 0.4-2. 1-4 (<year>2015</year>).</citation>
</ref>
<ref id="B25">
<label>25.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pal</surname> <given-names>S</given-names></name> <name><surname>Mitra</surname> <given-names>S</given-names></name></person-group>. <article-title>Multilayer perceptron, fuzzy sets, and classification</article-title>. <source>IEEE Trans Neural Netw</source>. (<year>1992</year>) <volume>3</volume>:<fpage>683</fpage>&#x02013;<lpage>97</lpage>. <pub-id pub-id-type="doi">10.1109/72.159058</pub-id><pub-id pub-id-type="pmid">18276468</pub-id></citation></ref>
<ref id="B26">
<label>26.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shindo</surname> <given-names>Y</given-names></name> <name><surname>Sato</surname> <given-names>S</given-names></name> <name><surname>Maruyama</surname> <given-names>E</given-names></name> <name><surname>Ohashi</surname> <given-names>T</given-names></name> <name><surname>Ogawa</surname> <given-names>M</given-names></name> <name><surname>Imaizumi</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>Comparison of severity scoring systems A-DROP and CURB-65 for community-acquired pneumonia</article-title>. <source>Respirology.</source> (<year>2008</year>) <volume>13</volume>:<fpage>731</fpage>&#x02013;<lpage>5</lpage>. <pub-id pub-id-type="doi">10.1111/j.1440-1843.2008.01329.x</pub-id><pub-id pub-id-type="pmid">18713094</pub-id></citation></ref>
<ref id="B27">
<label>27.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tolga</surname> <given-names>T</given-names></name> <name><surname>Jiju</surname> <given-names>A</given-names></name></person-group>. <article-title>The assessment of quality in medical diagnostic tests: a comparison of ROC/Youden and Taguchi methods</article-title>. <source>Int J Health Care Qual Assur</source>. (<year>2000</year>) <volume>13</volume>:<fpage>300</fpage>&#x02013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1108/09526860010378744</pub-id><pub-id pub-id-type="pmid">11484648</pub-id></citation></ref>
<ref id="B28">
<label>28.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guyon</surname> <given-names>I</given-names></name> <name><surname>Elisseeff</surname> <given-names>A</given-names></name></person-group>. <article-title>An introduction to variable and feature selection</article-title>. <source>J Mach Learn Res</source>. (<year>2003</year>) <volume>3</volume>:<fpage>1157</fpage>&#x02013;<lpage>82</lpage>. <pub-id pub-id-type="doi">10.1162/153244303322753616</pub-id></citation>
</ref>
<ref id="B29">
<label>29.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>World Health Organization</collab></person-group>. <source>Home Care for Patients With COVID-19 Presenting With Mild Symptoms and Management of Their Contacts: Interim Guidance</source> (<year>2020</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.who.int/publications/i/item/home-care-for-patients-with-suspected-novel-coronavirus-(ncov)-infection-presenting-with-mild-symptoms-and-management-of-contacts">https://www.who.int/publications/i/item/home-care-for-patients-with-suspected-novel-coronavirus-(ncov)-infection-presenting-with-mild-symptoms-and-management-of-contacts</ext-link> (accessed March 17, 2020).</citation>
</ref>
<ref id="B30">
<label>30.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname> <given-names>M</given-names></name> <name><surname>Liu</surname> <given-names>J</given-names></name> <name><surname>Jiang</surname> <given-names>W</given-names></name> <name><surname>Yue</surname> <given-names>S</given-names></name> <name><surname>Liu</surname> <given-names>H</given-names></name> <name><surname>Wei</surname> <given-names>S</given-names></name></person-group>. <article-title>IL-6 and CD8&#x0002B; T cell counts combined are an early predictor of in-hospital mortality of patients with COVID-19</article-title>. <source>JCI Insight</source>. (<year>2020</year>) <volume>5</volume>:<fpage>e139024</fpage>. <pub-id pub-id-type="doi">10.1172/jci.insight.139024</pub-id><pub-id pub-id-type="pmid">32544099</pub-id></citation></ref>
<ref id="B31">
<label>31.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Collins</surname> <given-names>GS</given-names></name> <name><surname>Ogundimu</surname> <given-names>EO</given-names></name> <name><surname>Altman</surname> <given-names>DG</given-names></name></person-group>. <article-title>Sample size considerations for the external validation of a multivariable prognostic model: a resampling study</article-title>. <source>Stat Med</source>. (<year>2016</year>) <volume>35</volume>:<fpage>214</fpage>&#x02013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.1002/sim.6787</pub-id><pub-id pub-id-type="pmid">26553135</pub-id></citation></ref>
<ref id="B32">
<label>32.</label>
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Freeman</surname> <given-names>MB,. Method Apparatus for Automated Data Entry. Google Patents</given-names></name></person-group> (<year>2001</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://patents.justia.com/patent/6299063">https://patents.justia.com/patent/6299063</ext-link> (accessed January 14, 2022).</citation>
</ref>
<ref id="B33">
<label>33.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Thanaki</surname> <given-names>J</given-names></name></person-group>. <source>Python Natural Language Processing.</source> <publisher-loc>Birmingham</publisher-loc>: <publisher-name>Packt Publishing Ltd.</publisher-name> (<year>2017</year>).</citation>
</ref>
</ref-list> 
</back>
</article>