<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" dtd-version="1.3" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Med.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Medicine</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Med.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-858X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmed.2026.1729990</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Artificial intelligence algorithm to predict the requirement of neonatal endotracheal intubation within 3 h: application for clinical practice</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Park</surname> <given-names>JinCheol</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<uri xlink:href="https://loop.frontiersin.org/people/3251115"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Yang</surname> <given-names>Minuk</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Kim</surname> <given-names>Ka Hyun</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Kim</surname> <given-names>Geun-Hyeong</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Park</surname> <given-names>Seung</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x00026; editing</role>
<uri xlink:href="https://loop.frontiersin.org/people/2618670"/>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>College of Medicine, Chungbuk National University</institution>, <city>Cheongju-si, Chungcheongbuk-do</city>, <country country="kp">Republic of Korea</country></aff>
<aff id="aff2"><label>2</label><institution>Development, Mediv Corp.</institution>, <city>Cheongju-si, Chungcheongbuk-do</city>, <country country="kp">Republic of Korea</country></aff>
<aff id="aff3"><label>3</label><institution>Department of Biomedical Engineering, Chungbuk National University Hospital</institution>, <city>Cheongju-si, Chungcheongbuk-do</city>, <country country="kp">Republic of Korea</country></aff>
<author-notes>
<corresp id="c001"><label>&#x0002A;</label>Correspondence: Geun-Hyeong Kim, <email xlink:href="mailto:kgh5408@nate.com">kgh5408@nate.com</email>; Seung Park, <email xlink:href="mailto:spark.cbnuh@gmail.com">spark.cbnuh@gmail.com</email></corresp>
<fn fn-type="equal" id="fn001"><label>&#x02020;</label><p>These authors have contributed equally to this work</p></fn></author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-20">
<day>20</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>13</volume>
<elocation-id>1729990</elocation-id>
<history>
<date date-type="received">
<day>22</day>
<month>10</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>13</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>23</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2026 Park, Yang, Kim, Kim and Park.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Park, Yang, Kim, Kim and Park</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-20">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Timely intervention, such as endotracheal intubation (EI), is crucial for managing acute respiratory distress in the neonatal intensive care unit (NICU). Delays in EI can lead to significant adverse effects in neonates. This study aimed to develop a highly accurate predictive model to forecast the requirement for EI, allowing for proactive clinical planning and intervention up to 3 h in advance.</p>
</sec>
<sec>
<title>Method</title>
<p>We developed a multimodal deep learning model designed to simultaneously analyze distinct data types. The model utilizes numeric initial clinical data and time-series vital sign data collected over the preceding 1&#x02013;3 h. To rigorously evaluate the model&#x00027;s reliability and clinical applicability, we performed comprehensive external validation using independent patient datasets, specifically assessing generalization and bias.</p>
</sec>
<sec>
<title>Result</title>
<p>The constrained model successfully predicted the requirement for EI with high predictive power across various forecasting intervals (up to 72 h in 1-h increments). Internal validation yielded an accuracy of 0.9579 and AUC of 0.9323, while external validation maintained high generalization (accuracy 0.9411, AUC 0.9336).</p>
</sec>
<sec>
<title>Discussion</title>
<p>The proposed multimodal deep learning model provides an effective tool for the advance prediction of EI requirements in neonates. Given its high accuracy, confirmed generalization capabilities through external validation, and potential to prevent severe respiratory distress problems by facilitating proactive care, this model holds wide and significant applicability in clinical NICU environments.</p>
</sec></abstract>
<kwd-group>
<kwd>deep learning</kwd>
<kwd>endotracheal intubation</kwd>
<kwd>multimodal network</kwd>
<kwd>neonatal intensive care units</kwd>
<kwd>neonates</kwd>
</kwd-group>
<funding-group>
<award-group id="gs1">
<funding-source id="sp1">
<institution-wrap>
<institution>National Research Foundation of Korea</institution>
<institution-id institution-id-type="doi" vocab="open-funder-registry" vocab-identifier="10.13039/open_funder_registry">10.13039/501100003725</institution-id>
</institution-wrap>
</funding-source>
</award-group>
<award-group id="gs2">
<funding-source id="sp2">
<institution-wrap>
<institution>Chungbuk National University</institution>
<institution-id institution-id-type="doi" vocab="open-funder-registry" vocab-identifier="10.13039/open_funder_registry">10.13039/501100002461</institution-id>
</institution-wrap>
</funding-source>
</award-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This research was supported by the Regional Innovation System &#x00026; Education (RISE) program through the Chungbuk Regional Innovation System &#x00026; Education Center, funded by the Ministry of Education (MOE) and the Chungcheongbuk-do, Republic of Korea. (2025-RISE-11-004-03). This work was supported by a funding for the academic research program of Chungbuk National University in 2024.</funding-statement>
</funding-group>
<counts>
<fig-count count="9"/>
<table-count count="2"/>
<equation-count count="5"/>
<ref-count count="26"/>
<page-count count="14"/>
<word-count count="7207"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Intensive Care Medicine and Anesthesiology</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<label>1</label>
<title>Introduction</title>
<p>Endotracheal intubation (EI) is a critical life-sustaining procedure for patients experiencing respiratory distress. Traditionally, EI decisions are made based on clinical assessment and available physiologic indicators, including vital signs and clinical scoring systems (<xref ref-type="bibr" rid="B1">1</xref>&#x02013;<xref ref-type="bibr" rid="B3">3</xref>). Timely and accurate identification of newborns who are likely to require EI remains challenging in clinical practice because their clinical presentations and physiologic conditions can vary widely. In addition, delayed or inappropriate airway management in newborns with worsening respiratory failure can be associated with serious complications, including hypoxemia and bradycardia (<xref ref-type="bibr" rid="B4">4</xref>&#x02013;<xref ref-type="bibr" rid="B6">6</xref>). Therefore, given these concerns, objective and quantifiable decision-support tools are needed to facilitate EI decision-making.</p>
<p>Recent studies have demonstrated that artificial intelligence (AI) models can support physicians in decision-making by predicting the optimal timing for EI based on patient data (<xref ref-type="bibr" rid="B7">7</xref>&#x02013;<xref ref-type="bibr" rid="B10">10</xref>). To predict the need for EI at the time of patient admission, Nopour et al. (<xref ref-type="bibr" rid="B7">7</xref>) and Yu et al. (<xref ref-type="bibr" rid="B8">8</xref>) developed models based on multilayer perceptron (MLP) and eXtreme Gradient Boosting (XGBoost), respectively. Arvind et al. (<xref ref-type="bibr" rid="B9">9</xref>) utilized a random forest algorithm to predict EI requirements by analyzing time-series data, including blood pressure, respiratory rate, and oxygen saturation, at 12-h intervals over 3 days. Siu et al. (<xref ref-type="bibr" rid="B10">10</xref>) not only predicted the necessity of EI within 24 h for patients with respiratory distress but also identified key contributing variables in the model&#x00027;s decision-making process using Shapley additive explanations. Furthermore, Jueng-Eun et al. (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B12">12</xref>) proposed AI models that can predict the timing of EI in 1-h intervals up to 12 h in advance. Their models leveraged initial clinical data from neonatal intensive care units (NICUs) along with hourly vital sign measurements for neonates experiencing respiratory distress.</p>
<p>However, previous studies (<xref ref-type="bibr" rid="B7">7</xref>&#x02013;<xref ref-type="bibr" rid="B12">12</xref>) have three limitations. First, some studies (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B8">8</xref>) do not reflect the health status of the patient over time. Physicians typically assess the condition of a patient by monitoring variations in vital signs, such as heart rate and oxygen saturation; however, these studies relied solely on initial clinical data obtained at the time of admission, without incorporating temporal changes in patient health. Second, the prediction time intervals set by previous studies (<xref ref-type="bibr" rid="B9">9</xref>&#x02013;<xref ref-type="bibr" rid="B12">12</xref>) are limited. As delayed EI causes adverse effects, the prediction interval for EI should be short with the capability of long-term predictions. Nonetheless, previous studies (<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B10">10</xref>) either predicted EI application in 12-h intervals or began the prediction only 12 h after NICU admission. Moreover, although NICU patients are often hospitalized for extended periods, some studies (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B12">12</xref>) only predicted EI application within the first 12 h after admission. Finally, existing models (<xref ref-type="bibr" rid="B7">7</xref>&#x02013;<xref ref-type="bibr" rid="B10">10</xref>) may not be applicable to neonatal patients. Neonates exhibit distinct physiological characteristics in their respiratory and circulatory systems compared to adults (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B14">14</xref>). As a result, EI prediction models originally designed for adult patients may not be suitable for neonatal use. Therefore, AI models should be developed to enable real-time assessment of patient health status, incorporate clinically relevant prediction intervals, and account for the unique physiological characteristics of neonates.</p>
<p>To address these limitations, we developed a multimodal model that integrates two types of data: initial clinical data (numerical data) and vital signs (time-series data). An overview of the proposed workflow is shown in <xref ref-type="fig" rid="F1">Figure 1</xref>. The model utilizes a multilayer perceptron (MLP) to process numerical data and a long short-term memory (LSTM)&#x02013;transformer architecture to analyze time-series data. LSTM&#x02013;Transformer is designed to capture micro-dynamics and inter-signal dependencies. To evaluate the model&#x00027;s performance and generalizability, we trained and internally validated it using a dataset of 432 patients from our institution, Chungbuk National University Hospital (CBNUH). External validation was conducted using a separate dataset of 176 patients from Chungnam National University Hospital (CNUH). Additionally, we extended the prediction window to 72 h after admission and enabled EI prediction at hourly intervals up to 3 h in advance, providing sufficient time for clinical preparation.</p>
<fig position="float" id="F1">
<label>Figure 1</label>
<caption><p>Overview of the development and validation process for an artificial intelligence model predicting the timing of endotracheal intubation (EI) in neonates.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-13-1729990-g0001.tif">
<alt-text content-type="machine-generated">Diagram illustrating an AI model for neonatal intensive care. It emphasizes the need for AI in the NICU to predict intubation using data on heart rate (HR), respiratory rate (RR), and oxygen saturation (SpO2). A timeline shows prediction three hours before actual intubation. The AI model process includes data collection at NICU admission, preprocessing numeric and time-series data, and using model architectures like MLP, LSTM, and Transformer Encoder for binary classification between intubation and non-intubation.</alt-text>
</graphic>
</fig>
<p>In summary, the contributions of our research are as follows:</p>
<list list-type="bullet">
<list-item><p>We developed an EI prediction model designed for neonatal patients.</p></list-item>
<list-item><p>We validated the generalization of the proposed model using a dataset from an external institution.</p></list-item>
<list-item><p>We predicted patients requiring EI at 1-h intervals and within 3 h, taking into account real-world clinical settings. Moreover, we extended the scope to predict neonatal patients up to 72 h after admission.</p></list-item>
</list>
</sec>
<sec id="s2">
<label>2</label>
<title>Method</title>
<sec>
<label>2.1</label>
<title>Datasets</title>
<p>We collected the dataset for model training to predict EI and for internal validation at CBNUH, located in Cheong-Ju, Republic of Korea, between July 3, 2020, and August 4, 2023. The institutional review board (IRB) of CBNUH approved this study (IRB No. CBNUH 2021-02-034-001). For external validation, an additional dataset was collected at CNUH, located in Daejeon, Republic of Korea, between October 1, 2019, and June 30, 2021. This study was approved by the IRB of CNUH (IRB No. CNUH 2023-07-031). Both datasets were retrospectively collected through manual transcription of electronic medical records (EMRs), and all patient data were subsequently anonymized. We confirm that all methods were conducted in accordance with relevant ethical guidelines and regulations.</p>
<p>We established exclusion criteria to ensure the selection of a cohort relevant to the study objectives and maintain the integrity and reliability of the study results. The exclusion criteria included the following: (a) patients without dyspnea; (b) patients who had already underwent EI on admission to the NICU; (c) patients who had died within 72 h of admission; (d) patients hospitalized for more than 48 h after birth; and (e) patients with two or more missing numeric data. We selected the aforementioned criteria for the following reasons. Criteria (a)&#x02013;(c) were not relevant to our study, which aimed to predict EI within 72 h of admission. Additionally, patients hospitalized more than 48 after birth were excluded due to an insufficient number of available data. Furthermore, since missing data exceeding 10% may cause bias in estimates (<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B16">16</xref>), we excluded patients with more than two missing numeric data. A total of 1,387 data points were collected from CBNUH, of which 955 cases were excluded based on the exclusion criteria, leaving 432 cases for model training and internal validation (<xref ref-type="fig" rid="F2">Figure 2a</xref>). For the external validation, 761 data were collected from CNUH, with 587 cases excluded, resulting in 174 cases used for external validation (<xref ref-type="fig" rid="F2">Figure 2b</xref>).</p>
<fig position="float" id="F2">
<label>Figure 2</label>
<caption><p>Flowchart of the data selection processes: <bold>(a)</bold> the dataset collected from Chungbuk National University Hospital (CBNUH) for development and internal validation; and <bold>(b)</bold> the dataset collected from Chungnam National University Hospital (CNUH) for external validation.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-13-1729990-g0002.tif">
<alt-text content-type="machine-generated">Flowcharts illustrating participant eligibility assessment. Chart (a) shows 1,387 assessed, with 955 excluded, and 432 enrolled, divided into 98 intubation and 334 non-intubation. Chart (b) shows 761 assessed, 587 excluded, and 174 enrolled, split into 9 intubation and 165 non-intubation. Exclusion reasons include no respiratory distress, intubation at admission, early death, late admission, and missing data.</alt-text>
</graphic>
</fig>
<p>The collected variables included perinatal factors, arterial blood gas analysis (ABGA), patient vital signs, the Clinical Risk Index for Babies (CRIB) II score (<xref ref-type="bibr" rid="B17">17</xref>), and EI application status (<xref ref-type="table" rid="T1">Table 1</xref>). Perinatal factors comprised 12 variables: place of birth, gestational age, birth weight, gender, 1-min Apgar score, 5-min Apgar score, delivery type, antenatal steroid administration, pregnancy-induced hypertension, gestational diabetes mellitus, premature rupture of membranes, and multiple gestation. To assess neonatal clinical risk, we calculated the CRIB II score and used ABGA results that included pH, pCO<sub>2</sub>, pO<sub>2</sub>, base excess, and lactate concentration. All blood gas measurements included in the dataset were arterial samples as documented in the EMR; capillary blood gas analyses were not included. Additionally, four vital signs were collected: body temperature, heart rate (HR), respiratory rate (RR), and saturation measured via pulse oximetry (SpO<sub>2</sub>). Body temperature was recorded at admission, while HR, RR, and SpO<sub>2</sub> were measured at 1-h intervals for up to 72 h. Hourly HR, RR, and SpO<sub>2</sub> values were primarily transferred automatically from bedside monitoring devices to the EMR. If an hourly value was missing, we used the nearest nurse-charted value within &#x000B1; 30 min of the target time point when available.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Descriptions of the collected clinical variables in the dataset.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left" colspan="2"><bold>Variable</bold></th>
<th valign="top" align="left"><bold>Value [unit]</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" rowspan="11">Prenatal factors</td>
<td valign="top" align="left">Place of birth</td>
<td valign="top" align="left">0: Outside hospital, 1: In hospital</td>
</tr>
<tr>
<td valign="top" align="left">Gestational age</td>
<td valign="top" align="left">204&#x02013;296 [day]</td>
</tr>
<tr>
<td valign="top" align="left">Birth weight</td>
<td valign="top" align="left">870&#x02013;5,200 [g]</td>
</tr>
<tr>
<td valign="top" align="left">1 min Apgar score</td>
<td valign="top" align="left">1&#x02013;10</td>
</tr>
<tr>
<td valign="top" align="left">5 min Apgar score</td>
<td valign="top" align="left">3&#x02013;10</td>
</tr>
<tr>
<td valign="top" align="left">Delivery type</td>
<td valign="top" align="left">0: Natural birth, 1: C-section</td>
</tr>
<tr>
<td valign="top" align="left">Antenatal steroid administration</td>
<td valign="top" align="left">0: No, 1: Yes</td>
</tr>
<tr>
<td valign="top" align="left">Pregnancy hypertension</td>
<td valign="top" align="left">0: No, 1: Yes</td>
</tr>
<tr>
<td valign="top" align="left">Gestational diabetes mellitus</td>
<td valign="top" align="left">0: No, 1: Yes</td>
</tr>
<tr>
<td valign="top" align="left">Premature rupture of membranes</td>
<td valign="top" align="left">0: No, 1: Yes</td>
</tr>
<tr>
<td valign="top" align="left">Multi-birth</td>
<td valign="top" align="left">0: No multiples, 1: First, 2: Second, 3: Third or more</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="5">ABGA</td>
<td valign="top" align="left">pH</td>
<td valign="top" align="left">7.01&#x02013;7.571</td>
</tr>
<tr>
<td valign="top" align="left">pCO<sub>2</sub></td>
<td valign="top" align="left">24.3&#x02013;88.6 [mmHg]</td>
</tr>
<tr>
<td valign="top" align="left">pO<sub>2</sub></td>
<td valign="top" align="left">18.8&#x02013;138 [mmHg]</td>
</tr>
<tr>
<td valign="top" align="left">Base Excess</td>
<td valign="top" align="left">&#x02013;16.5&#x02013;18.5 [Mmol/L]</td>
</tr>
<tr>
<td valign="top" align="left">Lactate</td>
<td valign="top" align="left">0.8&#x02013;13.7 [Mmol/L]</td>
</tr>
<tr>
<td valign="top" align="left" rowspan="4">Vital sign</td>
<td valign="top" align="left">HR</td>
<td valign="top" align="left">28&#x02013;272 [Beats/min]</td>
</tr>
<tr>
<td valign="top" align="left">RR</td>
<td valign="top" align="left">10&#x02013;145 [Breaths/min]</td>
</tr>
<tr>
<td valign="top" align="left">SpO<sub>2</sub></td>
<td valign="top" align="left">10&#x02013;100 [%]</td>
</tr>
<tr>
<td valign="top" align="left">Body temperature</td>
<td valign="top" align="left">34&#x02013;38.2 [&#x000B0;C]</td>
</tr>
<tr>
<td valign="top" align="left">CRIB II score</td>
<td valign="top" align="left">CRIB II score</td>
<td valign="top" align="left">1&#x02013;10</td>
</tr>
<tr>
<td valign="top" align="left">Intubation</td>
<td valign="top" align="left">EI</td>
<td valign="top" align="left">0: Non-intubation, 1: Intubation</td>
</tr></tbody>
</table>
</table-wrap>
<p>During the study period, neonatal respiratory management at both centers followed routine standard-of-care practices guided by the attending neonatologist; for transparency, we explicitly list the key clinical indications used to determine EI in the manuscript. EI was determined by the attending neonatologist based on common clinical indications, including persistent or worsening respiratory failure despite non-invasive respiratory support, recurrent apnea requiring ventilatory support, progressive respiratory acidosis or hypercapnia on ABGA, and the need for stabilization or airway protection.</p>
<p>The final collected dataset comprised both numerical and time-series data. To facilitate EI prediction within a 3-h window, we applied pre-processing methods tailored to each data type. The pre-processing steps for the numerical and time series data are described below.</p>
<sec>
<label>2.1.1</label>
<title>Numeric data pre-processing</title>
<sec>
<label>2.1.1.1</label>
<title>Nominal data encoding</title>
<p>We converted text-based nominal data (place of birth, sex, delivery type, antenatal steroid administration, gestational hypertension, gestational diabetes mellitus, preterm rupture of membrane, and multi-birth) into numeric data suitable for model analysis. The encoding results are shown in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
</sec>
<sec>
<label>2.1.1.2</label>
<title>Handling missing values in numeric data</title>
<p>Numeric data with more than two missing values were excluded from the dataset, ensuring that all retained numerical data contained at most one missing value. For this missing value, we replaced the nominal data (encoded as numerical data) with the mode value, and discrete and continuous data (gestational age, birth weight, 1-min Apgar score, 5-min Apgar score, pH, pCO<sub>2</sub>, pO<sub>2</sub>, base excess, lactate, and CRIB II score) with the mean value.</p>
</sec>
</sec>
<sec>
<label>2.1.2</label>
<title>Time-series data pre-processing</title>
<sec>
<label>2.1.2.1</label>
<title>Outlier handling in data</title>
<p>In time-series data analysis, outliers can adversely impact model performance. Therefore, zero values in the HR and RR data were treated as missing (NaN) and subsequently processed alongside other missing values. Since data from neonatal patients who died during hospitalization had already been excluded during data collection, zero values in HR and RR were identified as outliers measured likely recorded while the patient was crying or sleeping.</p>
</sec>
<sec>
<label>2.1.2.2</label>
<title>Handling missing values in time-series data</title>
<p>In the collected dataset, 46.9% (46/98) of positive cases occurred within the first 3 h of hospitalization. Therefore, we applied a different imputation method for missing values based on 3 h. For time-series data recorded within the first 3 h, we imputed missing values by backward filling. This approach was chosen because the short data intervals between 0 and 2 h made it challenging to apply interpolation-based methods. For data after 3 h, we applied linear interpolation, which is a conventional method for handling missing values.</p>
</sec>
<sec>
<label>2.1.2.3</label>
<title>Feature labeling in data and extraction of the last 3 h</title>
<p>The collected dataset contained information on whether intubation was performed within 72 h after NICU admission. As shown in <xref ref-type="fig" rid="F3">Figure 3</xref>, we labeled the data features to enable the model to predict the need for intubation within a 3-h window. For positive cases, data points within 3 h prior to intubation were labeled as intubation. Data points recorded more than 4 h before intubation were excluded from model training to improve prediction accuracy. This exclusion was necessary because such data points could introduce ambiguity, potentially indicating the possibility of EI even in cases labeled as negative. Conversely, for negative cases, all data points were labeled as non-intubation. Across all time intervals, we extracted the last 3 h of data for each data sample and used it to train the model.</p>
<fig position="float" id="F3">
<label>Figure 3</label>
<caption><p>The process of pre-processing time-series data: Positive data were labeled as positive for data point corresponding to 3 h before the intubation time, and negative data point were labeled as negative for data in 1-h intervals.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-13-1729990-g0003.tif">
<alt-text content-type="machine-generated">Flowchart titled &#x0201C;Feature Labeling &#x00026; Extraction of the last 3 h&#x0201D; outlines data extraction from NICU admission. For positive patients, three positive samples are extracted around intubation time. For negative patients, seventy samples are extracted continuously. Data is represented in blocks indicating specific hours used for feature extraction.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec>
<label>2.1.3</label>
<title>Z-score standardization</title>
<p>Finally, we applied z-score standardization to all numerical and time-series data. This method transforms the data into a standard normal distribution, where the mean is zero and the standard deviation is one, as follows:</p>
<disp-formula id="EQ1"><mml:math id="M1"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mi>Z</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>x</mml:mi><mml:mo>-</mml:mo><mml:mi>&#x003BC;</mml:mi></mml:mrow><mml:mrow><mml:mi>&#x003C3;</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(1)</label></disp-formula>
<p>where <italic>x</italic> represents an individual data point, &#x003BC; denotes the mean, and &#x003C3; represents the standard deviation of the corresponding data. However, for time-series data, the z-score was calculated using the mean and standard deviation of HR, RR, and SpO<sub>2</sub> over the 0&#x02014;72 h period for each patient individually. This approach was chosen because calculating the mean and standard deviation across the entire patient population would obscure individual temporal trends, making it difficult to capture patient-specific variations over time.</p>
</sec>
</sec>
<sec>
<label>2.2</label>
<title>Model architecture</title>
<p>This section describes the multimodal model for predicting the probability of EI in NICU patients. As shown in <xref ref-type="fig" rid="F4">Figure 4</xref>, to analyze the heterogeneous data, we designed a multimodal model for the integrated analysis of numeric and time-series data. Unlike previous MLP&#x02013;LSTM (<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B19">19</xref>) or MLP&#x02013;Transformer (<xref ref-type="bibr" rid="B20">20</xref>) models, our architecture explicitly combines both temporal dependency modeling (via LSTM) and inter-signal attention (via Transformer), improving robustness against irregular NICU measurements. The numeric and time-series data are analyzed using the MLP and LSTM-transformer blocks, respectively. As we expected the LSTM model to help in modeling the relationship between individual time-series data such as HR, RR, and SpO<sub>2</sub>, by considering their temporal dependence. Furthermore, transformer models help elucidate complex patterns by analyzing the interactions between data at each time step (<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B22">22</xref>). Therefore, this combination of LSTM and transformer models to aid in the comprehensive analysis of complex patterns in time-series data, including various features such as HR, RR, and SpO<sub>2</sub>. Moreover, as the LSTM replaces the positional encoding of the transformer, the model did not compute all the time information; conversely, it only computed the new temporal information per time step, thus reducing the computation time (<xref ref-type="bibr" rid="B23">23</xref>). The feature vectors analyzed by the MLP and LSTM&#x02013;transformer blocks are concatenated and the probability of EI requirement is calculated in the ensemble block.</p>
<fig position="float" id="F4">
<label>Figure 4</label>
<caption><p>The model processes and integrates two types of data: numerical and time-series data. (1) Numerical data is processed through a Multi-Layer Perceptron (MLP) block to extract relevant features. (2) Time-series data is processed through a Long Short-Term Memory (LSTM)-Transformer block, where time-dependent features are extracted. The feature vectors from both branches are then passed through an Ensemble block, where they are concatenated to form the final model representation. This multimodal approach enables the model to effectively capture and integrate key information from both data types, enhancing overall predictive performance.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-13-1729990-g0004.tif">
<alt-text content-type="machine-generated">Diagram depicting a hybrid neural network architecture combining MLP and LSTM-Transformer blocks. The MLP block processes numeric data \(X_n\) with dropout, batch normalization, and dense layers. The LSTM-Transformer block handles time-series data \(X_t\) with pooling, transformer encoder, dropout, and LSTM layers. The Ensemble Block concatenates outputs from both, applying additional dense and dropout layers. A sigmoid dense layer generates the final output \(Y\). An inset details the LSTM process, showing gates and outputs.</alt-text>
</graphic>
</fig>
<sec>
<label>2.2.1</label>
<title>MLP block</title>
<p>The MLP block processes numerical data <italic>X</italic><sub>n</sub>, including initial clinical variables. It consists of two dense layers with 25 and 50 units, respectively, rectified linear unit (ReLU) activation, and dropout layers, which output feature vectors.</p>
</sec>
<sec>
<label>2.2.2</label>
<title>LSTM-transformer block</title>
<p>To analyze time-series data, this study employed a multimodal LSTM-Transformer model (<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B22">22</xref>), which integrates Long Short-Term Memory (LSTM) (<xref ref-type="bibr" rid="B24">24</xref>) and transformer (<xref ref-type="bibr" rid="B25">25</xref>) architectures. Although each input sequence covers only a 3-h window, the model was designed to capture micro-dynamics and multi-signal dependencies (e.g., HR&#x02013;SpO<sub>2</sub> coupling) that simple LSTM networks may fail to express effectively. This design enables the model to attend to subtle temporal interactions and inter-feature correlations that can precede rapid physiological deterioration. The LSTM-Transformer block processes time-series data, denoted as <italic>X</italic><sub>t</sub> &#x0003D; (<italic>X</italic><sub>1</sub>, <italic>X</italic><sub>2</sub>, <italic>X</italic><sub>3</sub>), which includes vital signs represented as three sequential features. The LSTM captures short-term temporal dependencies, while the Transformer attends to inter-signal correlations among HR, RR, and SpO<sub>2</sub>. The time-series data <italic>X</italic><sub>t</sub> includes a 3 h time window with three vital signs: heart rate (HR), respiratory rate (RR), and SpO<sub>2</sub>. These features are passed through the LSTM, generating a three-dimensional output with 25 hidden units, which is subsequently fed into the transformer component.</p>
<p>In this architecture, the LSTM replaces positional encoding in the transformer model (<xref ref-type="bibr" rid="B25">25</xref>). Since the transformer decoder is primarily designed for generative tasks such as machine translation, only the encoder is utilized in this model. The transformer encoder consists of two key components. First, Multi-head attention, which captures diverse dependencies within the input sequence. Second, a feedforward neural network (FFN), responsible for extracting features and recognizing patterns. The multi-head attention mechanism operates in parallel across eight attention heads, enabling the model to learn intricate relationships within the time-series data. The FFN includes layer normalization (computed using the mean and variance of input features), a dense layer with 50 units, GELU activation, and dropout, introducing non-linearity and improving the model&#x00027;s ability to learn complex representations. Finally, the sequence and embedding of time-series variables <italic>X</italic><sub>t</sub> processed by the transformer encoder are integrated into a unified output, effectively capturing both short-term and long-term dependencies in the time-series data.</p>
</sec>
<sec>
<label>2.2.3</label>
<title>Ensemble block</title>
<p>The output feature vectors, having the same shape, from both the MLP and LSTM-Transformer blocks are concatenated to form a unified output vector, which is then used to compute the probability of requiring EI in the ensemble block. The ensemble block consists of two dense layers with 90 and 30 units, respectively, ReLU activation, and two dropout layers. Finally, the output. Finally, the output Y from the ensemble block is passed through a dense layer followed by a sigmoid activation function, generating the probability of requiring EI as a value ranging from 0 to 1.</p>
</sec>
</sec>
<sec>
<label>2.3</label>
<title>Model training and implementation details</title>
<p>For model optimization, the Adam optimizer was employed with &#x003B2;<sub>1</sub>= 0.9 and &#x003B2;<sub>2</sub>= 0.999 and an exponential learning rate decay was applied over 100 steps. The initial learning rate and decay rate were set to 5 &#x000D7; 10<sup>&#x02212;5</sup> and 0.96, respectively. The model was trained for 2,000 epochs with a batch size of 1,024. During training, model checkpoints were saved based on the configuration that achieved the highest F1-score. To mitigate the effect of class imbalance, a weighted binary cross-entropy loss function was applied, assigning a weight of 3 to the intubated (EI) class and 1 to the non-EI class to penalize misclassification of the minority class. The proposed model was implemented using TensorFlow 2.4.1 with Python 3.8 and trained on an NVIDIA RTX 3090 GPU (CUDA v.11.0) with an Intel<sup>&#x000AE;</sup> Core i7-12700 CPU.</p>
</sec>
<sec>
<label>2.4</label>
<title>Performance evaluation</title>
<p>We employed 4-fold cross-validation to improve the model&#x00027;s generalization ability and mitigate overfitting.To quantitatively assess the performance of the trained model in each fold, we evaluated accuracy, sensitivity, specificity, the receiver operating characteristic (ROC) curve, and the area under the ROC curve (AUROC). The ROC curve represents the relationship between 1-specificity (false positive rate) and sensitivity (true positive rate). The evaluation metrics were calculated using the following equation.</p>
<disp-formula id="EQ2"><mml:math id="M2"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mtext>Accuracy</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mtext>TP&#x000A0;</mml:mtext><mml:mo>&#x0002B;</mml:mo><mml:mtext>&#x000A0;TN</mml:mtext></mml:mrow><mml:mrow><mml:mtext>TP&#x000A0;</mml:mtext><mml:mo>&#x0002B;</mml:mo><mml:mtext>&#x000A0;TN&#x000A0;</mml:mtext><mml:mo>&#x0002B;</mml:mo><mml:mtext>&#x000A0;FP&#x000A0;</mml:mtext><mml:mo>&#x0002B;</mml:mo><mml:mtext>&#x000A0;FN</mml:mtext></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(2)</label></disp-formula>
<disp-formula id="EQ3"><mml:math id="M3"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mtext>Sensitivity</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mtext>TP</mml:mtext></mml:mrow><mml:mrow><mml:mtext>TP&#x000A0;</mml:mtext><mml:mo>&#x0002B;</mml:mo><mml:mtext>&#x000A0;FN</mml:mtext></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(3)</label></disp-formula>
<disp-formula id="EQ4"><mml:math id="M4"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mtext>Specificity</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mtext>TN</mml:mtext></mml:mrow><mml:mrow><mml:mtext>TN&#x000A0;</mml:mtext><mml:mo>&#x0002B;</mml:mo><mml:mtext>&#x000A0;FP</mml:mtext></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(4)</label></disp-formula>
<p>Each of the four trained models utilized the Youden index (J) to determine the optimal threshold for its respective fold, balancing both sensitivity and specificity. Sensitivity and specificity were computed for each threshold and plotted on the receiver operating characteristic (ROC) curve. The threshold that maximized the J value, derived from the sensitivity and specificity at each threshold, was selected as the optimal threshold. J is calculated as follows:</p>
<disp-formula id="EQ5"><mml:math id="M5"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mtext class="textrm" mathvariant="normal">J</mml:mtext><mml:mo>=</mml:mo><mml:mtext>Sensitivity&#x000A0;</mml:mtext><mml:mo>&#x0002B;</mml:mo><mml:mtext>&#x000A0;Specificity</mml:mtext><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mtd></mml:mtr></mml:mtable></mml:math><label>(5)</label></disp-formula>
</sec>
</sec>
<sec id="s3">
<label>3</label>
<title>Result and discussion</title>
<p>The proposed model was compared with other models used in recent EI applied prediction studies [random forest (<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B10">10</xref>), logistic regression (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B10">10</xref>), and MLP (<xref ref-type="bibr" rid="B7">7</xref>)], other machine learning (ML) models (light gradient boosted machine (LightGBM)), and multimodal models similar to the proposed model [MLP-LSTM (<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B19">19</xref>) and MLP-transformer (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B20">20</xref>)]. ML models (Random Forest, Logistic Regression, and LightGBM) were implemented using the scikit-learn library and optimized via grid search. The grid search included tuning hyperparameters such as the number of estimators for Random Forest, the regularization strength for Logistic Regression, and the learning rate and number of leaves for LightGBM. Deep learning models (MLP, MLP-LSTM, and MLP&#x02013;transformer) were trained on numeric and time-series data and optimized via randomized search. The performances of each model are summarized in <xref ref-type="table" rid="T2">Table 2</xref>. As shown in <xref ref-type="table" rid="T2">Table 2</xref> and <xref ref-type="fig" rid="F5">Figure 5a</xref>, the proposed model achieved the following performances in the four averaged metrics: accuracy = 0.9579 &#x000B1; 0.02, sensitivity = 0.8472 &#x000B1; 0.08; specificity = 0.9591 &#x000B1; 0.02; AUROC = 0.9323 &#x000B1; 0.03. The proposed model showed the best performance in all evaluation metrics as compared to those of previous studies (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B10">10</xref>) and ML models. Furthermore, when comparing the evaluation metrics of the proposed model with other models based on multimodal architecture (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B18">18</xref>&#x02013;<xref ref-type="bibr" rid="B20">20</xref>), the proposed model demonstrates the best results in terms of accuracy, specificity, and AUROC, as well as the second-best performance in sensitivity. The MLP-LSTM model performed second best, with a difference of within 2% for each performance metric compared to the proposed model. Most models showed low performance in sensitivity and were weak at predicting positive cases.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Performance of the proposed model, machine learning (ML) models, and deep learning (DL) models on internal and external validation datasets.</p></caption>
<table frame="box" rules="all">
<thead>
<tr>
<th valign="top" align="left" colspan="2"><bold>Model</bold></th>
<th valign="top" align="center"><bold>Accuracy</bold></th>
<th valign="top" align="center"><bold>Sensitivity</bold></th>
<th valign="top" align="center"><bold>Specificity</bold></th>
<th valign="top" align="center"><bold>AUROC</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" rowspan="7">Internal validation</td>
<td valign="top" align="left">Random forest</td>
<td valign="top" align="center">0.9386 &#x000B1; 0.02</td>
<td valign="top" align="center">0.6535 &#x000B1; 0.04</td>
<td valign="top" align="center">0.9420 &#x000B1; 0.02</td>
<td valign="top" align="center">0.9113 &#x000B1; 0.01</td>
</tr>
<tr>
<td valign="top" align="left">Logistic regression</td>
<td valign="top" align="center">0.8940 &#x000B1; 0.01</td>
<td valign="top" align="center">0.6930 &#x000B1; 0.10</td>
<td valign="top" align="center">0.8964 &#x000B1; 0.01</td>
<td valign="top" align="center">0.8854 &#x000B1; 0.01</td>
</tr>
<tr>
<td valign="top" align="left">LightGBM</td>
<td valign="top" align="center">0.9091 &#x000B1; 0.02</td>
<td valign="top" align="center">0.6711 &#x000B1; 0.21</td>
<td valign="top" align="center">0.9119 &#x000B1; 0.02</td>
<td valign="top" align="center">0.8881 &#x000B1; 0.04</td>
</tr>
<tr>
<td valign="top" align="left">MLP</td>
<td valign="top" align="center">0.8572 &#x000B1; 0.07</td>
<td valign="top" align="center">0.8426 &#x000B1; 0.10</td>
<td valign="top" align="center">0.8574 &#x000B1; 0.07</td>
<td valign="top" align="center">0.9120 &#x000B1; 0.04</td>
</tr>
<tr>
<td valign="top" align="left">MLP-LSTM</td>
<td valign="top" align="center"><underline>0.9417 &#x000B1; 0.04</underline></td>
<td valign="top" align="center"><bold>0.8565</bold> <bold>&#x000B1;</bold> <bold>0.08</bold></td>
<td valign="top" align="center"><underline>0.9427 &#x000B1; 0.04</underline></td>
<td valign="top" align="center"><underline>0.9282 &#x000B1; 0.03</underline></td>
</tr>
<tr>
<td valign="top" align="left">MLP-transformer</td>
<td valign="top" align="center">0.9313 &#x000B1; 0.03</td>
<td valign="top" align="center">0.8426 &#x000B1; 0.08</td>
<td valign="top" align="center">0.9323 &#x000B1; 0.03</td>
<td valign="top" align="center">0.9211 &#x000B1; 0.02</td>
</tr>
<tr>
<td valign="top" align="left">Proposed model</td>
<td valign="top" align="center"><bold>0.9579</bold> <bold>&#x000B1;</bold> <bold>0.02</bold></td>
<td valign="top" align="center"><underline>0.8472 &#x000B1; 0.08</underline></td>
<td valign="top" align="center"><bold>0.9591</bold> <bold>&#x000B1;</bold> <bold>0.02</bold></td>
<td valign="top" align="center"><bold>0.9323</bold> <bold>&#x000B1;</bold> <bold>0.03</bold></td>
</tr>
<tr>
<td valign="top" align="left" rowspan="7">External validation</td>
<td valign="top" align="left">Random forest</td>
<td valign="top" align="center">0.7472 &#x000B1; 0.07</td>
<td valign="top" align="center">0.6196 &#x000B1; 0.04</td>
<td valign="top" align="center">0.7474 &#x000B1; 0.07</td>
<td valign="top" align="center">0.7483 &#x000B1; 0.04</td>
</tr>
<tr>
<td valign="top" align="left">Logistic regression</td>
<td valign="top" align="center">0.5160 &#x000B1; 0.14</td>
<td valign="top" align="center"><bold>0.8913</bold> <bold>&#x000B1;</bold> <bold>0.08</bold></td>
<td valign="top" align="center">0.5153 &#x000B1; 0.14</td>
<td valign="top" align="center">0.8091 &#x000B1; 0.00</td>
</tr>
<tr>
<td valign="top" align="left">LightGBM</td>
<td valign="top" align="center">0.4314 &#x000B1; 0.21</td>
<td valign="top" align="center"><underline>0.7283 &#x000B1; 0.22</underline></td>
<td valign="top" align="center">0.4308 &#x000B1; 0.21</td>
<td valign="top" align="center">0.6295 &#x000B1; 0.08</td>
</tr>
<tr>
<td valign="top" align="left">MLP</td>
<td valign="top" align="center">0.8066 &#x000B1; 0.09</td>
<td valign="top" align="center">0.6196 &#x000B1; 0.03</td>
<td valign="top" align="center">0.8070 &#x000B1; 0.09</td>
<td valign="top" align="center">0.7967 &#x000B1; 0.05</td>
</tr>
<tr>
<td valign="top" align="left">MLP-LSTM</td>
<td valign="top" align="center">0.9220 &#x000B1; 0.06</td>
<td valign="top" align="center">0.5761 &#x000B1; 0.26</td>
<td valign="top" align="center">0.9227 &#x000B1; 0.06</td>
<td valign="top" align="center"><underline>0.8813 &#x000B1; 0.03</underline></td>
</tr>
<tr>
<td valign="top" align="left">MLP-transformer</td>
<td valign="top" align="center"><underline>0.9283 &#x000B1; 0.04</underline></td>
<td valign="top" align="center">0.4674 &#x000B1; 0.05</td>
<td valign="top" align="center"><underline>0.9292 &#x000B1; 0.04</underline></td>
<td valign="top" align="center">0.7784 &#x000B1; 0.04</td>
</tr>
<tr>
<td valign="top" align="left">Proposed model</td>
<td valign="top" align="center"><bold>0.9411</bold> <bold>&#x000B1;</bold> <bold>0.01</bold></td>
<td valign="top" align="center">0.6739 &#x000B1; 0.08</td>
<td valign="top" align="center"><bold>0.9416</bold> <bold>&#x000B1;</bold> <bold>0.01</bold></td>
<td valign="top" align="center"><bold>0.9336</bold> <bold>&#x000B1;</bold> <bold>0.02</bold></td>
</tr></tbody>
</table>
<table-wrap-foot>
<p>The best and second-best performances are denoted by bold and underlined, respectively.</p>
</table-wrap-foot>
</table-wrap>
<fig position="float" id="F5">
<label>Figure 5</label>
<caption><p>Confusion matrices and receiver operating characteristic (ROC) curves of the EI prediction model, calculated through four-fold cross-validation. <bold>(a, b)</bold> depict the results for each fold using the test sets from the interval and external datasets, respectively. <bold>(a)</bold> Internal validation. <bold>(b)</bold> External validation.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-13-1729990-g0005.tif">
<alt-text content-type="machine-generated">Two panels labeled &#x0201C;a&#x0201D; and &#x0201C;b&#x0201D; present performance across four cross-validation folds (Fold 1&#x02013;4), each showing a confusion matrix and the corresponding ROC curve. Panel &#x0201C;a&#x0201D; shows the internal validation results, and panel &#x0201C;b&#x0201D; shows the external validation results. For each fold, the confusion matrix summarizes predicted versus true labels, and the ROC curve plots sensitivity versus 1&#x02013;specificity. The small &#x0201C;Val/Train&#x0201D; boxes at the top of each fold indicate which subset is used for validation and which subsets are used for training in the 4-fold split.</alt-text>
</graphic>
</fig>
<p>To validate the generalization of the proposed model, external validation was performed using datasets collected from other institutions. The results were summarized using a confusion matrix and ROC curve as shown in <xref ref-type="fig" rid="F5">Figure 5b</xref>. We compared the external validation results of the proposed model with those of other models, and the results of the evaluation metrics are listed in <xref ref-type="table" rid="T2">Table 2</xref>, while comparative results of the ROC curve are shown in <xref ref-type="fig" rid="F6">Figure 6b</xref>. As listed in <xref ref-type="table" rid="T2">Table 2</xref>, the proposed model achieved the following performances in the four average metrics on the external dataset: accuracy = 0.9411 &#x000B1; 0.01; sensitivity = 0.6739 &#x000B1; 0.08; specificity = 0.9416 &#x000B1; 0.01; AUROC = 0.9336 &#x000B1; 0.02. The proposed model demonstrated good performance in accuracy, specificity and AUROC when compared with previous studies (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B10">10</xref>) and ML models in external validation. Logistic regression and LightGBM showed sensitivity 0.8913 &#x000B1; 0.08 and 0.7283 &#x000B1; 0.22, respectively, in the external validation results. However, they exhibited a bias toward positive cases predictions attributed to their low accuracy and specificity. The proposed model achieved the third-highest sensitivity, and excluding the two models that exhibited a bias toward positive case predictions, it showed the highest sensitivity among the remaining models. Moreover, we compared the evaluation metrics of the proposed model with other multimodal-based models (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B18">18</xref>&#x02013;<xref ref-type="bibr" rid="B20">20</xref>) and found that it performs well on all evaluation metrics. Deep learning-based models (MLP, MLP-LSTM, MLP-transformer, and proposed model) demonstrated good performance in accuracy, specificity, and AUROC, but exhibited relatively low values in sensitivity.</p>
<fig position="float" id="F6">
<label>Figure 6</label>
<caption><p>Average receiver operating characteristic (ROC) curves of the proposed and comparative models obtained through four-fold cross-validation. <bold>(a)</bold> ROC curves for the internal validation datasets. <bold>(b)</bold> ROC curves for the external validation datasets.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-13-1729990-g0006.tif">
<alt-text content-type="machine-generated">Two ROC curve charts labeled &#x0201C;a&#x0201D; and &#x0201C;b&#x0201D; compare the performance of multiple models. Chart &#x0201C;a&#x0201D; shows ROC curves for internal validation, including logistic regression, LightGBM, random forest, MLP, MLP-transformer, MLP-LSTM, and the proposed model, with AUROC values ranging from 0.8854 to 0.9323. Chart &#x0201C;b&#x0201D; shows ROC curves for external validation with the same models, with AUROC values ranging from 0.6295 to 0.9336. The proposed model has the highest AUROC in both charts. Each curve plots sensitivity versus 1&#x02013;specificity.</alt-text>
</graphic>
</fig>
<p><xref ref-type="fig" rid="F6">Figure 6</xref> shows the ROC curves comparing the proposed model with other baseline models. The proposed model showed superior AUC and ROC curve performance in both internal and external validation. Furthermore, in <xref ref-type="fig" rid="F7">Figure 7</xref>, to compare the classification results between the proposed model and the baseline models, we performed a non-parametric permutation test of the ROC curves (<xref ref-type="bibr" rid="B26">26</xref>). In internal validation(in <xref ref-type="fig" rid="F7">Figure 7a</xref>), all models achieved similar AUROC values (0.91&#x02014;0.93) with no statistically significant difference (<italic>p</italic>-value&#x0003E;0.05). This suggests that most models could effectively learn the underlying patterns within the same institutional dataset. In contrast, in the external validation(in <xref ref-type="fig" rid="F7">Figure 7b</xref>) using data from a different institution, the proposed model demonstrated a statistically significant improvement (<italic>p</italic>-value &#x0003C; 0.05) compared to other baselines. Despite differences in data distribution and measurement frequency, the model maintained high AUROC (0.93) and accuracy (0.94), indicating strong generalization performance under domain shift conditions. This robustness suggests the model&#x00027;s potential for multi-institutional deployment. This finding implies that the hybrid LSTM&#x02013;Transformer architecture effectively captured robust temporal dependencies and cross-feature interactions, which conventional models such as random forest or MLP-based approaches failed to generalize.</p>
<fig position="float" id="F7">
<label>Figure 7</label>
<caption><p>Results of the non-parametric permutation test comparing the ROC curves of the proposed model and the comparison models: <bold>(a)</bold> AUC in internal validation datasets; <bold>(b)</bold> AUC in external validation datasets.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-13-1729990-g0007.tif">
<alt-text content-type="machine-generated">Two sets of ROC curve graphs compare the proposed model with six algorithms (Random Forest, Logistic Regression, LightGBM, MLP, MLP-LSTM, and MLP-Transformer). Set &#x0201C;a&#x0201D; shows internal validation results, and set &#x0201C;b&#x0201D; shows external validation results. Each set contains six pairwise comparisons between the proposed model and one comparison model, with AUROC values for the proposed model around 0.9323 in set &#x0201C;a&#x0201D; and around 0.9336 in set &#x0201C;b&#x0201D;. P-values from a non-parametric permutation test are reported to assess whether differences between ROC curves are statistically significant. Each graph plots sensitivity versus 1&#x02013;specificity.</alt-text>
</graphic>
</fig>
<p>However, as shown in <xref ref-type="table" rid="T2">Table 2</xref> and <xref ref-type="fig" rid="F6">Figure 6</xref>, the model performance was lower in the external validation (sensitivity = 0.8472) as compared to that in the internal validation (sensitivity = 0.6739). This was because of two issues with the dataset collected for external validation. First, the external institution that collected the dataset used for external validation had a high number of missing positive cases owing to the institutional tendency of not recording vital sign data on an immediately before applying EI to a patient. This resulted in a significantly unbalanced dataset between positive and negative data (positive cases: 14, negative cases: 165). This can be addressed by focusing on collecting more positive cases during future data collection. Second, the datasets we collected had many missing RRs: the training dataset was collected at hourly intervals, while the external institution dataset was collected at irregular time intervals. Moreover, both internal and external validation results indicate that sensitivity showed lower performance compared to accuracy, specificity, and AUROC. This is the result of a trade-off between sensitivity and specificity, which can be resolved by adjusting the numbers.</p>
<p>In this study, the proposed model offers predictions of intubation probabilities using multimodal information including 3 h of vital signs and initial clinical variables. To develop and evaluate this model, we established a dataset including information on 432 neonatal patients and evaluated a multimodal model that could classify neonates requiring intubation 3 h in advance. The model used for validation was validated using fold 4, which showed the best performance metrics among the four trained folds. The AI model recommended EI if the probability exceeded 78.1% (optimal threshold of fold 4); otherwise, it did not recommend EI. In <xref ref-type="fig" rid="F8">Figures 8</xref>, <xref ref-type="fig" rid="F9">9</xref>, the process of determining the probability of predicting EI, alongside the vital signs (HR, RR, and SpO<sub>2</sub>) over time, is depicted based on the data of six random patients using the proposed model is shown. <xref ref-type="fig" rid="F8">Figure 8</xref> illustrate the intubation cases where EI was applied either 3, 5, or 6 h after admission, respectively. <xref ref-type="fig" rid="F9">Figure 9</xref> show the non-intubation case. <xref ref-type="fig" rid="F8">Figure 8a</xref> shows that from 0 to 3 h after admission, HR increased by approximately 7.64%, RR decreased by approximately 15.79%, and SpO<sub>2</sub> showed minimal change in value. The probability of EI occurring during this period varied from 78% to 97%. As evident from <xref ref-type="fig" rid="F8">Figure 8b</xref>, the RR decreased sharply to 51.6% between the 2 and 3 h time of admission, and the change gradually stabilized from 3 to 5 h; therefore, the probability of applying EI went down reduced by approximately 5.5%. Furthermore, during at 2&#x02013;3 h after admission, the RRs was 80 and 74 breaths per min, respectively, which were out of the normal range (normal range of RR: 30&#x02013;60 breaths per min). In <xref ref-type="fig" rid="F8">Figure 8c</xref>, HR decreased by 12.8% between 4 and 6 h to 109&#x02013;110 beats per min, which was above the normal range (normal range of HR: 120&#x02013;160 beats per min). From 4&#x02013;6 h, the HR remained low, and the probability of EI increased from 63.2% to 98.6%. <xref ref-type="fig" rid="F9">Figure 9</xref> show that the HR and RR values often appeared to deviate from the normal range. Furthermore, the vital signs changed rapidly and the probability of applying EI increased or decreased. However, we confirmed that the predictive probability of intubation was stable. This appears to reflect the analysis results of numeric data because our model integrates numeric and time-series data. <xref ref-type="fig" rid="F8">Figures 8</xref>, <xref ref-type="fig" rid="F9">9</xref> were designed not only to visualize prediction dynamics but also to provide case-based interpretability, showing that the predicted EI probability follows clinically plausible vital sign trajectories.</p>
<fig position="float" id="F8">
<label>Figure 8</label>
<caption><p>Real-time prediction for intubated patients using the best-performing fold 4 model. Graphs <bold>(a&#x02013;c)</bold> illustrate the time-series data (left) and predicted intubation probability (right) for patients who were intubated after 3, 5, and 6 h, respectively. The predicted probabilities are classified according to the optimal threshold (horizontal dotted lines). <bold>(a)</bold> Patient case intubated after 3 h. <bold>(b)</bold> Patient case intubated after 5 h. <bold>(c)</bold> Patient case intubated after 6 h.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-13-1729990-g0008.tif">
<alt-text content-type="machine-generated">Three sets of charts display measurements over six hours. In each, the left chart shows SpO2, HR, and RR levels, while the right highlights the probability of endotracheal intubation. In chart a, SpO2 declines while HR and RR are stable. In chart b, SpO2 decreases, HR slightly increases, and RR declines. In chart c, SpO2, HR, and RR remain steady. The second chart in each pair indicates a suggested intubation time, highlighted with an upward red arrow. The background colors in both chart types denote different time intervals.</alt-text>
</graphic>
</fig>
<fig position="float" id="F9">
<label>Figure 9</label>
<caption><p>Real-time prediction for non-intubated patients using the best-performing fold 4 model. Graphs <bold>(a&#x02013;c)</bold> illustrate the time-series data (left) and predicted probability (right) for patients without intubation. The model consistently predicted below the optimal threshold (horizontal dotted lines), confirming the non-intubation outcome. <bold>(a)</bold> Patient case without intubation 1. <bold>(b)</bold> Patient case without intubation 2. <bold>(c)</bold> Patient case without intubation 3.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-13-1729990-g0009.tif">
<alt-text content-type="machine-generated">Three sets of graphs labeled a, b, and c show time-based charts comparing SpO2, HR, and RR with corresponding probabilities. Graphs on the left depict SpO2 (%), HR, or RR against time (hours). Graphs on the right display probability distributions over time with a red dashed line marking 0.781 probability(optimal threshold). Notably, graph a indicates &#x0201C;Not Recommended for Endotracheal Intubation&#x0201D; near hour 5, with a downward arrow.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s4">
<label>4</label>
<title>Limitations</title>
<p>The proposed model has three primary limitations in analyzing time-series data.</p>
<p>First, it exhibits bias when predicting short sequences. The model processes sequences up to 3 h in 1-h increments. Among the positive cases collected, 31.6% (31/98) underwent EI within 2 h of NICU admission. Consequently, 31.3% of patients had missing data due to backfilling, which may have introduced bias in the analysis. Therefore, further research is needed to develop a model specifically designed to analyze short-sequence vital signs data and integrate it into the existing framework. Accordingly, predictions generated immediately after NICU admission, when substantial backfilling may be required, should be interpreted with caution.</p>
<p>Second, the proposed model heavily relies on time-series data. The dataset was augmented in 1-h intervals, and the last 3 h of data were extracted. While the proposed model utilizes separate encoders for static and time-series inputs, the window-based augmentation replicates static variables across multiple time steps, which may increase the model&#x00027;s reliance on time-series patterns. Future work will explore fusion strategies (e.g., modality gating or modality-specific regularization) to better balance contributions from static and temporal features.</p>
<p>Third, to preserve the intrinsic temporal dependencies and physiological consistency of the time-series data, no synthetic oversampling techniques (e.g., SMOTE) were applied, even though there was a notable class imbalance between the intubated (positive) and non-intubated (negative) groups. Instead, the imbalance was indirectly compensated by applying a weighted binary cross-entropy loss during model training, which penalized misclassification of the minority (intubated) class more heavily. In addition, while we report performance using an optimal threshold determined by the Youden index, the operating threshold can be calibrated to prioritize sensitivity for early warning applications depending on institutional clinical priorities. Regarding external validation, the reduced sensitivity observed in external validation may reflect a limited number of positive cases and outcome-dependent missingness (e.g., incomplete near-event vital-sign capture) as well as irregular charting intervals (particularly for RR) at the external site. Future external validation should adopt prospective multi-center protocols that ensure comprehensive vital-sign recording immediately preceding EI and investigate approaches robust to irregular sampling (e.g., time-aware model inputs and enhanced interpolation methods).</p>
</sec>
<sec sec-type="conclusions" id="s5">
<label>5</label>
<title>Conclusion</title>
<p>We developed a real-time prediction system utilizing a multimodal model to predict neonatal EI 3 h in advance. The proposed model outperformed previously developed models, achieving the following results: accuracy = 0.9579 &#x000B1; 0.02, sensitivity = 0.8472 &#x000B1; 0.08, specificity = 0.9591 &#x000B1; 0.01, and AUROC = 0.9323 &#x000B1; 0.03. The proposed model also demonstrated superior performance in external validation using datasets collected from an independent institution, achieving: accuracy = 0.9411 &#x000B1; 0.01, sensitivity = 0.6739 &#x000B1; 0.08, specificity = 0.9416 &#x000B1; 0.01, and AUROC = 0.9336 &#x000B1; 0.02. Moreover, the model was designed to reflect real-world clinical applications by incorporating three prediction windows: hourly intervals, within 3 h, and up to 72 h after admission. We anticipate that the proposed model will contribute to the early prevention of respiratory distress by enabling timely EI predictions in neonates. Given its generalizability and effectiveness, the model holds significant potential for clinical implementation. In future clinical implementation, the model could be integrated into real-time NICU monitoring systems to provide early warnings to physicians when the predicted probability of EI exceeds the predefined threshold. This could allow pre-intubation preparation, reduce procedure-related complications, and improve neonatal outcomes.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The datasets generated and/or analyzed during the current study are available from the corresponding author on reasonable request, subject to institutional approvals and data-sharing agreements.</p>
</sec>
<sec sec-type="ethics-statement" id="s7">
<title>Ethics statement</title>
<p>Written informed consent was not obtained from the individual(s) for the publication of any potentially identifiable images or data included in this article because the review board waived the requirement for informed consent, owing to the retrospective design of this study.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>JP: Conceptualization, Methodology, Writing &#x02013; original draft. MY: Investigation, Methodology, Writing &#x02013; review &#x00026; editing. KK: Data curation, Formal analysis, Visualization, Writing &#x02013; original draft. G-HK: Methodology, Software, Validation, Writing &#x02013; review &#x00026; editing. SP: Conceptualization, Project administration, Supervision, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>JP, MY, and SP were employed by Development, Mediv Corp.</p>
<p>The remaining author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s10">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tobin</surname> <given-names>MJ</given-names></name></person-group>. <article-title>Basing respiratory management of COVID-19 on physiological principles</article-title>. <source>Am Thorac Soc</source>. (<year>2020</year>) <volume>201</volume>:<fpage>1319</fpage>&#x02013;<lpage>20</lpage>. doi: <pub-id pub-id-type="doi">10.1164/rccm.202004-1076ED</pub-id><pub-id pub-id-type="pmid">32281885</pub-id></mixed-citation>
</ref>
<ref id="B2">
<label>2.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lundstr&#x000F8;m</surname> <given-names>L</given-names></name> <name><surname>Vester-Andersen</surname> <given-names>M</given-names></name> <name><surname>M&#x000F8;ller</surname> <given-names>A</given-names></name> <name><surname>Charuluxananan</surname> <given-names>S</given-names></name> <name><surname>L&#x00027;hermite</surname> <given-names>J</given-names></name> <name><surname>Wetterslev</surname> <given-names>J</given-names></name></person-group>. <article-title>Poor prognostic value of the modified Mallampati score: a meta-analysis involving 177 088 patients</article-title>. <source>Br J Anaesth</source>. (<year>2011</year>) <volume>107</volume>:<fpage>659</fpage>&#x02013;<lpage>67</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bja/aer292</pub-id><pub-id pub-id-type="pmid">21948956</pub-id></mixed-citation>
</ref>
<ref id="B3">
<label>3.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mallampati</surname> <given-names>SR</given-names></name> <name><surname>Gatt</surname> <given-names>SP</given-names></name> <name><surname>Gugino</surname> <given-names>LD</given-names></name> <name><surname>Desai</surname> <given-names>SP</given-names></name> <name><surname>Waraksa</surname> <given-names>B</given-names></name> <name><surname>Freiberger</surname> <given-names>D</given-names></name> <etal/></person-group>. <article-title>A clinical sign to predict difficult tracheal intubation; a prospective study</article-title>. <source>Can Anaesth Soc J</source>. (<year>1985</year>) <volume>32</volume>:<fpage>429</fpage>&#x02013;<lpage>34</lpage>. doi: <pub-id pub-id-type="doi">10.1007/BF03011357</pub-id><pub-id pub-id-type="pmid">4027773</pub-id></mixed-citation>
</ref>
<ref id="B4">
<label>4.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Esposito</surname> <given-names>TJ</given-names></name> <name><surname>Sanddal</surname> <given-names>ND</given-names></name> <name><surname>Hansen</surname> <given-names>JD</given-names></name> <name><surname>Reynolds</surname> <given-names>S</given-names></name></person-group>. <article-title>Analysis of preventable trauma deaths and inappropriate trauma care in a rural state</article-title>. <source>Jo Trauma Acute Care Surg</source>. (<year>1995</year>) <volume>39</volume>:<fpage>955</fpage>&#x02013;<lpage>62</lpage>. doi: <pub-id pub-id-type="doi">10.1097/00005373-199511000-00022</pub-id><pub-id pub-id-type="pmid">7474014</pub-id></mixed-citation>
</ref>
<ref id="B5">
<label>5.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Miraflor</surname> <given-names>E</given-names></name> <name><surname>Chuang</surname> <given-names>K</given-names></name> <name><surname>Miranda</surname> <given-names>MA</given-names></name> <name><surname>Dryden</surname> <given-names>W</given-names></name> <name><surname>Yeung</surname> <given-names>L</given-names></name> <name><surname>Strumwasser</surname> <given-names>A</given-names></name> <etal/></person-group>. <article-title>Timing is everything: delayed intubation is associated with increased mortality in initially stable trauma patients</article-title>. <source>J Surg Res</source>. (<year>2011</year>) <volume>170</volume>:<fpage>286</fpage>&#x02013;<lpage>90</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jss.2011.03.044</pub-id><pub-id pub-id-type="pmid">21550060</pub-id></mixed-citation>
</ref>
<ref id="B6">
<label>6.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Teixeira</surname> <given-names>PG</given-names></name> <name><surname>Inaba</surname> <given-names>K</given-names></name> <name><surname>Hadjizacharia</surname> <given-names>P</given-names></name> <name><surname>Brown</surname> <given-names>C</given-names></name> <name><surname>Salim</surname> <given-names>A</given-names></name> <name><surname>Rhee</surname> <given-names>P</given-names></name> <etal/></person-group>. <article-title>Preventable or potentially preventable mortality at a mature trauma center</article-title>. <source>J Trauma Acute Care Surg</source>. (<year>2007</year>) <volume>63</volume>:<fpage>1338</fpage>&#x02013;<lpage>47</lpage>. doi: <pub-id pub-id-type="doi">10.1097/TA.0b013e31815078ae</pub-id><pub-id pub-id-type="pmid">18212658</pub-id></mixed-citation>
</ref>
<ref id="B7">
<label>7.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nopour</surname> <given-names>R</given-names></name> <name><surname>Shanbehzadeh</surname> <given-names>M</given-names></name> <name><surname>Kazemi-Arpanahi</surname> <given-names>H</given-names></name></person-group>. <article-title>Predicting the need for intubation among COVID-19 patients using machine learning algorithms: a single-center study</article-title>. <source>Med J Islamic Republ Iran</source>. (<year>2022</year>) <volume>36</volume>:<fpage>30</fpage>. doi: <pub-id pub-id-type="doi">10.47176/mjiri.36.30</pub-id><pub-id pub-id-type="pmid">35999913</pub-id></mixed-citation>
</ref>
<ref id="B8">
<label>8.</label>
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>Z</given-names></name> <name><surname>Li</surname> <given-names>J</given-names></name> <name><surname>Zhao</surname> <given-names>Y</given-names></name></person-group>. <article-title>Prediction of airway management of trauma patients based on machine learning</article-title>. In: <source>LISS 2021: Proceedings of the 11th International Conference on Logistics, Informatics and Service Sciences</source>. <publisher-loc>Singapore</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2022</year>). p. <fpage>132</fpage>&#x02013;<lpage>41</lpage>. doi: <pub-id pub-id-type="doi">10.1007/978-981-16-8656-6_12</pub-id></mixed-citation>
</ref>
<ref id="B9">
<label>9.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Arvind</surname> <given-names>V</given-names></name> <name><surname>Kim</surname> <given-names>JS</given-names></name> <name><surname>Cho</surname> <given-names>BH</given-names></name> <name><surname>Geng</surname> <given-names>E</given-names></name> <name><surname>Cho</surname> <given-names>SK</given-names></name></person-group>. <article-title>Development of a machine learning algorithm to predict intubation among hospitalized patients with COVID-19</article-title>. <source>J Crit Care</source>. (<year>2021</year>) <volume>62</volume>:<fpage>25</fpage>&#x02013;<lpage>30</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jcrc.2020.10.033</pub-id><pub-id pub-id-type="pmid">33238219</pub-id></mixed-citation>
</ref>
<ref id="B10">
<label>10.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Siu</surname> <given-names>BMK</given-names></name> <name><surname>Kwak</surname> <given-names>GH</given-names></name> <name><surname>Ling</surname> <given-names>L</given-names></name> <name><surname>Hui</surname> <given-names>P</given-names></name></person-group>. <article-title>Predicting the need for intubation in the first 24 h after critical care admission using machine learning approaches</article-title>. <source>Sci Rep</source>. (<year>2020</year>) <volume>10</volume>:<fpage>20931</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-020-77893-3</pub-id></mixed-citation>
</ref>
<ref id="B11">
<label>11.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Im</surname> <given-names>JE</given-names></name> <name><surname>Park</surname> <given-names>S</given-names></name> <name><surname>Kim</surname> <given-names>YJ</given-names></name> <name><surname>Yoon</surname> <given-names>SA</given-names></name> <name><surname>Lee</surname> <given-names>JH</given-names></name></person-group>. <article-title>Predicting the need for intubation within 3 hours in the neonatal intensive care unit using a multimodal deep neural network</article-title>. <source>Sci Rep</source>. (<year>2022</year>) <volume>13</volume>:<fpage>6213</fpage>. doi: <pub-id pub-id-type="doi">10.21203/rs.3.rs-1872902/v1</pub-id></mixed-citation>
</ref>
<ref id="B12">
<label>12.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Im</surname> <given-names>JE</given-names></name> <name><surname>Yoon</surname> <given-names>SA</given-names></name> <name><surname>Shin</surname> <given-names>YM</given-names></name> <name><surname>Park</surname> <given-names>S</given-names></name></person-group>. <article-title>Real-time prediction for neonatal endotracheal intubation using multimodal transformer network</article-title>. <source>IEEE J Biomed Health Informat</source>. (<year>2023</year>) <volume>27</volume>:<fpage>2625</fpage>&#x02013;<lpage>34</lpage>. doi: <pub-id pub-id-type="doi">10.1109/JBHI.2023.3267521</pub-id><pub-id pub-id-type="pmid">37067962</pub-id></mixed-citation>
</ref>
<ref id="B13">
<label>13.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fleming</surname> <given-names>S</given-names></name> <name><surname>Thompson</surname> <given-names>M</given-names></name> <name><surname>Stevens</surname> <given-names>R</given-names></name> <name><surname>Heneghan</surname> <given-names>C</given-names></name></person-group>. <article-title>Pl&#x000FC;ddemann A, Maconochie I, et al. Normal ranges of heart rate and respiratory rate in children from birth to 18 years of age: a systematic review of observational studies</article-title>. <source>Lancet</source>. (<year>2011</year>) <volume>377</volume>:<fpage>1011</fpage>&#x02013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(10)62226-X</pub-id></mixed-citation>
</ref>
<ref id="B14">
<label>14.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>te Pas</surname> <given-names>AB</given-names></name> <name><surname>Wong</surname> <given-names>C</given-names></name> <name><surname>Kamlin</surname> <given-names>COF</given-names></name> <name><surname>Dawson</surname> <given-names>JA</given-names></name> <name><surname>Morley</surname> <given-names>CJ</given-names></name> <name><surname>Davis</surname> <given-names>PG</given-names></name></person-group>. <article-title>Breathing patterns in preterm and term infants immediately after birth</article-title>. <source>Pediatr Res</source>. (<year>2009</year>) <volume>65</volume>:<fpage>352</fpage>&#x02013;<lpage>6</lpage>. doi: <pub-id pub-id-type="doi">10.1203/PDR.0b013e318193f117</pub-id><pub-id pub-id-type="pmid">19391251</pub-id></mixed-citation>
</ref>
<ref id="B15">
<label>15.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bennett</surname> <given-names>DA</given-names></name></person-group>. <article-title>How can I deal with missing data in my study?</article-title> <source>Aust N Z J Public Health</source>. (<year>2001</year>) <volume>25</volume>:<fpage>464</fpage>&#x02013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1467-842X.2001.tb00294.x</pub-id><pub-id pub-id-type="pmid">11688629</pub-id></mixed-citation>
</ref>
<ref id="B16">
<label>16.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dong</surname> <given-names>Y</given-names></name> <name><surname>Peng</surname> <given-names>CYJ</given-names></name></person-group>. <article-title>Principled missing data methods for researchers</article-title>. <source>Springerplus</source>. (<year>2013</year>) <volume>2</volume>:<fpage>1</fpage>&#x02013;<lpage>17</lpage>. doi: <pub-id pub-id-type="doi">10.1186/2193-1801-2-222</pub-id><pub-id pub-id-type="pmid">23853744</pub-id></mixed-citation>
</ref>
<ref id="B17">
<label>17.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Network</surname> <given-names>TIN</given-names></name></person-group>. <article-title>The CRIB (clinical risk index for babies) score: a tool for assessing initial neonatal risk and comparing performance of neonatal intensive care units</article-title>. <source>Lancet</source>. (<year>1993</year>) <volume>342</volume>:<fpage>193</fpage>&#x02013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0140-6736(93)92296-6</pub-id></mixed-citation>
</ref>
<ref id="B18">
<label>18.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fan</surname> <given-names>Y</given-names></name> <name><surname>Xu</surname> <given-names>K</given-names></name> <name><surname>Wu</surname> <given-names>H</given-names></name> <name><surname>Zheng</surname> <given-names>Y</given-names></name> <name><surname>Tao</surname> <given-names>B</given-names></name></person-group>. <article-title>Spatiotemporal modeling for nonlinear distributed thermal processes based on KL decomposition, MLP and LSTM network</article-title>. <source>IEEE Access</source>. (<year>2020</year>) <volume>8</volume>:<fpage>25111</fpage>&#x02013;<lpage>21</lpage>. doi: <pub-id pub-id-type="doi">10.1109/ACCESS.2020.2970836</pub-id></mixed-citation>
</ref>
<ref id="B19">
<label>19.</label>
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>KH</given-names></name> <name><surname>Park</surname> <given-names>JC</given-names></name> <name><surname>Kim</surname> <given-names>GY</given-names></name> <name><surname>Maeng</surname> <given-names>JY</given-names></name> <name><surname>Sung</surname> <given-names>JB</given-names></name> <name><surname>Kim</surname> <given-names>JW</given-names></name></person-group>. <article-title>Predicting endotracheal intubation needs in neonatal intensive care unit: a multimodal approach</article-title>. In: <source>2024 International Technical Conference on Circuits/Systems, Computers, and Communications (ITC-CSCC)</source>. <publisher-loc>Piscataway, NJ</publisher-loc>: <publisher-name>IEEE</publisher-name> (<year>2024</year>). p. <fpage>1</fpage>&#x02013;<lpage>7</lpage>. doi: <pub-id pub-id-type="doi">10.1109/ITC-CSCC62988.2024.10628132</pub-id></mixed-citation>
</ref>
<ref id="B20">
<label>20.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>GH</given-names></name> <name><surname>Lee</surname> <given-names>DH</given-names></name> <name><surname>Choi</surname> <given-names>JW</given-names></name> <name><surname>Jeon</surname> <given-names>HJ</given-names></name> <name><surname>Park</surname> <given-names>S</given-names></name></person-group>. <article-title>Multimodal neural network for recurrence prediction of papillary thyroid carcinoma</article-title>. <source>Adv Intell Syst</source>. (<year>2023</year>) <volume>5</volume>:<fpage>2200365</fpage>. doi: <pub-id pub-id-type="doi">10.1002/aisy.202200365</pub-id></mixed-citation>
</ref>
<ref id="B21">
<label>21.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Andayani</surname> <given-names>F</given-names></name> <name><surname>Theng</surname> <given-names>LB</given-names></name> <name><surname>Tsun</surname> <given-names>MT</given-names></name> <name><surname>Chua</surname> <given-names>C</given-names></name></person-group>. <article-title>Hybrid LSTM-transformer model for emotion recognition from speech audio files</article-title>. <source>IEEE Access</source>. (<year>2022</year>) <volume>10</volume>:<fpage>36018</fpage>&#x02013;<lpage>27</lpage>. doi: <pub-id pub-id-type="doi">10.1109/ACCESS.2022.3163856</pub-id></mixed-citation>
</ref>
<ref id="B22">
<label>22.</label>
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Andayani</surname> <given-names>F</given-names></name></person-group>. <source>Investigating the Impacts of LSTM-Transformer on Classification Performance of Speech Emotion Recognition.</source> <publisher-loc>Swinburne</publisher-loc> (<year>2022</year>).</mixed-citation>
</ref>
<ref id="B23">
<label>23.</label>
<mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Sakatani</surname> <given-names>Y</given-names></name></person-group>. <source>Combining RNN with Transformer for Modeling Multi-Leg Trips</source>. <publisher-loc>Aachen</publisher-loc>: <publisher-name>WebTour&#x00040; WSDM</publisher-name> (<year>2021</year>). p. <fpage>50</fpage>&#x02013;<lpage>2</lpage>.</mixed-citation>
</ref>
<ref id="B24">
<label>24.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kawakami</surname> <given-names>K</given-names></name></person-group>. <source>Supervised Sequence Labelling With Recurrent Neural Networks</source>. Technical University of Munich (<year>2008</year>).</mixed-citation>
</ref>
<ref id="B25">
<label>25.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vaswani</surname> <given-names>A</given-names></name> <name><surname>Shazeer</surname> <given-names>N</given-names></name> <name><surname>Parmar</surname> <given-names>N</given-names></name> <name><surname>Uszkoreit</surname> <given-names>J</given-names></name> <name><surname>Jones</surname> <given-names>L</given-names></name> <name><surname>Gomez</surname> <given-names>AN</given-names></name> <etal/></person-group>. <article-title>Attention is all you need</article-title>. <source>Adv Neural Inform Process Syst</source>. (<year>2017</year>) <volume>30</volume>:<fpage>5998</fpage>&#x02013;<lpage>6008</lpage>. doi: <pub-id pub-id-type="doi">10.5555/3295222.3295349</pub-id></mixed-citation>
</ref>
<ref id="B26">
<label>26.</label>
<mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Venkatraman</surname> <given-names>E</given-names></name></person-group>. <article-title>A permutation test to compare receiver operating characteristic curves</article-title>. <source>Biometrics</source>. (<year>2000</year>) <volume>56</volume>:<fpage>1134</fpage>&#x02013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.0006-341X.2000.01134.x</pub-id><pub-id pub-id-type="pmid">11129471</pub-id></mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/156001/overview">Antonio M. Esquinas</ext-link>, Hospital General Universitario Morales Meseguer, Spain</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/926538/overview">Daniel Ibarra-R&#x000ED;os</ext-link>, Federico G&#x000F3;mez Children&#x00027;s Hospital, Mexico</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1300308/overview">Susanne Tippmann</ext-link>, Johannes Gutenberg University Mainz, Germany</p>
</fn>
</fn-group>
</back>
</article>