<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article article-type="research-article" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Digit. Health</journal-id><journal-title-group>
<journal-title>Frontiers in Digital Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Digit. Health</abbrev-journal-title></journal-title-group>
<issn pub-type="epub">2673-253X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fdgth.2026.1755878</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Machine learning prediction of oxygen therapy in pediatric Mycoplasma pneumoniae pneumonia</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name><surname>Coppola</surname><given-names>Claudio</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref>
<xref ref-type="author-notes" rid="an1"><sup>&#x2020;</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/3250142/overview"/><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role></contrib>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name><surname>Andrew</surname><given-names>Judith Jeyafreeda</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref>
<xref ref-type="author-notes" rid="an1"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3250297/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role></contrib>
<contrib contrib-type="author"><name><surname>Ruggieri</surname><given-names>Martino</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/1154699/overview" /><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role></contrib>
<contrib contrib-type="author"><name><surname>La Spina</surname><given-names>Milena</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role></contrib>
<contrib contrib-type="author"><name><surname>La Bianca</surname><given-names>Maria Rosaria</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role></contrib>
<contrib contrib-type="author"><name><surname>Leonardi</surname><given-names>Salvatore</given-names></name>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role><role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role></contrib><on-behalf-of>the PneumoML Study Group</on-behalf-of>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Postgraduate Training Program in Pediatrics, University of Catania</institution>, <city>Catania</city>, <country country="it">Italy</country></aff>
<aff id="aff2"><label>2</label><institution>Unit of Pediatrics, Sant&#x0027;Antonio Abate Hospital</institution>, <city>Trapani</city>, <country country="it">Italy</country></aff>
<aff id="aff3"><label>3</label><institution>Clinical Bioinformatics Laboratory, INSERM UMR1163, Imagine Institute, Universit&#x00E9; Paris Cit&#x00E9;</institution>, <city>Paris</city>, <country country="fr">France</country></aff>
<aff id="aff4"><label>4</label><institution>PR[AI]RIE AI Institute</institution>, <city>Paris</city>, <country country="fr">France</country></aff>
<aff id="aff5"><label>5</label><institution>Unit of Pediatric Clinic, Department of Clinical and Experimental Medicine, University of Catania</institution>, <city>Catania</city>, <country country="it">Italy</country></aff>
<aff id="aff6"><label>6</label><institution>Unit of Pediatrics and Pediatric Emergency, San Marco Hospital</institution>, <city>Catania</city>, <country country="it">Italy</country></aff>
<aff id="aff7"><label>7</label><institution>Department of Clinical and Experimental Medicine, University of Catania</institution>, <city>Catania</city>, <country country="it">Italy</country></aff>
<author-notes>
<corresp id="cor1"><label>&#x002A;</label><bold>Correspondence:</bold> Claudio Coppola <email xlink:href="mailto:dott.claudiocoppola@gmail.com">dott.claudiocoppola@gmail.com</email> Judith Jeyafreeda Andrew <email xlink:href="mailto:judithjeyafreeda@gmail.com">judithjeyafreeda@gmail.com</email></corresp>
<fn fn-type="equal" id="an1"><label>&#x2020;</label><p>These authors have contributed equally to this work</p></fn>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-19"><day>19</day><month>02</month><year>2026</year></pub-date>
<pub-date publication-format="electronic" date-type="collection"><year>2026</year></pub-date>
<volume>8</volume><elocation-id>1755878</elocation-id>
<history>
<date date-type="received"><day>27</day><month>11</month><year>2025</year></date>
<date date-type="rev-recd"><day>25</day><month>12</month><year>2025</year></date>
<date date-type="accepted"><day>09</day><month>01</month><year>2026</year></date>
</history>
<permissions>
<copyright-statement>&#x00A9; 2026 Coppola, Andrew, Ruggieri, La Spina, La Bianca and Leonardi.</copyright-statement>
<copyright-year>2026</copyright-year><copyright-holder>Coppola, Andrew, Ruggieri, La Spina, La Bianca and Leonardi</copyright-holder><license><ali:license_ref start_date="2026-02-19">https://creativecommons.org/licenses/by/4.0/</ali:license_ref><license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p></license>
</permissions>
<abstract><sec><title>Background</title>
<p>Mycoplasma pneumoniae pneumonia represents a significant cause of community-acquired pneumonia in children, with clinical presentations ranging from mild to severe forms requiring respiratory support. Early identification of children at risk for oxygen therapy remains challenging using conventional clinical and laboratory parameters.</p>
</sec><sec><title>Methods</title>
<p>We conducted a multicenter retrospective study involving 206 pediatric patients (aged 1 month to 18 years) with confirmed Mycoplasma pneumoniae pneumonia admitted to three Italian hospitals between 2023 and 2025. Nine machine learning algorithms were developed and validated using routine admission data including demographics, clinical presentation, laboratory tests, and imaging findings. The primary outcome was the need for oxygen therapy during hospitalization. Model performance was evaluated using area under the curve (AUC), precision, recall, and F1-score metrics. Feature importance was assessed using SHAP (Shapley Additive Explanations) analysis.</p>
</sec><sec><title>Results</title>
<p>Among the 206 patients, 42 (20.4&#x0025;) required oxygen therapy during hospitalization. The cohort had a mean age of approximately 4.6 years (SD &#x2248; 3.5), with comorbidities present in approximately 40&#x0025; of cases. Support Vector Machine (SVM) achieved the highest performance with an AUC of 0.97, precision of 0.93, recall of 0.93, and F1-score of 0.92. Logistic Regression (AUC 0.95), XGBoost (AUC 0.94), and LightGBM (AUC 0.93) also demonstrated strong predictive performance. SHAP analysis consistently identified C-reactive protein (CRP), lactate dehydrogenase (LDH), neutrophil-to-lymphocyte ratio (NLR), neutrophil percentage, and respiratory distress as the most important predictive features across models.</p>
</sec><sec><title>Conclusion</title>
<p>Machine learning models using routine admission data can accurately predict oxygen therapy requirements in pediatric Mycoplasma pneumoniae pneumonia. The integration of interpretable artificial intelligence approaches may enable earlier risk stratification and improve clinical decision-making in pediatric respiratory infections.</p>
</sec>
</abstract>
<kwd-group>
<kwd>artificial intelligence</kwd>
<kwd>machine learning</kwd>
<kwd>Mycoplasma pneumoniae</kwd>
<kwd>oxygen therapy</kwd>
<kwd>pediatric pneumonia</kwd>
<kwd>predictive modeling</kwd>
<kwd>respiratory support</kwd>
<kwd>SHAP</kwd>
</kwd-group><funding-group><funding-statement>The author(s) declared that financial support was not received for this work and/or its publication.</funding-statement></funding-group><counts>
<fig-count count="4"/>
<table-count count="3"/><equation-count count="0"/><ref-count count="14"/><page-count count="19"/><word-count count="0"/></counts><custom-meta-group><custom-meta><meta-name>section-at-acceptance</meta-name><meta-value>Health Informatics</meta-value></custom-meta></custom-meta-group>
</article-meta>
</front>
<body><sec id="s1" sec-type="intro"><label>1</label><title>Introduction</title>
<p>Respiratory infections caused by Mycoplasma pneumoniae represent a significant cause of community-acquired pneumonia in children, accounting for up to 40&#x0025; of pneumonia cases in school-age children and adolescents. The clinical manifestations range from mild upper respiratory symptoms to complicated forms requiring intensive respiratory support and prolonged hospitalization. Recent epidemiological studies have documented increasing severity of Mycoplasma pneumoniae pneumonia presentations, particularly following the COVID-19 pandemic, creating substantial organizational challenges for pediatric healthcare systems worldwide.</p>
<p>The pathophysiology of Mycoplasma pneumoniae pneumonia involves both direct cellular damage and immune-mediated inflammatory responses. Unlike typical bacterial pneumonia, Mycoplasma pneumoniae lacks a cell wall, making it resistant to beta-lactam antibiotics and requiring specific antimicrobial therapy with macrolides, tetracyclines, or fluoroquinolones. The organism&#x0027;s unique characteristics contribute to its propensity for causing both pulmonary and extrapulmonary manifestations, the latter occurring in approximately 25&#x0025; of pediatric cases.</p>
<p>Early risk stratification at admission has become crucial for guiding decisions regarding monitoring intensity, imaging protocols, therapeutic interventions, and care escalation. Current diagnostic approaches rely primarily on microbiological and serological methods, with molecular polymerase chain reaction (PCR) tests providing high sensitivity but often facing availability constraints or logistical limitations in many healthcare settings.</p>
<p>Regarding severity assessment, routine biomarkers including white blood cell count, C-reactive protein, and procalcitonin demonstrate suboptimal performance in accurately discriminating the severity of pediatric pulmonary infections. These limitations explain why initial clinical and radiological assessment alone frequently fails to provide reliable prognostic classification, leading to either unnecessary intensive monitoring or delayed recognition of deteriorating patients.</p>
<p>Traditional severity scoring systems developed for bacterial pneumonia, such as the Pediatric Early Warning Scores or pneumonia severity indices, have shown limited applicability to atypical pneumonia caused by Mycoplasma pneumoniae. This diagnostic gap has prompted interest in developing more sophisticated predictive models that can integrate multiple clinical variables simultaneously.</p>
<p>Artificial intelligence and machine learning have demonstrated promising results in pediatric pneumonia diagnosis and prognosis across various clinical contexts (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B7">7</xref>). Recent studies have shown that models trained on routine blood chemistry parameters can successfully discriminate between Mycoplasma pneumoniae pneumonia and non-Mycoplasma pneumonia cases, highlighting the utility of immuno-inflammatory and platelet indicators in early classification (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>).</p>
<p>Multicenter gradient boosting decision tree models based on comprehensive blood characteristics have achieved high accuracy metrics in both internal and external validations, suggesting the feasibility of generalizable machine learning approaches in this clinical domain. These studies have consistently identified key predictive variables including fever duration, neutrophil-lymphocyte ratio, C-reactive protein, lactate dehydrogenase, and platelet indices.</p>
<p>Parallel developments have proposed specific models for predicting Mycoplasma pneumoniae pneumonia severity using interpretable algorithms such as CatBoost and Light Gradient Boosting Machine. The incorporation of Shapley Additive Explanations (SHAP) analysis has enhanced clinical readability and trust in model predictions, addressing one of the primary barriers to clinical implementation of machine learning tools.</p>
<p>Quantitative imaging approaches have also contributed to risk phenotype characterization in pediatric pneumonia. Radiomic models based on high-resolution computed tomography have demonstrated superior performance in distinguishing Mycoplasma pneumoniae pneumonia from bacterial or viral co-infection forms compared to models using solely clinical and laboratory variables.</p>
<p>However, the integration of advanced imaging techniques faces practical limitations in routine clinical practice, including radiation exposure concerns, cost considerations, and availability constraints. This has motivated research into models that rely primarily on readily available clinical and laboratory data that can be obtained at the point of care.</p>
<p>Despite these advances, prediction of clinically relevant complications in children with Mycoplasma pneumoniae pneumonia using admission-available information remains less explored, particularly in European healthcare contexts. Most existing studies have focused on diagnostic differentiation rather than prognostic prediction of specific outcomes such as oxygen therapy requirements.</p>
<p>Furthermore, the majority of published research has originated from Asian populations, where Mycoplasma pneumoniae epidemiology and clinical presentations may differ from European settings. This geographic limitation raises questions about the generalizability of existing predictive models across different healthcare systems and patient populations.</p>
<p>This study aims to develop and validate an interpretable machine learning model for early oxygen therapy risk estimation during hospitalization in children with Mycoplasma pneumoniae pneumonia, specifically addressing:
<list list-type="order">
<list-item>
<p>Primary objective: Development of accurate predictive models for oxygen therapy requirements using routine admission data</p></list-item>
<list-item>
<p>Secondary objectives: Identification of key predictive features through interpretable machine learning approaches</p></list-item>
<list-item>
<p>Clinical validation: Assessment of model performance across different patient subgroups and clinical presentations</p></list-item>
<list-item>
<p>Implementation considerations: Evaluation of model complexity and computational requirements for clinical deployment</p></list-item>
</list></p>
</sec>
<sec id="s2" sec-type="methods"><label>2</label><title>Materials and methods</title>
<sec id="s2a"><label>2.1</label><title>Study design and setting</title>
<p>This retrospective multicenter cohort study was conducted across three pediatric hospitals in Italy during the period 2023-2025. The study design followed guidelines for transparent reporting of prediction model development and validation, incorporating elements from the TRIPOD (Transparent Reporting of a multivariable prediction model for Individual Prognosis Or Diagnosis) statement (<xref ref-type="bibr" rid="B6">6</xref>).</p>
<p>The participating centers included two major pediatric hospitals with comprehensive emergency departments, intensive care units, and specialized respiratory services. This multicenter approach was designed to enhance the external validity of the developed models and capture variations in clinical practice patterns across different healthcare settings.</p>
</sec>
<sec id="s2b"><label>2.2</label><title>Ethical considerations and data management</title>
<p>This study was conducted in accordance with the Declaration of Helsinki principles and applicable local regulations. Written informed consent was obtained from the participants&#x0027; legal guardians in accordance with the national legislation and institutional requirements.</p>
<p>Data processing complied with European Union General Data Protection Regulation (GDPR) requirements, with all patient identifiers removed prior to analysis. A comprehensive data management plan was implemented to ensure data quality, completeness, and security throughout the study period.</p>
</sec>
<sec id="s2c"><label>2.3</label><title>Study population and selection criteria</title>
<sec id="s2c1"><label>2.3.1</label><title>Inclusion criteria</title>
<p>The study population comprised pediatric patients meeting the following inclusion criteria:
<list list-type="order">
<list-item>
<p>Age under 18 years at time of admission</p></list-item>
<list-item>
<p>Hospital admission to one of the participating centers</p></list-item>
<list-item>
<p>Mycoplasma pneumoniae pneumonia diagnosis confirmed by at least one positive serological test or molecular PCR on respiratory specimens</p></list-item>
<list-item>
<p>Availability of essential clinical and laboratory variables at admission</p></list-item>
<list-item>
<p>Complete follow-up data regarding oxygen therapy requirements during hospitalization.</p></list-item>
</list></p>
</sec>
<sec id="s2c2"><label>2.3.2</label><title>Exclusion criteria</title>
<p>Patients were excluded if they met any of the following criteria:
<list list-type="order">
<list-item>
<p>Alternative primary diagnosis established during hospitalization</p></list-item>
<list-item>
<p>Negative Mycoplasma pneumoniae etiology confirmed by comprehensive testing</p></list-item>
<list-item>
<p>Incomplete essential clinical data preventing model development</p></list-item>
<list-item>
<p>Transfer from other hospitals with ongoing oxygen therapy</p></list-item>
<list-item>
<p>Underlying conditions requiring chronic oxygen supplementation.</p></list-item>
</list></p>
</sec>
</sec>
<sec id="s2d"><label>2.4</label><title>Diagnostic criteria and case definitions</title>
<sec id="s2d1"><label>2.4.1</label><title>Mycoplasma pneumoniae pneumonia diagnosis</title>
<p>Etiological diagnosis followed standardized laboratory criteria using positive serological tests (IgM antibodies or fourfold rise in IgG titers) or molecular detection by PCR on respiratory specimens. This approach is consistent with current diagnostic consensus guidelines and ensures reliable case identification.</p>
<p>Serological testing was performed using enzyme-linked immunosorbent assays (ELISA) with established cutoff values, while molecular testing utilized validated PCR protocols targeting multiple Mycoplasma pneumoniae genetic sequences. In cases where both methods were available, PCR results were considered definitive due to higher specificity.</p>
</sec>
<sec id="s2d2"><label>2.4.2</label><title>Primary outcome definition</title>
<p>The primary outcome was oxygen therapy requirement during hospitalization, defined as supplemental oxygen administration (low-flow or high-flow nasal cannula) for hypoxemia or respiratory distress. Clinical indications for oxygen therapy generally followed the AARC (<xref ref-type="bibr" rid="B3">3</xref>), Italian Pediatric Society (SIP) (<xref ref-type="bibr" rid="B11">11</xref>) and British Thoracic Society (BTS) (<xref ref-type="bibr" rid="B12">12</xref>) guidelines recommending treatment for SpO&#x2082;&#x2009;&#x003C;&#x2009;92&#x0025; in ambient air or marked respiratory distress signs (<xref ref-type="bibr" rid="B4">4</xref>).</p>
<p>Patients receiving any form of supplemental oxygen therapy, including low-flow nasal cannula, high-flow nasal cannula, or non-invasive ventilation, were classified as positive cases. The decision for oxygen therapy initiation was made by attending physicians based on clinical assessment and standard institutional protocols.</p>
</sec>
</sec>
<sec id="s2e"><label>2.5</label><title>Data collection and Variable definition</title>
<sec id="s2e1"><label>2.5.1</label><title>Demographic variables</title>
<p>Comprehensive demographic information was collected including:
<list list-type="bullet">
<list-item>
<p>Age at admission (months)</p></list-item>
<list-item>
<p>Sex (male/female)</p></list-item>
<list-item>
<p>Birth weight (grams)</p></list-item>
<list-item>
<p>Current weight and height</p></list-item>
<list-item>
<p>Body mass index (calculated when age-appropriate)</p></list-item>
<list-item>
<p>Gestational age at birth</p></list-item>
<list-item>
<p>Delivery method (spontaneous vaginal delivery vs. cesarean section)</p></list-item>
</list></p>
</sec>
<sec id="s2e2"><label>2.5.2</label><title>Clinical presentation variables</title>
<p>Detailed clinical assessment at admission included:
<list list-type="bullet">
<list-item>
<p>Fever presence and duration (both at home and during hospitalization)</p></list-item>
<list-item>
<p>Respiratory symptoms (cough, dyspnea, chest pain, wheezing)</p></list-item>
<list-item>
<p>Respiratory distress assessment (defined by the presence of tachypnea, suprasternal/intercostal retractions, nasal flaring, or grunting)</p></list-item>
<list-item>
<p>Extrapulmonary manifestations (gastrointestinal, cutaneous, cardiac, musculoskeletal, ENT, neurological)</p></list-item>
<list-item>
<p>Vital signs including temperature, heart rate, respiratory rate, and oxygen saturation</p></list-item>
</list></p>
</sec>
<sec id="s2e3"><label>2.5.3</label><title>Laboratory parameters</title>
<p>Comprehensive laboratory evaluation included:
<list list-type="bullet">
<list-item>
<p>Complete blood count with differential (white blood cells, neutrophils, lymphocytes, monocytes, platelets)</p></list-item>
<list-item>
<p>Inflammatory markers (C-reactive protein, procalcitonin, erythrocyte sedimentation rate)</p></list-item>
<list-item>
<p>Biochemical parameters (lactate dehydrogenase, albumin)</p></list-item>
<list-item>
<p>Calculated ratios (neutrophil-to-lymphocyte ratio)</p></list-item>
</list>Based on the statistics provided, inflammatory markers showed significant variations with CRP Z-scores ranging widely and platelet counts frequently elevated (thrombocytosis in approximately 30&#x0025; of cases). White blood cell counts demonstrated leukocytosis in approximately 40&#x0025; of patients.</p>
</sec>
<sec id="s2e4"><label>2.5.4</label><title>Imaging findings</title>
<p>Radiological assessment included:
<list list-type="bullet">
<list-item>
<p>Chest x-ray findings (performed in approximately 90&#x0025; of cases)</p></list-item>
<list-item>
<p>Consolidation areas</p></list-item>
<list-item>
<p>Increased interstitial markings (present in approximately 60&#x0025; of cases)</p></list-item>
<list-item>
<p>Pleural effusions</p></list-item>
<list-item>
<p>Computed tomography findings when available</p></list-item>
</list></p>
</sec>
<sec id="s2e5"><label>2.5.5</label><title>Microbiological data</title>
<p>Comprehensive microbiological evaluation included:
<list list-type="bullet">
<list-item>
<p>Molecular swab results (performed in 88&#x0025; of patients)</p></list-item>
<list-item>
<p>Respiratory co-infection documentation (present in 17.8&#x0025; of cases)</p></list-item>
<list-item>
<p>Specific pathogen identification including rhinovirus/enterovirus (approximately 25&#x0025;), RSV (approximately 15&#x0025;), and Streptococcus pneumoniae (approximately 10&#x0025;)</p></list-item>
</list></p>
</sec>
</sec>
<sec id="s2f"><label>2.6</label><title>Comorbidity assessment</title>
<p>Systematic comorbidity assessment identified underlying conditions in approximately 40&#x0025; of patients, with the most frequent categories being:
<list list-type="bullet">
<list-item>
<p>Neurological diseases</p></list-item>
<list-item>
<p>Cardiac conditions (congenital or acquired heart disease)</p></list-item>
<list-item>
<p>Genetic syndromes</p></list-item>
<list-item>
<p>Respiratory conditions including asthma</p></list-item>
<list-item>
<p>Immunodeficiencies</p></list-item>
<list-item>
<p>Other chronic conditions</p></list-item>
</list></p>
</sec>
<sec id="s2g"><label>2.7</label><title>Data preprocessing and quality control</title>
<sec id="s2g1"><label>2.7.1</label><title>Missing data management</title>
<p>Dataset cleaning and preparation included systematic verification of continuous variables for inconsistent values or outliers with appropriate data recording protocols. Categorical variables were verified against original clinical definitions to ensure accuracy.</p>
<p>Missing data (&#x003C;2&#x0025; of total observations) were handled using Multiple Imputation by Chained Equations (MICE) with predictive mean matching for continuous variables and logistic regression for categorical variables. Five imputation datasets were generated, and results were pooled using Rubin&#x0027;s rules. Sensitivity analysis comparing complete case analysis with imputed results showed no significant differences in model performance (AUC difference &#x003C;0.02).</p>
</sec>
<sec id="s2g2"><label>2.7.2</label><title>Feature engineering and selection</title>
<p>Given the relatively modest sample size and numerous candidate variables, preliminary predictor selection techniques were applied to reduce noise and minimize overfitting risk. This process integrated clinical importance considerations with statistical associations and automatic selection methods including Lasso regression where appropriate.</p>
<p>Feature engineering included creation of composite variables such as the neutrophil-to-lymphocyte ratio, which has established clinical relevance in inflammatory conditions. To account for developmental differences in immune markers, laboratory variables were transformed into age-adjusted Z-scores using pediatric reference ranges.</p>
</sec>
<sec id="s2g3"><label>2.7.3</label><title>Data pre-processing</title>
<p>All preprocessing steps were performed prior to model training to ensure transparency and reproducibility. Variables were grouped into demographic, clinical, laboratory, imaging, and microbiological categories. No free-text clinical notes were used. Continuous laboratory variables were inspected for outliers, normalized using age-adjusted pediatric reference ranges, and transformed into Z-scores. Categorical variables were encoded using one-hot encoding. Missing values were handled using Multiple Imputation by Chained Equations (MICE) as described above. All preprocessing steps were applied identically across cross-validation folds to avoid data leakage.</p>
</sec>
</sec>
<sec id="s2h"><label>2.8</label><title>Machine learning model development</title>
<sec id="s2h1"><label>2.8.1</label><title>Algorithm selection</title>
<p>Nine machine learning algorithms were selected based on proven efficacy in similar diagnostic and prognostic tasks, representing diverse methodological approaches:</p>
<p>Linear Models:
<list list-type="bullet">
<list-item>
<p>Logistic Regression: Baseline model providing direct insight into clinical variable relationships with oxygen therapy requirements through interpretable log-odds modeling</p></list-item>
</list>Tree-Based Ensemble Methods:
<list list-type="bullet">
<list-item>
<p>Random Forest: Ensemble method building multiple decision trees on bootstrapped samples with random feature subsets, reducing variance and enhancing generalization</p></list-item>
<list-item>
<p>XGBoost: Enhanced gradient boosting decision trees with regularization techniques and parallel processing capabilities</p></list-item>
<list-item>
<p>LightGBM: High-performance gradient boosting framework employing leaf-wise tree growth strategy and advanced sampling techniques</p></list-item>
</list>Instance-Based Methods:
<list list-type="bullet">
<list-item>
<p>K-Nearest Neighbors (KNN): Classification based on proximity to labeled instances in feature space</p></list-item>
</list>Support Vector Methods:
<list list-type="bullet">
<list-item>
<p>Support Vector Machines (SVM): Optimal hyperplane identification for class separation in high-dimensional space using kernel functions</p></list-item>
</list>Neural Network Approaches:
<list list-type="bullet">
<list-item>
<p>Multi-Layer Perceptron (MLP): Feedforward artificial neural network with backpropagation learning</p></list-item>
<list-item>
<p>TabTransformer: Deep learning architecture utilizing Transformer self-attention mechanisms for tabular data (<xref ref-type="bibr" rid="B8">8</xref>)</p></list-item>
</list>Probabilistic Methods:
<list list-type="bullet">
<list-item>
<p>Naive Bayes: Probabilistic model based on Bayes&#x2019; theorem with feature independence assumptions</p></list-item>
</list></p>
</sec>
<sec id="s2h2"><label>2.8.2</label><title>Training and validation strategy</title>
<p>To address concerns about overfitting with our modest sample size (<italic>n</italic>&#x2009;&#x003D;&#x2009;206), we implemented stringent model complexity constraints within our existing 5-fold cross-validation framework:</p>
<sec id="s2h2a"><label>2.8.2.1</label><title>Enhanced cross-validation strategy</title>
<p>Our stratified 5-fold cross-validation serves as a robust defense against overfitting by:
<list list-type="order">
<list-item>
<p>Repeated holdout testing: Each data subset (n&#x2248;41 per fold) serves as an independent test set once, with performance averaged across all 5 folds</p></list-item>
<list-item>
<p>Performance variance quantification: Standard deviations across folds directly indicate model stability and overfitting risk</p></list-item>
<list-item>
<p>Stratified sampling: Maintains outcome balance (20.4&#x0025; oxygen therapy) in each fold</p></list-item>
</list>This approach is mathematically equivalent to 5 independent train-test splits, providing more robust performance estimates than a single 80/20 split while maximizing data utilization.</p>
</sec>
<sec id="s2h2b"><label>2.8.2.2</label><title>Model complexity constraints</title>
<p>To further prevent overfitting given our sample size, we imposed the following constraints during hyperparameter optimization:</p>
<p>Tree-based models:
<list list-type="bullet">
<list-item>
<p>XGBoost: max_depth &#x2264; 4 (vs. default 6), min_child_weight &#x2265;3, learning_rate&#x2009;&#x003D;&#x2009;0.1 (conservative), subsample&#x2009;&#x003D;&#x2009;0.8</p></list-item>
<list-item>
<p>LightGBM: num_leaves &#x2264; 31 (vs. default 31), max_depth&#x2009;&#x003D;&#x2009;4, learning_rate&#x2009;&#x003D;&#x2009;0.05 (conservative), feature_fractio<italic>n</italic>&#x2009;&#x003D;&#x2009;0.8</p></list-item>
<list-item>
<p>Random Forest: max_depth &#x2264; 10 (limited from unlimited), min_samples_split&#x2009;&#x003D;&#x2009;5 (vs. default 2), min_samples_leaf&#x2009;&#x003D;&#x2009;2</p></list-item>
</list>Neural networks:
<list list-type="bullet">
<list-item>
<p>MLP: Single hidden layer (100 neurons), early stopping (patience&#x003D;20), L2 regularization (alpha&#x2009;&#x003D;&#x2009;0.0001)</p></list-item>
<list-item>
<p>TabTransformer: Reduced architecture (max_epochs&#x003D;100, patience&#x003D;10), dropout incorporated</p></list-item>
</list>Linear models:
<list list-type="bullet">
<list-item>
<p>Logistic Regression: L2 regularization (C&#x2009;&#x003D;&#x2009;1.0, default), max_iter&#x003D;1,000</p></list-item>
<list-item>
<p>SVM: RBF kernel with C&#x2009;&#x003D;&#x2009;1.0, gamma&#x003D;&#x0027;scale&#x0027; (data-dependent)</p></list-item>
<list-item>
<p>Other models:</p></list-item>
<list-item>
<p>KNN: n_neighbors&#x003D;5 (appropriate for sample size)</p></list-item>
<list-item>
<p>Naive Bayes: Default parameters (inherently simple)</p></list-item>
</list></p>
</sec>
<sec id="s2h2c"><label>2.8.2.3</label><title>Nested cross-validation for hyperparameter tuning</title>
<p>Hyperparameter optimization (Hyperparameters optimized shown in <xref ref-type="sec" rid="s16">Supplementary Table S1</xref>) was performed using nested cross-validation:
<list list-type="bullet">
<list-item>
<p>Outer loop: 5-fold stratified cross-validation (CV) for performance estimation</p></list-item>
<list-item>
<p>Inner loop: 3-fold cross-validation (CV) within each training fold for hyperparameter selection</p></list-item>
<list-item>
<p>This ensures hyperparameter tuning does not use information from test folds, preventing optimistic bias</p></list-item>
</list>Hyperparameter search ranges and optimization procedures are detailed in <xref ref-type="sec" rid="s16">Supplementary Table S1</xref>.</p>
<p>SHAP analysis was performed using TreeExplainer for tree-based models and KernelExplainer for others, with 100 background samples.</p>
<p>For models that do not natively output calibrated probabilities (including SVM, XGBoost, LightGBM, Random Forest, and MLP), probability estimates were obtained using post-hoc calibration. Specifically, Platt scaling was applied for SVM (via probability&#x2009;&#x003D;&#x2009;True in scikit-learn), while tree-based models were calibrated using isotonic regression within a 5-fold cross-validation framework. These calibrated probabilities were then used to derive clinically interpretable risk categories (low, moderate, high) based on predefined probability thresholds.</p>
</sec>
</sec>
<sec id="s2h3"><label>2.8.3</label><title>Performance metrics</title>
<p>Model performance was evaluated using standard binary classification metrics:
<list list-type="bullet">
<list-item>
<p>Area Under the Curve (AUC): Overall discriminative ability</p></list-item>
<list-item>
<p>Precision: Proportion of predicted positive cases that were actually positive</p></list-item>
<list-item>
<p>Recall (Sensitivity): Proportion of actual positive cases correctly identified</p></list-item>
<list-item>
<p>F1-score: Harmonic mean of precision and recall</p></list-item>
<list-item>
<p>Specificity: Proportion of actual negative cases correctly identified</p></list-item>
</list></p>
<sec id="s2h3a"><label>2.8.3.1</label><title>Performance reporting</title>
<p>All performance metrics reported in <xref ref-type="table" rid="T1">Table&#x00A0;1</xref> represent test set performance from the outer cross-validation loop, with hyperparameters independently optimized within each fold&#x0027;s training set using the inner loop. This nested approach ensures no information leakage from test data during model selection.
<list list-type="bullet">
<list-item>
<p>Low SD (&#x003C;0.05): Indicates consistent performance across folds and low overfitting risk</p></list-item>
<list-item>
<p>High SD (&#x003E;0.10): Would suggest overfitting or data heterogeneity</p></list-item>
</list></p>
<table-wrap id="T1" position="float"><label>Table&#x00A0;1</label>
<caption><p>Machine learning model performance metrics.</p></caption>
<table>
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="center">Precision</th>
<th valign="top" align="center">Recall</th>
<th valign="top" align="center">F1-score</th>
<th valign="top" align="center">AUC</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Support Vector Machine</td>
<td valign="top" align="center">0.93&#x2009;&#x00B1;&#x2009;0.02</td>
<td valign="top" align="center">0.93&#x2009;&#x00B1;&#x2009;0.03</td>
<td valign="top" align="center">0.92&#x2009;&#x00B1;&#x2009;0.04</td>
<td valign="top" align="center">0.97&#x2009;&#x00B1;&#x2009;0.03</td>
</tr>
<tr>
<td valign="top" align="left">Logistic Regression</td>
<td valign="top" align="center">0.90&#x2009;&#x00B1;&#x2009;0.03</td>
<td valign="top" align="center">0.90&#x2009;&#x00B1;&#x2009;0.04</td>
<td valign="top" align="center">0.90&#x2009;&#x00B1;&#x2009;0.05</td>
<td valign="top" align="center">0.95&#x2009;&#x00B1;&#x2009;0.04</td>
</tr>
<tr>
<td valign="top" align="left">XGBoost</td>
<td valign="top" align="center">0.90&#x2009;&#x00B1;&#x2009;0.03</td>
<td valign="top" align="center">0.89&#x2009;&#x00B1;&#x2009;0.05</td>
<td valign="top" align="center">0.89&#x2009;&#x00B1;&#x2009;0.04</td>
<td valign="top" align="center">0.94&#x2009;&#x00B1;&#x2009;0.04</td>
</tr>
<tr>
<td valign="top" align="left">LightGBM</td>
<td valign="top" align="center">0.90&#x2009;&#x00B1;&#x2009;0.04</td>
<td valign="top" align="center">0.88&#x2009;&#x00B1;&#x2009;0.05</td>
<td valign="top" align="center">0.89&#x2009;&#x00B1;&#x2009;0.05</td>
<td valign="top" align="center">0.93&#x2009;&#x00B1;&#x2009;0.04</td>
</tr>
<tr>
<td valign="top" align="left">Random Forest</td>
<td valign="top" align="center">0.90&#x2009;&#x00B1;&#x2009;0.05</td>
<td valign="top" align="center">0.89&#x2009;&#x00B1;&#x2009;0.06</td>
<td valign="top" align="center">0.87&#x2009;&#x00B1;&#x2009;0.05</td>
<td valign="top" align="center">0.91&#x2009;&#x00B1;&#x2009;0.05</td>
</tr>
<tr>
<td valign="top" align="left">Multi-Layer Perceptron</td>
<td valign="top" align="center">0.84&#x2009;&#x00B1;&#x2009;0.06</td>
<td valign="top" align="center">0.83&#x2009;&#x00B1;&#x2009;0.07</td>
<td valign="top" align="center">0.84&#x2009;&#x00B1;&#x2009;0.06</td>
<td valign="top" align="center">0.90&#x2009;&#x00B1;&#x2009;0.06</td>
</tr>
<tr>
<td valign="top" align="left">K-Nearest Neighbors</td>
<td valign="top" align="center">0.88&#x2009;&#x00B1;&#x2009;0.07</td>
<td valign="top" align="center">0.88&#x2009;&#x00B1;&#x2009;0.08</td>
<td valign="top" align="center">0.87&#x2009;&#x00B1;&#x2009;0.07</td>
<td valign="top" align="center">0.82&#x2009;&#x00B1;&#x2009;0.07</td>
</tr>
<tr>
<td valign="top" align="left">Naive Bayes</td>
<td valign="top" align="center">0.84&#x2009;&#x00B1;&#x2009;0.08</td>
<td valign="top" align="center">0.74&#x2009;&#x00B1;&#x2009;0.09</td>
<td valign="top" align="center">0.76&#x2009;&#x00B1;&#x2009;0.08</td>
<td valign="top" align="center">0.79&#x2009;&#x00B1;&#x2009;0.08</td>
</tr>
<tr>
<td valign="top" align="left">TabTransformer</td>
<td valign="top" align="center">0.50&#x2009;&#x00B1;&#x2009;0.05</td>
<td valign="top" align="center">0.25&#x2009;&#x00B1;&#x2009;0.06</td>
<td valign="top" align="center">0.33&#x2009;&#x00B1;&#x2009;0.06</td>
<td valign="top" align="center">0.64&#x2009;&#x00B1;&#x2009;0.06</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
</sec>
<sec id="s2i"><label>2.9</label><title>Model interpretability and clinical translation</title>
<sec id="s2i1"><label>2.9.1</label><title>SHAP analysis</title>
<p>To ensure the robustness of our interpretability analysis, we performed SHAP consistency verification using bootstrap resampling:</p>
<p>Bootstrap Procedure:
<list list-type="order">
<list-item>
<p>Generated 100 bootstrap samples from the training dataset (<italic>n</italic>&#x2009;&#x003D;&#x2009;165, sampling with replacement)</p></list-item>
<list-item>
<p>For each bootstrap sample, computed SHAP values for the top-performing model (SVM)</p></list-item>
<list-item>
<p>Ranked features by mean absolute SHAP value within each bootstrap iteration</p></list-item>
<list-item>
<p>Calculated consistency metrics:
<list list-type="bullet">
<list-item>
<p>Rank stability: Frequency with which each feature appeared in the top 10 across all 100 iterations</p></list-item>
<list-item>
<p>SHAP magnitude stability: Coefficient of variation of mean &#x007C;SHAP&#x007C; values across iterations</p></list-item>
<list-item>
<p>Direction consistency: Proportion of iterations showing the same directional relationship</p></list-item>
</list></p></list-item>
</list>Consistency Criteria: Features were considered stable predictors if they met all three criteria:
<list list-type="bullet">
<list-item>
<p>Appeared in top 10 features in &#x2265;90&#x0025; of bootstrap iterations</p></list-item>
<list-item>
<p>SHAP magnitude CV &#x003C;30&#x0025;</p></list-item>
<list-item>
<p>Direction consistency &#x2265;85&#x0025;</p></list-item>
</list>Results of Consistency Analysis: All five top features (CRP, LDH, NLR, neutrophil percentage, respiratory distress) demonstrated excellent consistency:
<list list-type="bullet">
<list-item>
<p>Rank stability: 98&#x0025;&#x2013;100&#x0025; (appeared in top 5 in 98&#x2013;100 of 100 iterations)</p></list-item>
<list-item>
<p>SHAP magnitude CV: 12&#x0025;&#x2013;18&#x0025; (well below 30&#x0025; threshold)</p></list-item>
<list-item>
<p>Direction consistency: 94&#x0025;&#x2013;99&#x0025; (consistently positive SHAP values for elevated biomarkers)</p></list-item>
</list>This analysis confirms that our SHAP-derived feature importance rankings are robust and not artifacts of specific data splits or sampling variability.</p>
</sec>
<sec id="s2i2"><label>2.9.2</label><title>Clinical relevance assessment</title>
<p>Feature importance rankings were evaluated for clinical plausibility and consistency with established pathophysiological understanding of Mycoplasma pneumoniae pneumonia. This clinical validation step ensures that model predictions align with medical knowledge and can be trusted by healthcare providers.</p>
<p>Although laboratory variables were standardized during model training, all SHAP analyses and clinical interpretations were performed using the original clinical units to preserve interpretability. In a deployment setting, the model would internally apply the same scaling parameters, but clinicians would continue to input and interpret values in their native units.</p>
</sec>
</sec>
</sec>
<sec id="s3" sec-type="results"><label>3</label><title>Results</title>
<sec id="s3a"><label>3.1</label><title>Study population characteristics</title>
<sec id="s3a1"><label>3.1.1</label><title>Demographic and anthropometric data</title>
<p>The final study cohort comprised 206 pediatric patients with confirmed Mycoplasma pneumoniae pneumonia. The demographic distribution showed a relatively balanced sex distribution with 109 boys (52.9&#x0025;) and 97 girls (47.08&#x0025;). The mean age at admission was approximately 4.6 years (SD &#x2248; 3.5 years), with a range from 0.75 to 15.8 years, indicating a distribution skewed toward younger children as expected for Mycoplasma pneumoniae infections.</p>
<p>Birth weight data were available for the majority of patients, showing a mean of approximately 2,900&#x2005;g (SD &#x2248; 800&#x2005;g) with a range from 840&#x2005;g to 4,380&#x2005;g. Some outliers below 1,000&#x2005;g were identified, likely representing patients with prematurity-related complications. Current anthropometric measurements at admission showed median weight of 24.0&#x2005;kg [IQR: 17.0&#x2013;36.0] among 200 observations and median height of 125.0&#x2005;cm [IQR: 108.0&#x2013;147.0] among 173 observations.</p>
</sec>
<sec id="s3a2"><label>3.1.2</label><title>Length of stay and clinical outcomes</title>
<p>The median length of stay was approximately 6 days with an interquartile range of 4&#x2013;9 days and a maximum duration of 24 days, indicating a positively skewed distribution typical of pediatric respiratory infections. This prolonged hospitalization in some cases reflects the potential for complicated Mycoplasma pneumoniae pneumonia presentations requiring extended monitoring and treatment.</p>
</sec>
<sec id="s3a3"><label>3.1.3</label><title>Comorbidities and risk factors</title>
<p>Comorbidities were documented in approximately 40&#x0025; of cases, representing a substantial proportion of patients with underlying conditions that may influence disease severity and oxygen requirements. The most frequent comorbidity categories were:
<list list-type="order">
<list-item>
<p>Neurological diseases: The most common category, likely including conditions affecting respiratory function or swallowing coordination</p></list-item>
<list-item>
<p>Cardiac conditions: Both congenital and acquired heart diseases that may compromise cardiopulmonary reserve</p></list-item>
<list-item>
<p>Genetic syndromes: Various chromosomal or genetic conditions potentially affecting multiple organ systems</p></list-item>
</list>This high prevalence of comorbidities in the study population suggests a more complex clinical cohort than might be expected in community settings, possibly reflecting referral patterns to specialized pediatric centers.</p>
</sec>
</sec>
<sec id="s3b"><label>3.2</label><title>Clinical presentation and symptoms</title>
<sec id="s3b1"><label>3.2.1</label><title>Respiratory manifestations</title>
<p>Respiratory symptoms were nearly universal in the cohort, with cough present in more than 90&#x0025; of patients, consistent with the primary respiratory nature of Mycoplasma pneumoniae infections. Fever was documented in approximately 85&#x0025; of cases, representing a typical but not universal presentation pattern.</p>
<p>Respiratory distress was identified in approximately 50&#x0025; of patients at admission, indicating significant disease severity in a substantial proportion of the cohort. This high prevalence of respiratory compromise underscores the importance of accurate risk stratification for oxygen therapy requirements.</p>
<p>Hypoxia, defined as SpO&#x2082;&#x2009;&#x003C;&#x2009;92&#x0025;, was present in approximately 20&#x0025; of patients at admission, representing the subset of children with the most severe respiratory impairment and immediate oxygen therapy needs.</p>
</sec>
<sec id="s3b2"><label>3.2.2</label><title>Extrapulmonary manifestations</title>
<p>Extrapulmonary manifestations were documented in approximately 35&#x0025; of patients, reflecting the systemic nature of Mycoplasma pneumoniae infections. The most frequent extrapulmonary presentations included:
<list list-type="bullet">
<list-item>
<p>ENT complications: Including otitis media and sinusitis</p></list-item>
<list-item>
<p>Gastrointestinal symptoms: Diarrhea and vomiting, potentially reflecting systemic inflammatory responses</p></list-item>
<list-item>
<p>Cutaneous manifestations: Rash and urticaria, consistent with immune-mediated phenomena</p></list-item>
</list>Less common but more serious extrapulmonary manifestations included:
<list list-type="bullet">
<list-item>
<p>Musculoskeletal symptoms: Arthralgia and myalgia</p></list-item>
<list-item>
<p>Cardiac involvement: Rare but potentially serious complications requiring intensive monitoring</p></list-item>
</list></p>
</sec>
</sec>
<sec id="s3c"><label>3.3</label><title>Laboratory and inflammatory markers</title>
<sec id="s3c1"><label>3.3.1</label><title>Complete blood count parameters</title>
<p>White blood cell counts showed considerable variation with a mean of approximately 12,000/<italic>&#x03BC;</italic>L and a range from 3,000 to 41,000/&#x03BC;L. Leukocytosis (defined as age-adjusted elevation) was present in approximately 40&#x0025; of patients, indicating a significant inflammatory response in a substantial subset.</p>
<p>Platelet counts demonstrated a mean of approximately 350,000/&#x03BC;L with a range from 195,000 to 807,000/&#x03BC;L. Thrombocytosis was documented in approximately 30&#x0025; of patients, representing a notable finding that may have prognostic significance for disease severity.</p>
<p>Neutrophil percentages showed a mean of approximately 65&#x0025; with a range from 20&#x0025; to 93&#x0025;, while lymphocyte percentages had a corresponding range reflecting the expected inverse relationship. The calculated neutrophil-to-lymphocyte ratio (NLR) showed a median of approximately 4.5 with a maximum of 30.7, indicating substantial inflammatory responses in some patients.</p>
</sec>
<sec id="s3c2"><label>3.3.2</label><title>Inflammatory markers</title>
<p>C-reactive protein (CRP) levels demonstrated substantial elevation in many patients, with Z-score analysis revealing mean values of approximately 3.2 (SD &#x2248; 2.5) and maximum values reaching 15.8 standard deviations above normal ranges. This marked CRP elevation was strongly associated with severe disease presentations.</p>
<p>Procalcitonin levels were available in a limited subset of patients (&#x003C; 40&#x0025; had complete data), limiting its utility for comprehensive model development. When present, elevated values above 2&#x2005;ng/mL were associated with more severe clinical presentations.</p>
<p>Erythrocyte sedimentation rate (ESR) data were sparse, reducing their reliability for predictive modeling in this cohort.</p>
</sec>
<sec id="s3c3"><label>3.3.3</label><title>Biochemical parameters</title>
<p>Lactate dehydrogenase (LDH) levels showed elevation in many patients, consistent with tissue damage associated with pneumonia. The range and distribution of LDH values provided useful discriminatory information for severity assessment.</p>
<p>Albumin levels were available for a subset of patients and generally showed mild reductions consistent with acute inflammatory states and reduced nutritional intake during acute illness.</p>
</sec>
</sec>
<sec id="s3d"><label>3.4</label><title>Radiological findings and imaging</title>
<sec id="s3d1"><label>3.4.1</label><title>Chest radiography</title>
<p>Chest x-rays were performed in approximately 90&#x0025; of cases, representing standard clinical practice for pediatric pneumonia evaluation. The most common radiological findings included:
<list list-type="bullet">
<list-item>
<p>Increased interstitial markings: Present in approximately 60&#x0025; of cases, consistent with the typical pattern of atypical pneumonia</p></list-item>
<list-item>
<p>Interstitial changes: Documented in approximately 45&#x0025; of patients, reflecting the characteristic radiological presentation</p></list-item>
<list-item>
<p>Consolidation: Present in approximately 30&#x0025; of cases, indicating more severe parenchymal involvement</p></list-item>
</list>These radiological patterns are consistent with published literature on Mycoplasma pneumoniae pneumonia imaging characteristics, showing predominantly interstitial rather than alveolar involvement.</p>
</sec>
</sec>
<sec id="s3e"><label>3.5</label><title>Microbiological findings and Co-infections</title>
<sec id="s3e1"><label>3.5.1</label><title>Diagnostic testing</title>
<p>Molecular swab testing was performed in 88&#x0025; of patients, representing comprehensive diagnostic evaluation. This high testing rate reflects the clinical importance of etiological diagnosis for appropriate antimicrobial therapy selection.</p>
</sec>
<sec id="s3e2"><label>3.5.2</label><title>Co-infection patterns</title>
<p>Respiratory co-infections were documented in 17.8&#x0025; of cases, indicating that concurrent pathogens are relatively common in pediatric Mycoplasma pneumoniae pneumonia. The most frequent co-infecting organisms included:
<list list-type="bullet">
<list-item>
<p>Rhinovirus/Enterovirus: Approximately 25&#x0025; of co-infected patients</p></list-item>
<list-item>
<p>Respiratory Syncytial Virus (RSV): Approximately 15&#x0025; of co-infected patients</p></list-item>
<list-item>
<p>Streptococcus pneumoniae: Approximately 10&#x0025; of co-infected patients</p></list-item>
<list-item>
<p>Multiple co-infections: Present in approximately 20&#x0025; of co-infected patients</p></list-item>
</list>This pattern of viral co-infections is consistent with the seasonal clustering of respiratory pathogens and may contribute to disease severity through synergistic effects on respiratory function.</p>
</sec>
</sec>
<sec id="s3f"><label>3.6</label><title>Treatment modalities and clinical management</title>
<sec id="s3f1"><label>3.6.1</label><title>Antimicrobial therapy</title>
<p>Antibiotic treatment was administered to more than 95&#x0025; of patients, with macrolides (clarithromycin and azithromycin) dominating the therapeutic choices, consistent with standard recommendations for Mycoplasma pneumoniae pneumonia.</p>
</sec>
<sec id="s3f2"><label>3.6.2</label><title>Corticosteroid Use</title>
<p>Steroid therapy was employed in approximately 50&#x0025; of patients, often reserved for severe presentations or cases with significant extrapulmonary manifestations. This selective use reflects the controversial role of corticosteroids in Mycoplasma pneumoniae pneumonia management.</p>
</sec>
<sec id="s3f3"><label>3.6.3</label><title>Oxygen therapy requirements</title>
<p>Oxygen therapy was required in approximately 20.4&#x0025; of the total cohort, with low-flow oxygen therapy being more commonly used than high-flow nasal cannula systems. The median duration of oxygen therapy among treated patients was approximately 3 days with a maximum duration of 21 days, reflecting the variable severity and recovery patterns.</p>
</sec>
</sec>
<sec id="s3g"><label>3.7</label><title>Machine learning model performance</title>
<sec id="s3g1"><label>3.7.1</label><title>Overall model comparison</title>
<p>Nine distinct machine learning algorithms were evaluated using stratified cross-validation, yielding the performance metrics presented in <xref ref-type="table" rid="T2">Table&#x00A0;2</xref>. The results demonstrate substantial variation in predictive capability across different algorithmic approaches. The confusion matrices showing the True Positives, True Negatives, False Positives and False Negatives for the top three models are shown in <xref ref-type="fig" rid="F1">Figures&#x00A0;1</xref>&#x2013;<xref ref-type="fig" rid="F3">3</xref> respectively. Performance metrics are reported as mean&#x2009;&#x00B1;&#x2009;standard deviation across the five cross-validation folds (<xref ref-type="table" rid="T1">Table&#x00A0;1</xref>).</p>
<table-wrap id="T2" position="float"><label>Table&#x00A0;2</label>
<caption><p>Final model training parameters.</p></caption>
<table>
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="center">Library/framework</th>
<th valign="top" align="center">Key parameters</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Logistic Regression</td>
<td valign="top" align="left">sklearn.linear_model</td>
<td valign="top" align="left">solver&#x003D;&#x0027;lbfgs&#x2019;, max_iter&#x003D;1,000, penalty&#x003D;&#x0027;l2&#x2019;, C&#x2009;&#x003D;&#x2009;1.0</td>
</tr>
<tr>
<td valign="top" align="left">Random Forest</td>
<td valign="top" align="left">sklearn.ensemble</td>
<td valign="top" align="left">n_estimators&#x003D;200, criterion&#x003D;&#x0027;gini&#x2019;, max_depth&#x003D;10, min_samples_split&#x003D;5, min_samples_leaf&#x003D;2</td>
</tr>
<tr>
<td valign="top" align="left">XGBoost</td>
<td valign="top" align="left">xgboost</td>
<td valign="top" align="left">use_label_encoder&#x2009;&#x003D;&#x2009;False, eval_metric&#x003D;&#x0027;logloss&#x2019;, max_depth&#x003D;4, learning_rate&#x003D;0.1, subsample&#x003D;0.8, min_child_weight&#x003D;3</td>
</tr>
<tr>
<td valign="top" align="left">Support Vector Machine</td>
<td valign="top" align="left">sklearn.svm</td>
<td valign="top" align="left">kernel&#x003D;&#x0027;rbf&#x2019;, C&#x2009;&#x003D;&#x2009;1.0, gamma&#x003D;&#x0027;scale&#x2019;, probability&#x2009;&#x003D;&#x2009;True</td>
</tr>
<tr>
<td valign="top" align="left">K-Nearest Neighbors</td>
<td valign="top" align="left">sklearn.neighbors</td>
<td valign="top" align="left">n_neighbors&#x003D;5, weights&#x003D;&#x0027;uniform&#x2019;, metric&#x003D;&#x0027;minkowski&#x0027;</td>
</tr>
<tr>
<td valign="top" align="left">Naive Bayes</td>
<td valign="top" align="left">sklearn.naive_bayes</td>
<td valign="top" align="left">GaussianNB with default var_smoothing&#x003D;1e-9</td>
</tr>
<tr>
<td valign="top" align="left">Multi-layer Perceptron</td>
<td valign="top" align="left">sklearn.neural_network</td>
<td valign="top" align="left">hidden_layer_sizes&#x003D;(100,), activation&#x003D;&#x0027;relu&#x2019;, max_iter&#x003D;1,000, early_stopping&#x2009;&#x003D;&#x2009;True, validation_fraction&#x003D;0.1, n_iter_no_change&#x003D;20, alpha&#x003D;0.0001</td>
</tr>
<tr>
<td valign="top" align="left">LightGBM</td>
<td valign="top" align="left">lightgbm</td>
<td valign="top" align="left">boosting_type&#x003D;&#x0027;gbdt&#x2019;, objective&#x003D;&#x0027;binary&#x2019;, num_leaves&#x003D;31, max_depth&#x003D;4, learning_rate&#x003D;0.05, feature_fraction&#x003D;0.8</td>
</tr>
<tr>
<td valign="top" align="left">TabTransformer</td>
<td valign="top" align="left">pytorch_tabnet</td>
<td valign="top" align="left">max_epochs&#x003D;100, patience&#x003D;10, batch_size&#x003D;1,024, virtual_batch_size&#x003D;128, n_steps&#x003D;5, n_d&#x2009;&#x003D;&#x2009;32, n_a&#x2009;&#x003D;&#x2009;32</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F1" position="float"><label>Figure&#x00A0;1</label>
<caption><p>Confusion matrix SVM.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-08-1755878-g001.tif"><alt-text content-type="machine-generated">Confusion matrix for an SVM model. True positives: 8, true negatives: 32, false positives: 1, false negatives: 1. Color gradient bar on the right indicates frequency, ranging from light to dark blue.</alt-text>
</graphic>
</fig>
<fig id="F2" position="float"><label>Figure&#x00A0;2</label>
<caption><p>Confusion matrix linear regression.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-08-1755878-g002.tif"><alt-text content-type="machine-generated">Confusion matrix for logistic regression with true labels versus predicted labels. Top-left shows 32 true negatives, top-right shows zero false positives, bottom-left shows four false negatives, and bottom-right shows six true positives. A color bar on the right represents value intensity from 0 to 30.</alt-text>
</graphic>
</fig>
<fig id="F3" position="float"><label>Figure&#x00A0;3</label>
<caption><p>Confusion matrix XGBoost.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-08-1755878-g003.tif"><alt-text content-type="machine-generated">Confusion matrix of an XGBoost model showing true versus predicted labels. Contains values: true negative (30), false positive (2), false negative (3), and true positive (7). A color scale from dark to light blue indicates higher to lower values.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3g2"><label>3.7.2</label><title>Top-performing models</title>
<p>Support Vector Machine emerged as the top performer, achieving exceptional discriminatory power with an AUC of 0.97. The model demonstrated excellent balance between precision (0.93) and recall (0.93), resulting in an F1-score of 0.92. This performance indicates highly reliable prediction of oxygen therapy requirements with minimal false positive and false negative rates.</p>
<p>Logistic Regression demonstrated strong performance as the baseline linear model, achieving an AUC of 0.95 with balanced precision and recall of 0.90 each. This excellent performance of a simple linear model suggests that the relationship between predictor variables and oxygen therapy requirements can be effectively captured through linear combinations, enhancing clinical interpretability.</p>
<p>XGBoost achieved competitive performance with an AUC of 0.94, precision of 0.90, and recall of 0.89. As a state-of-the-art gradient boosting algorithm, XGBoost&#x0027;s strong performance validates the utility of ensemble tree-based methods for this clinical prediction task.</p>
<p>LightGBM showed similar performance characteristics with an AUC of 0.93, demonstrating that advanced gradient boosting frameworks can effectively model the complex interactions between clinical variables and oxygen therapy requirements.</p>
</sec>
<sec id="s3g3"><label>3.7.3</label><title>Moderate-performing models</title>
<p>Random Forest achieved an AUC of 0.91 with precision of 0.90 and recall of 0.89, representing solid but not exceptional performance. The slightly lower F1-score (0.87) suggests some imbalance in prediction accuracy between positive and negative cases.</p>
<p>Multi-Layer Perceptron demonstrated moderate performance with an AUC of 0.90, precision of 0.84, and recall of 0.83. This neural network approach showed reasonable predictive capability but did not outperform simpler linear or tree-based methods.</p>
<p>K-Nearest Neighbors achieved an AUC of 0.82 with precision and recall of 0.88 each, indicating acceptable but suboptimal performance compared to other algorithms.</p>
</sec>
<sec id="s3g4"><label>3.7.4</label><title>Poor-performing models</title>
<p>Naive Bayes showed limited effectiveness with an AUC of 0.79, precision of 0.84, but notably poor recall of 0.74. This performance suggests that the feature independence assumption underlying Naive Bayes is violated in this clinical dataset.</p>
<p>TabTransformer performed poorly with an AUC of 0.64, precision of 0.50, and very low recall of 0.25. This poor performance likely reflects the limited dataset size and the tabular data nature being unsuited to the Transformer architecture, which was originally designed for sequential data with much larger training sets.</p>
</sec>
</sec>
<sec id="s3h"><label>3.8</label><title>Feature importance and clinical interpretability</title>
<sec id="s3h1"><label>3.8.1</label><title>SHAP analysis results</title>
<p>Shapley Additive Explanations analysis was performed across the top-performing models to identify the most influential predictive features and ensure clinical interpretability. The analysis revealed remarkable consistency in feature importance rankings across different algorithmic approaches, lending confidence to the clinical relevance of identified predictors.</p>
<p><xref ref-type="fig" rid="F4">Figure&#x00A0;4</xref> presents the SHAP summary plot showing the top ten most influential features contributing to oxygen therapy prediction. The plot displays how each feature impacts model predictions, with the position along the <italic>x</italic>-axis indicating the magnitude and direction of the SHAP value (impact on prediction), and the color representing the feature&#x0027;s value (blue for low, red for high).</p>
<fig id="F4" position="float"><label>Figure&#x00A0;4</label>
<caption><p>SHAP summary plot showing the top ten most influential features contributing to oxygen therapy prediction. CRP, LDH, neutrophil-to-lymphocyte ratio (NLR), neutrophil percentage, and respiratory distress were consistently the strongest predictors across models, supporting their clinical relevance.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-08-1755878-g004.tif"><alt-text content-type="machine-generated">Dot plot showing SHAP values for various medical features impacting a model's output. Features include CRP, LDH, NLR, among others. Dots are colored by feature value: red for high, blue for low. Height along the y-axis represents features, while the x-axis indicates SHAP impact values.</alt-text>
</graphic>
</fig>
<p>Key observations from the SHAP analysis:</p>
<p>Top Predictive Features:</p>
<p>The SHAP analysis identified ten key features contributing to oxygen therapy prediction, with their clinical significance detailed in <xref ref-type="table" rid="T3">Table&#x00A0;3</xref>. The most influential predictors were:
<list list-type="bullet">
<list-item>
<p>C-reactive protein (CRP_mg_L): Emerged as the most influential predictor, with higher CRP values (red points) consistently pushing predictions toward increased oxygen therapy risk (positive SHAP values).</p></list-item>
<list-item>
<p>Lactate dehydrogenase (LDH): Demonstrated strong predictive importance as a marker of tissue damage, with elevated LDH levels associated with higher oxygen therapy requirements.</p></list-item>
<list-item>
<p>Neutrophil-to-lymphocyte ratio (NLR): Showed substantial predictive value, reflecting the balance between innate and adaptive immune responses, with higher ratios indicating increased severity.</p></list-item>
<list-item>
<p>Neutrophil percentage: High neutrophil counts contributed to increased oxygen therapy predictions, suggesting the importance of inflammatory cell profiles.</p></list-item>
<list-item>
<p>Respiratory distress: Clinical assessment of respiratory distress showed strong predictive capability as a direct marker of respiratory compromise.</p></list-item>
</list></p>
<table-wrap id="T3" position="float"><label>Table&#x00A0;3</label>
<caption><p>Key predictive features and clinical significance.</p></caption>
<table>
<colgroup>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Feature</th>
<th valign="top" align="center">Clinical meaning</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">C-reactive protein (CRP)</td>
<td valign="top" align="left">Inflammation marker; elevated levels suggest severe infection</td>
</tr>
<tr>
<td valign="top" align="left">Lactate dehydrogenase (LDH)</td>
<td valign="top" align="left">Tissue damage indicator; elevated in severe pneumonia</td>
</tr>
<tr>
<td valign="top" align="left">Neutrophil-to-lymphocyte ratio (NLR)</td>
<td valign="top" align="left">Composite immune response marker; higher ratios indicate severity</td>
</tr>
<tr>
<td valign="top" align="left">Neutrophil percentage</td>
<td valign="top" align="left">High neutrophil count suggests bacterial superinfection and systemic inflammation</td>
</tr>
<tr>
<td valign="top" align="left">Respiratory distress</td>
<td valign="top" align="left">Direct clinical severity indicator; often precedes oxygen therapy</td>
</tr>
<tr>
<td valign="top" align="left">Lymphocyte percentage</td>
<td valign="top" align="left">Lower lymphocyte count may correlate with severity in viral or atypical infections</td>
</tr>
<tr>
<td valign="top" align="left">Platelets</td>
<td valign="top" align="left">Reflects systemic inflammation or coagulopathy in severe infections</td>
</tr>
<tr>
<td valign="top" align="left">Fever duration</td>
<td valign="top" align="left">Longer fever duration signals severe or persistent infection</td>
</tr>
<tr>
<td valign="top" align="left">Age at admission</td>
<td valign="top" align="left">Younger children may be more vulnerable to respiratory complications</td>
</tr>
<tr>
<td valign="top" align="left">Comorbidities</td>
<td valign="top" align="left">Underlying conditions increase severe outcome risk</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Feature Value Patterns: The color gradient in <xref ref-type="fig" rid="F4">Figure&#x00A0;4</xref> reveals clear directional relationships: elevated inflammatory markers (CRP, LDH), higher neutrophil counts and NLR, presence of respiratory distress, and younger age all contribute positively to oxygen therapy risk prediction. Conversely, lower values of these features are associated with reduced risk (negative SHAP values).</p>
<p>Additional predictive features identified in the top ten include lymphocyte percentage, platelet count, fever duration at home, age at admission, and presence of comorbidities, all of which demonstrated clinically meaningful contributions to the prediction models. The clinical meaning and pathophysiological significance of all identified features are provided in <xref ref-type="table" rid="T3">Table&#x00A0;3</xref>.</p>
<p>The consistency of these findings across multiple machine learning algorithms (SVM, Logistic Regression, XGBoost, LightGBM) strengthens confidence in their biological relevance and clinical utility for risk stratification in pediatric Mycoplasma pneumoniae pneumonia.</p>
</sec>
<sec id="s3h2"><label>3.8.2</label><title>Top-tier predictive features</title>
<p>C-reactive protein (CRP) emerged as the most consistently important predictor across all models. The SHAP analysis revealed that elevated CRP Z-scores above 3.0 standard deviations were strongly associated with oxygen therapy requirements. This finding aligns with clinical experience, as CRP represents a sensitive marker of systemic inflammation and tissue damage in pneumonia.</p>
<p>Lactate dehydrogenase (LDH) ranked as the second most important predictor, with elevated levels indicating tissue damage and cellular destruction associated with severe pneumonia. The combination of CRP and LDH provides complementary information about inflammatory response and tissue injury severity.</p>
<p>Neutrophil-to-lymphocyte ratio (NLR) demonstrated high predictive value, with ratios above 10 strongly associated with oxygen therapy needs. This composite marker effectively captures the balance between innate and adaptive immune responses, with higher ratios indicating more severe inflammatory states.</p>
</sec>
<sec id="s3h3"><label>3.8.3</label><title>Secondary predictive features</title>
<p>Neutrophil percentage and lymphocyte percentage provided additional discriminatory information beyond the composite NLR, suggesting that absolute values of these cell populations contribute independent predictive value.</p>
<p>Respiratory distress at admission showed strong predictive capability, serving as a direct clinical marker of respiratory compromise that often precedes formal oxygen therapy initiation.</p>
<p>Platelet count demonstrated moderate predictive importance, with both thrombocytosis and thrombocytopenia being associated with increased oxygen therapy risk through different pathophysiological mechanisms.</p>
</sec>
<sec id="s3h4"><label>3.8.4</label><title>Demographic and clinical context features</title>
<p>Age at admission showed inverse correlation with oxygen therapy requirements, with younger children demonstrating higher risk, consistent with developmental differences in respiratory reserve and immune function.</p>
<p>Comorbidities demonstrated significant predictive value, with approximately 40&#x0025; of the cohort having underlying conditions that increased oxygen therapy risk through various mechanisms including compromised cardiopulmonary reserve, altered immune responses, or baseline respiratory dysfunction.</p>
</sec>
</sec>
<sec id="s3i"><label>3.9</label><title>Model validation and clinical relevance</title>
<sec id="s3i1"><label>3.9.1</label><title>Cross-validation results</title>
<p>The stratified five-fold cross-validation approach ensured robust performance estimation across different patient subgroups. The consistency of performance metrics across validation folds for the top-performing models (coefficient of variation &#x003C; 5&#x0025; for AUC values) indicates stable predictive capability that is unlikely to be due to overfitting.</p>
</sec>
<sec id="s3i2"><label>3.9.2</label><title>Clinical threshold analysis</title>
<p>Analysis of optimal decision thresholds for clinical implementation revealed that the Support Vector Machine model achieved optimal balance between sensitivity and specificity at a probability threshold of 0.35, corresponding to sensitivity of 0.93 and specificity of 0.91. This threshold selection prioritizes detection of patients requiring oxygen therapy while maintaining acceptable false positive rates.</p>
<p>For clinical implementation, a lower threshold (0.25) could be considered to maximize sensitivity (0.98) at the cost of reduced specificity (0.82), depending on institutional preferences for aggressive monitoring vs. resource utilization concerns.</p>
</sec>
</sec>
</sec>
<sec id="s4" sec-type="discussion"><label>4</label><title>Discussion</title>
<sec id="s4a"><label>4.1</label><title>Principal findings and clinical implications</title>
<p>This study demonstrates the feasibility and clinical utility of machine learning techniques for predicting oxygen therapy requirements in pediatric Mycoplasma pneumoniae pneumonia. The developed models, particularly Support Vector Machine, Logistic Regression, and XGBoost, showed exceptional predictive performance with AUC values exceeding 0.93, suggesting effective leverage of routine admission data for identifying children at risk of respiratory deterioration.</p>
<p>The clinical implications are substantial and multifaceted. Healthcare providers can identify children at higher oxygen therapy risk by utilizing machine learning models trained on readily available admission data, enabling earlier intervention, more appropriate monitoring intensity, and efficient hospital resource allocation. The integration of SHAP analysis ensures model interpretability, addressing a critical barrier to clinical adoption of artificial intelligence tools in healthcare settings.</p>
<p>Regarding the epidemiological distribution of severity, our cohort showed a higher rate of oxygen therapy in preschool children (&#x003C;5 years, 28&#x0025;) compared to school-age children (14.5&#x0025;). While classic literature describes <italic>M. pneumoniae</italic> severity as peaking in school age, our findings reflect distinct age-dependent phenotypes supported by our clinical data: younger children presented significantly more often with acute respiratory distress (35.5&#x0025; vs. 19.1&#x0025;) and interstitial patterns, consistent with wheezing-like lower airway obstruction frequently observed in this age group, which may partly explain their higher oxygen requirement. In contrast, older children more frequently exhibited lobar consolidation (25.0&#x0025; vs. 16.7&#x0025;), a phenotype that may be clinically tolerated without hypoxia. This phenotypic heterogeneity reinforces the necessity of including &#x201C;Age&#x201D; as an interaction feature in the model.</p>
<p>The prominence of CRP in our models warrants careful interpretation. Prior meta-analyses have reported inconsistent associations between CRP levels and Mycoplasma pneumoniae severity, with some studies noting substantial heterogeneity and potential risk of bias (<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B10">10</xref>). Our findings differ in part because the outcome studied&#x2014;oxygen therapy&#x2014;reflects respiratory compromise rather than general disease severity. CRP may correlate more strongly with inflammatory burden contributing to hypoxemia, particularly in children with comorbidities, who represented a substantial proportion of our cohort. Additionally, age-adjusted normalization of laboratory values may have reduced developmental variability, allowing CRP to emerge more clearly as a discriminative feature. Nonetheless, CRP should be interpreted as part of a multivariable pattern rather than a standalone predictor.</p>
</sec>
<sec id="s4b"><label>4.2</label><title>Feature importance and pathophysiological insights</title>
<p>The consistent identification of CRP, LDH, and NLR as top predictive features across multiple models reinforces their clinical relevance and provides insights into the pathophysiology of severe Mycoplasma pneumoniae pneumonia. These biomarkers represent well-established indicators of systemic inflammation, tissue damage, and immune dysregulation, with elevated levels serving as early warning signals for respiratory deterioration.</p>
<sec id="s4b1"><label>4.2.1</label><title>Inflammatory response markers</title>
<p>The prominence of CRP and NLR in predictive models aligns with current understanding of Mycoplasma pneumoniae pathogenesis, which involves both direct cellular damage and extensive immune-mediated inflammatory responses. The organism&#x0027;s unique characteristics, including lack of a cell wall and production of various inflammatory mediators, contribute to sustained inflammatory cascades that can progress to severe respiratory compromise.</p>
<p>The particularly strong predictive value of NLR reflects the complex interplay between innate and adaptive immune responses in Mycoplasma pneumoniae infections. Elevated neutrophil counts suggest active inflammatory processes, while relative lymphopenia may indicate immune suppression or sequestration, creating an imbalance associated with disease severity.</p>
</sec>
<sec id="s4b2"><label>4.2.2</label><title>Tissue damage indicators</title>
<p>LDH elevation serves as a marker of cellular destruction and tissue damage, providing complementary information to inflammatory markers. In the context of Mycoplasma pneumoniae pneumonia, elevated LDH may reflect both direct pathogen-mediated cellular injury and secondary damage from inflammatory processes, making it a valuable predictor of oxygen therapy requirements.</p>
</sec>
<sec id="s4b3"><label>4.2.3</label><title>Clinical assessment integration</title>
<p>The inclusion of respiratory distress as a highly predictive feature validates the importance of clinical assessment alongside laboratory parameters. This finding supports integrated prediction models that combine objective biomarkers with clinical observation, providing a more comprehensive approach to risk stratification than either approach alone.</p>
</sec>
</sec>
<sec id="s4c"><label>4.3</label><title>Model performance and algorithm comparison</title>
<sec id="s4c1"><label>4.3.1</label><title>Superior performance of support vector machines</title>
<p>The exceptional performance of SVM (AUC 0.97) in this clinical prediction task reflects the algorithm&#x0027;s strength in handling complex, non-linear relationships in high-dimensional clinical data. SVM&#x0027;s ability to find optimal separating hyperplanes in transformed feature spaces appears particularly well-suited to the clinical variables and outcome patterns observed in pediatric Mycoplasma pneumoniae pneumonia.</p>
<p>The balanced precision and recall achieved by SVM (both 0.93) indicates reliable performance across both positive and negative cases, minimizing both missed diagnoses of high-risk patients and unnecessary intensive monitoring of low-risk patients.</p>
</sec>
<sec id="s4c2"><label>4.3.2</label><title>Strong linear model performance</title>
<p>The excellent performance of Logistic Regression (AUC 0.95) provides important insights into the underlying data structure and clinical relationships. The success of this linear approach suggests that the relationship between predictor variables and oxygen therapy requirements can be effectively modeled through linear combinations of predictors, which has significant implications for clinical interpretability and implementation.</p>
<p>Linear models offer several advantages for clinical deployment, including computational efficiency, direct coefficient interpretation, and easier integration into existing clinical decision support systems. The comparable performance to more complex algorithms supports the potential for simplified clinical tools that maintain high accuracy while maximizing usability.</p>
</sec>
<sec id="s4c3"><label>4.3.3</label><title>Tree-based model insights</title>
<p>The strong performance of XGBoost and LightGBM (AUC 0.94 and 0.93, respectively) demonstrates the value of ensemble methods in capturing complex interactions between clinical variables. These models can automatically identify non-linear relationships and variable interactions that may not be apparent through traditional statistical approaches.</p>
<p>The ability of tree-based models to handle missing data naturally and provide feature importance rankings makes them particularly attractive for clinical applications where data completeness may vary and clinical interpretability is essential.</p>
</sec>
<sec id="s4c4"><label>4.3.4</label><title>Deep learning limitations</title>
<p>The poor performance of TabTransformer highlights important considerations for applying deep learning approaches to clinical tabular data. The limited dataset size (206 patients) appears insufficient for training complex neural architectures that typically require thousands or tens of thousands of examples for effective learning.</p>
<p>This finding suggests that traditional machine learning approaches may be more appropriate for clinical prediction tasks with modest sample sizes, particularly in specialized pediatric populations where large datasets are challenging to assemble.</p>
</sec>
</sec>
<sec id="s4d"><label>4.4</label><title>Clinical implementation considerations</title>
<sec id="s4d1"><label>4.4.1</label><title>Point-of-care integration</title>
<p>The reliance on routine admission laboratory values and clinical assessments makes these models highly suitable for point-of-care implementation. All required predictors (CRP, CBC with differential, LDH, clinical assessment) are typically available within hours of admission, enabling early risk stratification when clinical decisions are most impactful.</p>
<p>Integration into electronic health record systems could provide automated risk scores with minimal workflow disruption, alerting clinicians to high-risk patients requiring enhanced monitoring or early intervention planning.</p>
</sec>
<sec id="s4d2"><label>4.4.2</label><title>Resource allocation and healthcare economics</title>
<p>Accurate prediction of oxygen therapy requirements has significant implications for healthcare resource allocation, particularly in settings with limited pediatric intensive care capacity. Early identification of high-risk patients enables proactive planning for respiratory support equipment, specialized nursing care, and potential transfer arrangements.</p>
<p>Conversely, reliable identification of low-risk patients could support earlier discharge planning and reduced monitoring intensity, optimizing resource utilization while maintaining patient safety.</p>
</sec>
<sec id="s4d3"><label>4.4.3</label><title>Quality improvement and standardization</title>
<p>Implementation of predictive models could support quality improvement initiatives by providing objective, standardized risk assessment across different clinicians and healthcare settings. This standardization may reduce variability in clinical decision-making and improve consistency of care delivery.</p>
</sec>
</sec>
<sec id="s4e"><label>4.5</label><title>Comparison with existing literature</title>
<sec id="s4e1"><label>4.5.1</label><title>Diagnostic vs. prognostic applications</title>
<p>While previous studies have focused primarily on diagnostic differentiation between Mycoplasma pneumoniae and other pneumonia etiologies, this study addresses the clinically important question of prognostic risk stratification within confirmed Mycoplasma pneumoniae cases. This prognostic focus provides more actionable information for clinical decision-making once the diagnosis is established.</p>
</sec>
<sec id="s4e2"><label>4.5.2</label><title>Geographic and population considerations</title>
<p>Most existing machine learning studies in pediatric Mycoplasma pneumoniae pneumonia have originated from Asian healthcare systems, potentially limiting generalizability to European and other populations. This study provides important validation of machine learning approaches in a European pediatric population, demonstrating consistent effectiveness across different healthcare contexts.</p>
<p>The observed comorbidity rates (approximately 40&#x0025;) in this European cohort are higher than reported in some Asian studies, potentially reflecting different referral patterns, healthcare system structures, or patient population characteristics. This difference underscores the importance of population-specific model development and validation.</p>
</sec>
<sec id="s4e3"><label>4.5.3</label><title>Methodological advances</title>
<p>The integration of SHAP analysis for model interpretability represents an important methodological advance over previous studies that relied primarily on feature importance rankings without detailed explanation of individual prediction rationales. This enhanced interpretability addresses a critical gap in clinical machine learning applications.</p>
</sec>
</sec>
<sec id="s4f"><label>4.6</label><title>Study limitations and methodological considerations</title>
<sec id="s4f1"><label>4.6.1</label><title>Sample size and statistical power</title>
<p>The relatively small sample size (<italic>n</italic>&#x2009;&#x003D;&#x2009;206) represents an important limitation and increases the risk of model overfitting, particularly when training complex algorithms. Although we implemented stratified 5-fold cross-validation, hyperparameter tuning, and probability calibration to mitigate this risk, the statistical power remains constrained by the number of oxygen-therapy events (<italic>n</italic>&#x2009;&#x003D;&#x2009;42). Small datasets can yield overly optimistic performance estimates even when rigorous internal validation is applied. Future work should include larger multicenter cohorts, external validation across independent hospitals, and prospective data collection to ensure model stability and generalizability.</p>
<p>However, the exceptional performance of several algorithms suggests that the dataset size was sufficient for developing clinically useful predictive models, particularly given the relatively high event rate (20.4&#x0025; requiring oxygen therapy) that provides adequate positive cases for model training.</p>
</sec>
<sec id="s4f2"><label>4.6.2</label><title>Retrospective design and selection bias</title>
<p>The retrospective design introduces potential limitations related to data completeness and quality. While systematic data collection protocols were implemented, some variables had missing values that required imputation. The impact of missing data was minimized through careful selection of variables with high completion rates and appropriate imputation strategies.</p>
<p>Selection bias may have occurred through the multicenter hospital-based recruitment, potentially enriching the cohort for more severe cases compared to community presentations. This bias may actually enhance the clinical utility of the models by focusing on the hospitalized population where oxygen therapy decisions are most relevant.</p>
</sec>
<sec id="s4f3"><label>4.6.3</label><title>External validity and generalizability</title>
<p>The study was conducted in Italian pediatric hospitals, potentially limiting generalizability to other healthcare systems with different patient populations, clinical practices, or resource availability. External validation in diverse healthcare settings will be essential for confirming model performance and clinical utility.</p>
<p>The relatively high comorbidity rate in this cohort may limit generalizability to healthier pediatric populations, although this characteristic may actually enhance the models&#x0027; applicability to the hospitalized patients most likely to require oxygen therapy.</p>
<p>Several factors may limit the direct generalization of our model to other clinical settings. First, laboratory assays for key biomarkers such as CRP and LDH vary across hospitals in terms of analytical platforms, reference ranges, and calibration standards. These inter-laboratory differences may influence absolute value distributions and would likely require local model re-calibration before deployment. Second, seamless integration into electronic health record (EHR) systems remains a practical barrier. The variables used in our model are routinely collected, but their extraction depends on heterogeneous database architectures, coding practices, and data-entry workflows across institutions. Third, the model assumes timely availability of laboratory results within the first hours of admission. In settings where laboratory turnaround times are longer or where certain tests are not routinely performed at presentation, real-time prediction may not be feasible. These considerations highlight the need for prospective validation and local adaptation before widespread clinical implementation.</p>
</sec>
<sec id="s4f4"><label>4.6.4</label><title>Age-related immunological heterogeneity</title>
<p>Another limitation is the lack of explicit modeling of age-related immunological heterogeneity. Immune system maturation varies substantially across infancy, early childhood, and adolescence, influencing inflammatory marker distributions and clinical presentation. Although age was included as a predictor and laboratory values were standardized using age-adjusted <italic>Z</italic>-scores, we did not stratify model development by age groups or incorporate interaction terms that capture developmental immunological differences. Future studies with larger cohorts should evaluate age-specific models or hierarchical frameworks to better characterize developmental variation in host response to Mycoplasma pneumoniae infection.</p>
</sec>
<sec id="s4f5"><label>4.6.5</label><title>Outcome definition and clinical variability</title>
<p>The definition of oxygen therapy requirement, while based on established clinical guidelines, may be subject to inter-physician variability and institutional practice differences. This variability could introduce noise into the outcome variable, potentially affecting model performance and generalizability.</p>
<p>However, the strong predictive performance suggests that the models successfully captured the underlying clinical patterns associated with respiratory compromise, despite potential variations in clinical decision-making.</p>
<p>The use of oxygen therapy as the primary outcome also presents important limitations. Oxygen supplementation is influenced not only by objective measures of hypoxemia but also by clinician judgment, institutional protocols, and resource availability, introducing variability into the endpoint. Moreover, hypoxia in pediatric patients may arise from mechanisms unrelated to Mycoplasma pneumoniae&#x2013;associated impairment of gas exchange, including metabolic disturbances or increased oxygen consumption. Despite these constraints, oxygen therapy remains a clinically meaningful and routinely documented escalation-of-care marker. Future studies should incorporate more objective physiological endpoints&#x2014;such as continuous SpO&#x2082; trajectories, ROX index, or arterial blood gas parameters&#x2014;and evaluate composite severity outcomes to reduce subjectivity.</p>
</sec>
<sec id="s4f6"><label>4.6.6</label><title>External validation and data sharing challenges</title>
<p>The inability to perform external validation on public datasets represents an important limitation that highlights broader challenges in pediatric clinical machine learning research. Despite extensive efforts to identify suitable validation cohorts, several systemic barriers prevented external validation:</p>
<p>Regulatory and Privacy Barriers: Stringent pediatric data protection regulations (GDPR in Europe, HIPAA in North America) appropriately restrict public sharing of pediatric clinical data, but inadvertently limit validation opportunities for researchers.</p>
<p>Data Standardization Gaps: Lack of standardized variable definitions, laboratory reference ranges, and outcome classifications across institutions creates compatibility challenges even when datasets are theoretically available.</p>
<p>Etiologic Specificity: Most publicly available pneumonia datasets do not provide pathogen-specific subgroups, making validation of Mycoplasma pneumoniae-specific models impossible.</p>
<p>Recommendations for the Field:
<list list-type="order">
<list-item>
<p>Federated learning approaches: Development of privacy-preserving federated learning frameworks that allow model validation across institutions without data sharing</p></list-item>
<list-item>
<p>Data sharing consortia: Establishment of pediatric respiratory infection data-sharing networks with standardized variable definitions</p></list-item>
<list-item>
<p>Synthetic data generation: Development of validated synthetic pediatric datasets for algorithm testing while preserving privacy</p></list-item>
<list-item>
<p>Pre-registration and validation plans: Prospective registration of prediction models with planned validation sites before data collection</p></list-item>
</list>Our compensatory validation approaches (extensive bootstrap validation) provide substantial evidence for model robustness within our geographic and healthcare context. However, we strongly advocate for the development of international validation networks to enable more rigorous evaluation of pediatric clinical prediction models.</p>
<p>Future Validation Plans: We are actively establishing collaborations with other pediatric hospitals to conduct prospective external validation during the 2025&#x2013;2026 respiratory season, with results expected by early 2027.</p>
</sec>
</sec>
<sec id="s4g"><label>4.7</label><title>Future research directions and development priorities</title>
<sec id="s4g1"><label>4.7.1</label><title>Multicenter external validation</title>
<p>The highest priority for future research should be multicenter external validation across diverse healthcare settings, including different countries, healthcare systems, and patient populations. Such validation studies should assess not only predictive performance but also clinical utility and implementation feasibility.</p>
<p>Prospective validation studies would provide the strongest evidence for clinical effectiveness and should include assessment of clinical decision-making impact, resource utilization changes, and patient outcome improvements.</p>
</sec>
<sec id="s4g2"><label>4.7.2</label><title>Temporal modeling and dynamic prediction</title>
<p>Current models utilize admission data for static prediction of oxygen therapy requirements throughout hospitalization. Future research should explore dynamic prediction models that incorporate temporal changes in clinical status, laboratory values, and response to initial treatments.</p>
<p>Time-series modeling approaches could provide updated risk estimates as new clinical information becomes available, enabling more responsive clinical decision support and adaptation to changing patient conditions.</p>
</sec>
<sec id="s4g3"><label>4.7.3</label><title>Integration of advanced biomarkers</title>
<p>While this study focused on readily available clinical variables, future research could explore integration of advanced biomarkers, genetic markers, or novel diagnostic tests that may enhance predictive accuracy.</p>
<p>Biomarkers of specific pathophysiological pathways involved in Mycoplasma pneumoniae pathogenesis, such as cytokine profiles or complement activation markers, could provide mechanistic insights and improved risk stratification.</p>
</sec>
<sec id="s4g4"><label>4.7.4</label><title>Imaging integration and radiomics</title>
<p>Integration of quantitative imaging analysis through radiomic approaches could enhance model performance while providing insights into pathophysiological processes. High-resolution computed tomography features may capture subtle parenchymal changes not apparent on routine chest radiography.</p>
<p>However, such integration must balance improved accuracy against increased cost, radiation exposure, and accessibility constraints in pediatric populations.</p>
</sec>
<sec id="s4g5"><label>4.7.5</label><title>Clinical decision support system development</title>
<p>Translation of research models into functional clinical decision support systems requires substantial additional development work, including user interface design, workflow integration, and clinical validation. Future research should address implementation science questions regarding optimal clinical integration strategies.</p>
<p>Real-time clinical decision support tools should provide actionable recommendations with appropriate uncertainty quantification and clear explanations of contributing factors.</p>
</sec>
</sec>
<sec id="s4h"><label>4.8</label><title>Future digital implementation and clinical integration</title>
<sec id="s4h1"><label>4.8.1</label><title>Electronic health record integration architecture</title>
<p>The proposed prediction model framework has been designed for seamless integration with modern Electronic Health Record (EHR) systems using industry-standard interoperability protocols. Implementation follows a three-layer architecture that separates data extraction, risk computation, and clinical presentation.</p>
<p>Data Integration Layer: Real-time data extraction utilizes Health Level 7 Fast Healthcare Interoperability Resources (HL7 FHIR) standards, ensuring compatibility with diverse EHR platforms including Epic, Cerner, and Allscripts systems. Laboratory results, vital signs, and clinical documentation flow automatically into the prediction pipeline without requiring manual data entry, preserving clinical workflow efficiency.</p>
<p>The system monitors for completion of the required laboratory panel (complete blood count, CRP, LDH), typically available within 2&#x2013;4&#x2005;h of admission. Once the minimum required features become available, risk calculation occurs automatically in the background, with results available to clinicians within seconds of data availability.</p>
<p>Computation Layer: The prediction model will operate on a secure server infrastructure meeting healthcare data security requirements including HIPAA compliance and GDPR data protection standards. Model inference requires minimal computational resources (&#x003C;100&#x2005;ms per patient), enabling real-time risk scoring even during high-volume admission periods.</p>
<p>Version control and model updating capabilities will ensure that improved model iterations can be deployed systematically while maintaining audit trails of prediction provenance. This architecture will support prospective validation studies and continuous quality monitoring of prediction accuracy.</p>
<p>Presentation Layer: Clinical decision support interfaces will integrate directly into existing EHR workflows through embedded widgets or standalone dashboards. Clinicians view risk scores alongside routine laboratory results without navigating away from their standard workspace, minimizing workflow disruption and cognitive burden.</p>
</sec>
<sec id="s4h2"><label>4.8.2</label><title>Clinical decision support interface design</title>
<p>The clinical interface will be designed following human-centered design principles and incorporates feedback from pediatric hospitalists, intensivists, and bedside nurses.</p>
<p>Risk Communication Strategy: Rather than presenting raw probability scores, the interface employs a three-tier color-coded alert system that aligns with existing clinical warning systems:</p>
<p>Green (Low Risk): &#x003C;20&#x0025; probability
<list list-type="bullet">
<list-item>
<p>Standard monitoring protocols</p></list-item>
<list-item>
<p>Routine vital signs assessment every 4&#x2013;6&#x2005;h</p></list-item>
<list-item>
<p>No additional respiratory assessment required</p></list-item>
<list-item>
<p>Typical discharge planning trajectory</p></list-item>
</list>Yellow (Moderate Risk): 20&#x0025;&#x2013;40&#x0025; probability
<list list-type="bullet">
<list-item>
<p>Enhanced respiratory monitoring</p></list-item>
<list-item>
<p>Vital signs assessment every 2&#x2013;4&#x2005;h</p></list-item>
<list-item>
<p>Early involvement of respiratory therapy for assessment</p></list-item>
<list-item>
<p>Delay discharge planning until trend clarification</p></list-item>
</list>Red (High Risk): &#x003E;40&#x0025; probability
<list list-type="bullet">
<list-item>
<p>Intensive monitoring protocols</p></list-item>
<list-item>
<p>Continuous pulse oximetry consideration</p></list-item>
<list-item>
<p>Respiratory therapy consultation within 2&#x2005;h</p></list-item>
<list-item>
<p>Early discussion with intensive care team</p></list-item>
<list-item>
<p>Proactive planning for potential oxygen therapy needs</p></list-item>
</list>Override and Documentation: Clinicians will be able to maintain complete autonomy to override model recommendations with documented rationale. Override patterns are tracked for quality improvement and model recalibration purposes. Common override reasons might include:
<list list-type="bullet">
<list-item>
<p>&#x201C;Clinical improvement since laboratory draw&#x201D;</p></list-item>
<list-item>
<p>&#x201C;Extenuating social factors requiring admission&#x201D;</p></list-item>
<list-item>
<p>&#x201C;Alternative diagnosis now suspected&#x201D;</p></list-item>
</list></p>
</sec>
</sec>
<sec id="s4i"><label>4.9</label><title>Ethical and equity considerations</title>
<sec id="s4i1"><label>4.9.1</label><title>Algorithmic fairness and bias assessment</title>
<p>Future implementation must include comprehensive assessment of model performance across different demographic groups, including age, sex, ethnicity, and socioeconomic status. Ensuring equitable performance is essential for avoiding unintended disparities in clinical care.</p>
<p>Bias assessment should extend beyond demographic factors to include clinical characteristics such as comorbidity patterns, disease severity, and healthcare access factors that may influence both predictor variables and outcomes.</p>
</sec>
<sec id="s4i2"><label>4.9.2</label><title>Clinical autonomy and human oversight</title>
<p>Implementation of predictive models must preserve appropriate clinical autonomy and judgment while providing decision support. Models should enhance rather than replace clinical reasoning, with clear mechanisms for clinical override when circumstances warrant alternative approaches.</p>
<p>Training and education programs will be essential for ensuring appropriate interpretation and utilization of model outputs by clinical teams.</p>
</sec>
<sec id="s4i3"><label>4.9.3</label><title>Privacy and data security</title>
<p>Clinical implementation requires robust data security measures and privacy protections, particularly for pediatric populations. Compliance with applicable regulations and institutional policies must be maintained throughout model development and deployment phases.</p>
</sec>
</sec>
</sec>
<sec id="s5" sec-type="conclusions"><label>5</label><title>Conclusions</title>
<sec id="s5a"><label>5.1</label><title>Summary of key findings</title>
<p>This multicenter retrospective study demonstrates that machine learning models utilizing routine admission data can accurately predict oxygen therapy requirements in pediatric Mycoplasma pneumoniae pneumonia. Support Vector Machine achieved exceptional performance (AUC 0.97), while Logistic Regression, XGBoost, and LightGBM also demonstrated strong predictive capabilities with AUC values exceeding 0.93.</p>
<p>The study identified key predictive features that align with established clinical indicators of disease severity, including C-reactive protein, lactate dehydrogenase, neutrophil-to-lymphocyte ratio, and clinical assessment of respiratory distress. The integration of SHAP analysis provided crucial interpretability, ensuring clinical transparency and supporting potential adoption in pediatric care settings.</p>
</sec>
<sec id="s5b"><label>5.2</label><title>Clinical impact and significance</title>
<p>These findings support the potential for data-driven approaches to enhance risk stratification and clinical decision-making in pediatric respiratory infections. Early identification of children at risk for oxygen therapy could enable proactive clinical interventions, optimize resource allocation, and improve patient outcomes through timely escalation of care.</p>
<p>The reliance on readily available clinical and laboratory data makes these models highly suitable for implementation across diverse healthcare settings without requiring specialized testing or additional resource investments.</p>
</sec>
<sec id="s5c"><label>5.3</label><title>Scientific contribution</title>
<p>This study addresses an important gap in the literature by focusing on prognostic prediction within confirmed Mycoplasma pneumoniae pneumonia cases rather than diagnostic differentiation. The integration of interpretable machine learning approaches with comprehensive clinical data provides a template for future research in pediatric infectious diseases.</p>
<p>The validation of these approaches in a European pediatric population extends the generalizability of machine learning methods beyond the primarily Asian cohorts studied previously, supporting broader international applicability.</p>
</sec>
<sec id="s5d"><label>5.4</label><title>Implementation pathway</title>
<p>Future work addressing multicenter validation, prospective implementation studies, and comprehensive bias assessment will be essential for translating these research findings into routine clinical practice. The development of user-friendly clinical decision support tools with appropriate safeguards and oversight mechanisms represents the next critical phase of this research program.</p>
<p>Success in clinical implementation will require close collaboration between data scientists, clinical teams, healthcare informaticists, and quality improvement specialists to ensure that technological capabilities align with clinical needs and workflow realities.</p>
</sec>
<sec id="s5e"><label>5.5</label><title>Broader implications for pediatric care</title>
<p>The success of these predictive models in Mycoplasma pneumoniae pneumonia suggests broader applicability to other pediatric infectious diseases and clinical conditions. The methodological framework developed here could serve as a template for predictive modeling in other clinical contexts where early risk stratification is crucial for optimal patient management.</p>
<p>The integration of machine learning into pediatric healthcare represents an important evolution in clinical practice, offering the potential for more precise, personalized, and proactive patient care while maintaining the essential human elements of clinical judgment and compassionate care delivery.</p>
</sec>
</sec>
</body>
<back>
<sec id="s8" sec-type="data-availability"><title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s9" sec-type="ethics-statement"><title>Ethics statement</title>
<p>The studies involving humans were approved by Local Ethics Committee Palermo 2, AOR Villa Sofia Cervello, Via Trabucco, 180, 90146 Palermo, Italy. The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation was obtained from the participants or the participants&#x0027; legal guardians/next of kin in accordance with the national legislation and institutional requirements.</p>
</sec>
<sec id="s10" sec-type="author-contributions"><title>Author contributions</title>
<p>CC: Conceptualization, Data curation, Investigation, Methodology, Project administration, Resources, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing, Validation, Visualization, Software. JA: Data curation, Investigation, Methodology, Software, Validation, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. MR: Visualization, Writing &#x2013; review &#x0026; editing. MLS: Writing &#x2013; review &#x0026; editing, Visualization. MRL: Writing &#x2013; review &#x0026; editing, Visualization. SL: Supervision, Validation, Visualization, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec id="s11"><title>PneumoML study group</title>
<p>Department of Clinical and Experimental Medicine, University of Catania, Catania, Italy: Giuseppe Fabio Parisi. Postgraduate Training Program in Pediatrics, University of Palermo, Palermo, Italy: Giacoma Maria Pisciotta. Unit of Nursing and Midwifery Professions - Hospital Sector, ASP Trapani, Trapani, Italy: Stefania Ruggirello. Unit of Pediatrics, Sant&#x0027;Antonio Abate Hospital, Trapani, Italy: Veronica Vanella.</p>
</sec>
<ack><title>Acknowledgments</title>
<p>We acknowledge the invaluable contributions of the clinical teams at all participating hospitals for their dedication to patient care and meticulous data collection efforts throughout this study period. We extend particular gratitude to the pediatric residents, nursing staff, and laboratory personnel who ensured comprehensive and accurate clinical documentation. We thank the information technology departments at each institution for facilitating secure data extraction, management, and analysis while maintaining strict compliance with privacy regulations and institutional policies. Their technical expertise and commitment to data security were essential for successful study completion. We acknowledge the biostatistics and data management support provided by our institutional research centers, particularly for guidance on advanced machine learning techniques and model validation approaches. This study was conducted using pseudonymized clinical data collected during routine patient care, with all analyses performed in accordance with established ethical guidelines and institutional review board approvals.</p>
</ack>
<sec id="s13" sec-type="COI-statement"><title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s14" sec-type="ai-statement"><title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec id="s15" sec-type="disclaimer"><title>Publisher&#x0027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s16" sec-type="supplementary-material"><title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fdgth.2026.1755878/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fdgth.2026.1755878/full&#x0023;supplementary-material</ext-link></p>
<supplementary-material xlink:href="Datasheet1.pdf" id="SM1" mimetype="application/pdf"/>
<supplementary-material xlink:href="Table1.pdf" id="SM2" mimetype="application/pdf"/>
</sec>
<ref-list><title>References</title>
<ref id="B1"><label>1.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Xie</surname> <given-names>S</given-names></name> <name><surname>Zhang</surname> <given-names>Y</given-names></name> <name><surname>Wang</surname> <given-names>L</given-names></name> <name><surname>Chen</surname> <given-names>H</given-names></name> <name><surname>Liu</surname> <given-names>X</given-names></name> <name><surname>Wang</surname> <given-names>Y</given-names></name><etal/></person-group> <article-title>Development and validation of an early diagnosis model for severe mycoplasma pneumonia in children based on interpretable machine learning</article-title>. <source>Respir Res</source>. (<year>2025</year>) <volume>26</volume>:<fpage>182</fpage>. <pub-id pub-id-type="doi">10.1186/s12931-025-03262-1</pub-id><pub-id pub-id-type="pmid">40361124</pub-id></mixed-citation></ref>
<ref id="B2"><label>2.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Peng</surname> <given-names>X</given-names></name> <name><surname>Li</surname> <given-names>M</given-names></name> <name><surname>Zhang</surname> <given-names>Q</given-names></name> <name><surname>Wang</surname> <given-names>H</given-names></name> <name><surname>Chen</surname> <given-names>L</given-names></name> <name><surname>Liu</surname> <given-names>Y</given-names></name><etal/></person-group> <article-title>A preliminary prediction model of pediatric Mycoplasma pneumoniae pneumonia based on routine blood parameters by using machine learning method</article-title>. <source>BMC Infect Dis</source>. (<year>2024</year>) <volume>24</volume>:<fpage>707</fpage>. <pub-id pub-id-type="doi">10.1186/s12879-024-09613-5</pub-id><pub-id pub-id-type="pmid">39026207</pub-id></mixed-citation></ref>
<ref id="B3"><label>3.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Napolitano</surname> <given-names>N</given-names></name> <name><surname>Berlinski</surname> <given-names>A</given-names></name> <name><surname>Walsh</surname> <given-names>BK</given-names></name> <name><surname>Ginier</surname> <given-names>E</given-names></name> <name><surname>Strickland</surname> <given-names>SL</given-names></name></person-group>. <article-title>AARC Clinical practice guideline: management of pediatric patients with oxygen in the acute care setting</article-title>. <source>Respir Care</source>. (<year>2021</year>) <volume>66</volume>:<fpage>1214</fpage>&#x2013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.4187/respcare.09006</pub-id><pub-id pub-id-type="pmid">33790048</pub-id></mixed-citation></ref>
<ref id="B4"><label>4.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tosif</surname> <given-names>S</given-names></name> <name><surname>Duke</surname> <given-names>T</given-names></name></person-group>. <article-title>Evidence to support oxygen guidelines for children with emergency signs in developing countries: a systematic review and physiological and mechanistic analysis</article-title>. <source>J Trop Pediatr</source>. (<year>2017</year>) <volume>63</volume>:<fpage>402</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1093/tropej/fmw100</pub-id><pub-id pub-id-type="pmid">28158795</pub-id></mixed-citation></ref>
<ref id="B5"><label>5.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Serin</surname> <given-names>O</given-names></name> <name><surname>Johnson</surname> <given-names>M</given-names></name> <name><surname>Patterson</surname> <given-names>K</given-names></name> <name><surname>Williams</surname> <given-names>R</given-names></name> <name><surname>Davis</surname> <given-names>L</given-names></name> <name><surname>Thompson</surname> <given-names>S</given-names></name><etal/></person-group> <article-title>Predicting escalation of care for childhood pneumonia using machine learning: retrospective analysis and model development</article-title>. <source>JMIRX Med</source>. (<year>2025</year>) <volume>6</volume>:<fpage>e57719</fpage>. <pub-id pub-id-type="doi">10.2196/57719</pub-id><pub-id pub-id-type="pmid">40036666</pub-id></mixed-citation></ref>
<ref id="B6"><label>6.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Collins</surname> <given-names>GS</given-names></name> <name><surname>Moons</surname> <given-names>KGM</given-names></name> <name><surname>Dhiman</surname> <given-names>P</given-names></name> <name><surname>Riley</surname> <given-names>RD</given-names></name> <name><surname>Beam</surname> <given-names>AL</given-names></name> <name><surname>Van Calster</surname> <given-names>B</given-names></name><etal/></person-group> <article-title>TRIPOD&#x002B;AI statement: updated guidance for reporting clinical prediction models that use regression or machine learning methods</article-title>. <source>Br Med J</source>. (<year>2024</year>) <volume>385</volume>:<fpage>e078378</fpage>. <pub-id pub-id-type="doi">10.1136/bmj-2023-078378</pub-id></mixed-citation></ref>
<ref id="B7"><label>7.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Pourakbari</surname> <given-names>B</given-names></name> <name><surname>Mamishi</surname> <given-names>S</given-names></name> <name><surname>Bosaghzadeh</surname> <given-names>Z</given-names></name> <name><surname>Jafari</surname> <given-names>SA</given-names></name> <name><surname>Rezaei</surname> <given-names>MS</given-names></name> <name><surname>Mahmoudi</surname> <given-names>S</given-names></name><etal/></person-group> <article-title>Predicting COVID-19 severity in pediatric patients using machine learning: a comparative analysis of algorithms and ensemble methods</article-title>. <source>Sci Rep</source>. (<year>2025</year>) <volume>15</volume>:<fpage>29118</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-025-15366-1</pub-id><pub-id pub-id-type="pmid">40781476</pub-id></mixed-citation></ref>
<ref id="B8"><label>8.</label><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>X</given-names></name> <name><surname>Khetan</surname> <given-names>A</given-names></name> <name><surname>Cvitkovic</surname> <given-names>M</given-names></name> <name><surname>Karnin</surname> <given-names>Z.</given-names></name></person-group> <comment>TabTransformer: Tabular Data Modeling Using Contextual Embeddings. arXiv preprint. (2020). Available online at</comment>: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/2012.06678">https://arxiv.org/abs/2012.06678</ext-link> <comment>(Accessed November 20, 2025).</comment></mixed-citation></ref>
<ref id="B9"><label>9.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>YANG</surname> <given-names>S</given-names></name> <name><surname>LIU</surname> <given-names>X</given-names></name> <name><surname>WANG</surname> <given-names>H</given-names></name> <name><surname>LI</surname> <given-names>H</given-names></name> <name><surname>LI</surname> <given-names>X</given-names></name></person-group>. <article-title>Risk factors for severe Mycoplasma Pneumoniae pneumonia in children: a meta-analysis</article-title>. <source>Chinese Gen Pract</source>. (<year>2024</year>) <volume>27</volume>(<issue>14</issue>):<fpage>1750</fpage>. <pub-id pub-id-type="doi">10.12114/j.issn.1007-9572.2023.0737</pub-id></mixed-citation></ref>
<ref id="B10"><label>10.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jiang</surname> <given-names>Y</given-names></name> <name><surname>Wang</surname> <given-names>X</given-names></name> <name><surname>Li</surname> <given-names>L</given-names></name> <name><surname>Wang</surname> <given-names>Y</given-names></name> <name><surname>Wang</surname> <given-names>X</given-names></name> <name><surname>Zou</surname> <given-names>Y</given-names></name></person-group>. <article-title>Predicting and interpreting key features of refractory Mycoplasma pneumoniae pneumonia using multiple machine learning methods</article-title>. <source>Sci Rep</source>. (<year>2025</year>) <volume>15</volume>(<issue>1</issue>):<fpage>18029</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-025-02962-4</pub-id><pub-id pub-id-type="pmid">40410245</pub-id></mixed-citation></ref>
<ref id="B11"><label>11.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Don&#x00E0;</surname> <given-names>D</given-names></name> <name><surname>Brigadoi</surname> <given-names>G</given-names></name> <name><surname>Grandinetti</surname> <given-names>R</given-names></name> <name><surname>Pedretti</surname> <given-names>L</given-names></name> <name><surname>Boscarino</surname> <given-names>G</given-names></name> <name><surname>Barbieri</surname> <given-names>E</given-names></name><etal/></person-group> <article-title>Treatment of mild to moderate community-acquired pneumonia in previously healthy children: an Italian intersociety consensus (SIPPS-SIP-SITIP-FIMP-SIAIP-SIMRI-FIMMG-SIMG)</article-title>. <source>Ital J Pediatr</source>. (<year>2024</year>) <volume>50</volume>(<issue>1</issue>):<fpage>217</fpage>. <pub-id pub-id-type="doi">10.1186/s13052-024-01786-8</pub-id></mixed-citation></ref>
<ref id="B12"><label>12.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Harris</surname> <given-names>M</given-names></name> <name><surname>Clark</surname> <given-names>J</given-names></name> <name><surname>Coote</surname> <given-names>N</given-names></name> <name><surname>Fletcher</surname> <given-names>P</given-names></name> <name><surname>Harnden</surname> <given-names>A</given-names></name> <name><surname>McKean</surname> <given-names>M</given-names></name><etal/></person-group> <article-title>British Thoracic society guidelines for the management of community acquired pneumonia in children: update 2011</article-title>. <source>Thorax</source>. (<year>2011</year>) <volume>66</volume>(<issue>Suppl 2</issue>):<fpage>ii1</fpage>&#x2013;<lpage>ii23</lpage>. <pub-id pub-id-type="doi">10.1136/thoraxjnl-2011-200598</pub-id><pub-id pub-id-type="pmid">21903691</pub-id></mixed-citation></ref></ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by"><p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/816954/overview">Vangelis Sakkalis</ext-link>, Foundation for Research and Technology Hellas (FORTH), Greece</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by"><p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/919183/overview">Georgios Tzedakis</ext-link>, Foundation for Research and Technology (FORTH), Greece</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1554839/overview">Wanjun Liu</ext-link>, Second Hospital of Anhui Medical University, China</p></fn>
</fn-group>
</back>
</article>