<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIRx Med</journal-id><journal-id journal-id-type="publisher-id">xmed</journal-id><journal-id journal-id-type="index">34</journal-id><journal-title>JMIRx Med</journal-title><abbrev-journal-title>JMIRx Med</abbrev-journal-title><issn pub-type="epub">2563-6316</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v6i1e57719</article-id><article-id pub-id-type="doi">10.2196/57719</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Predicting Escalation of Care for Childhood Pneumonia Using Machine Learning: Retrospective Analysis and Model Development</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Serin</surname><given-names>Oguzhan</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Akbasli</surname><given-names>Izzet Turkalp</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Cetin</surname><given-names>Sena Bocutcu</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Koseoglu</surname><given-names>Busra</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Deveci</surname><given-names>Ahmet Fatih</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ugur</surname><given-names>Muhsin Zahid</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ozsurekci</surname><given-names>Yasemin</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Pediatrics, Hacettepe University Medical School</institution><addr-line>Gevher Nesibe Avenue, Altindag</addr-line><addr-line>Ankara</addr-line><country>Turkey</country></aff><aff id="aff2"><institution>Department of Health Information Systems, University of Health Sciences</institution><addr-line>Istanbul</addr-line><country>Turkey</country></aff><aff id="aff3"><institution>Department of Pediatric Infectious Diseases, Hacettepe University Medical School</institution><addr-line>Ankara</addr-line><country>Turkey</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Amal</surname><given-names>Saeed</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Anonymous</surname><given-names/></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Rogerson</surname><given-names>Colin</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Izzet Turkalp Akbasli, MD, Department of Pediatrics, Hacettepe University Medical School, Gevher Nesibe Avenue, Altindag, Ankara, 06230, Turkey, 90 3051350; <email>izzetakbasli@gmail.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>4</day><month>3</month><year>2025</year></pub-date><volume>6</volume><elocation-id>e57719</elocation-id><history><date date-type="received"><day>24</day><month>02</month><year>2024</year></date><date date-type="rev-recd"><day>19</day><month>12</month><year>2024</year></date><date date-type="accepted"><day>08</day><month>01</month><year>2025</year></date></history><copyright-statement>&#x00A9; Oguzhan Serin, Izzet Turkalp Akbasli, Sena Bocutcu Cetin, Busra Koseoglu, Ahmet Fatih Deveci, Muhsin Zahid Ugur, Yasemin Ozsurekci. Originally published in JMIRx Med (<ext-link ext-link-type="uri" xlink:href="https://med.jmirx.org">https://med.jmirx.org</ext-link>), 4.3.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIRx Med, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://med.jmirx.org/">https://med.jmirx.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://xmed.jmir.org/2025/1/e57719"/><related-article related-article-type="companion" ext-link-type="doi" xlink:href="10.1101/2024.02.22.24303209" xlink:title="Preprint (medRxiv)" xlink:type="simple">https://www.medrxiv.org/content/10.1101/2024.02.22.24303209v1</related-article><related-article related-article-type="companion" ext-link-type="doi" xlink:href="10.2196/71100" xlink:title="Peer-Review Report by Colin Rogerson (Reviewer E)" xlink:type="simple">https://med.jmirx.org/2025/1/e71100</related-article><related-article related-article-type="companion" ext-link-type="doi" xlink:href="10.2196/71369" xlink:title="Peer-Review Report by Anonymous" xlink:type="simple">https://med.jmirx.org/2025/1/e71369</related-article><related-article related-article-type="companion" ext-link-type="doi" xlink:href="10.2196/71098" xlink:title="Authors' Response to Peer-Review Reports" xlink:type="simple">https://med.jmirx.org/2025/1/e71098</related-article><abstract><sec><title>Background</title><p>Pneumonia is a leading cause of mortality in children aged &#x003C;5 years. While machine learning (ML) has been applied to pneumonia diagnostics, few studies have focused on predicting the need for escalation of care in pediatric cases. This study aims to develop an ML-based clinical decision support tool for predicting the need for escalation of care in community-acquired pneumonia cases.</p></sec><sec><title>Objective</title><p>The primary objective was to develop a robust predictive tool to help primary care physicians determine where and how a case should be managed.</p></sec><sec sec-type="methods"><title>Methods</title><p>Data from 437 children with community-acquired pneumonia, collected before the COVID-19 pandemic, were retrospectively analyzed. Pediatricians encoded key clinical features from unstructured medical records based on Integrated Management of Childhood Illness guidelines. After preprocessing with Synthetic Minority Oversampling Technique&#x2013;Tomek to handle imbalanced data, feature selection was performed using Shapley additive explanations values. The model was optimized through hyperparameter tuning and ensembling. The primary outcome was the level of care severity, defined as the need for referral to a tertiary care unit for intensive care or respiratory support.</p></sec><sec sec-type="results"><title>Results</title><p>A total of 437 cases were analyzed, and the optimized models predicted the need for transfer to a higher level of care with an accuracy of 77% to 88%, achieving an area under the receiver operator characteristic curve of 0.88 and an area under the precision-recall curve of 0.96. Shapley additive explanations value analysis identified hypoxia, respiratory distress, age, weight-for-age <italic>z</italic> score, and complaint duration as the most important clinical predictors independent of laboratory diagnostics.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study demonstrates the feasibility of applying ML techniques to create a prognostic care decision tool for childhood pneumonia. It provides early identification of cases requiring escalation of care by combining foundational clinical skills with data science methods.</p></sec></abstract><kwd-group><kwd>childhood pneumonia</kwd><kwd>community-acquired pneumonia</kwd><kwd>machine learning</kwd><kwd>clinical decision support system</kwd><kwd>prognostic care decision</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Pneumonia is responsible for 14% of all mortality in children aged &#x003C;5 years and is included in World Health Organization (WHO) reports as the cause of death in 740,180 children in 2019 alone [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. The Global Action Plan for the Prevention and Control of Pneumonia and Diarrhea, which was released by the WHO and UNICEF, aimed to reduce the mortality rate from pneumonia and diarrhea in children aged &#x003C;5 years [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. They have set targets that include vaccination, water and air sanitation, exclusively breastfeeding in the first 6 months, and eliminating pediatric HIV cases, along with appropriate pneumonia and diarrhea care.</p><p>It has been demonstrated that timely and accurate diagnosis of pneumonia and appropriately initiated treatment reduce mortality by up to 28% [<xref ref-type="bibr" rid="ref4">4</xref>]. Diagnosis can often be difficult, since the clinical presentation of pneumonia in children is variable [<xref ref-type="bibr" rid="ref5">5</xref>]. For this reason, the WHO has published the Integrated Management of Childhood Illness (IMCI) guidelines, which guide physicians in diagnosing, treating, and identifying danger signs of pneumonia [<xref ref-type="bibr" rid="ref6">6</xref>]. While some cases of pneumonia are treatable with appropriate interventions, even low-cost or low-tech options [<xref ref-type="bibr" rid="ref1">1</xref>], pneumonia remains a leading cause of morbidity and mortality, particularly in resource-limited countries and regions [<xref ref-type="bibr" rid="ref2">2</xref>]. Managing high-risk populations continues to present significant challenges, especially in intensive care settings where patients often require advanced respiratory support. In addition, it has been shown that families seeking health services in resource-limited settings causes delays in providing appropriate treatment, leading to disease progression [<xref ref-type="bibr" rid="ref7">7</xref>]. These highlight the need to improve medical care decisions, particularly in regions with limited resources, to reduce pneumonia-related morbidity and mortality.</p><p>Early and accurate recognition of patients who may require escalation of care to tertiary facilities is essential, particularly for those who will require mechanical ventilation or advanced respiratory support [<xref ref-type="bibr" rid="ref8">8</xref>]. Predicting which patients will deteriorate is challenging due to the heterogeneous presentation of pneumonia, and clinical features such as hypoxia, respiratory distress, nutritional status, and comorbidities are critical markers that necessitate closer monitoring or transfer [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Prolonged duration of illness and failure to respond to initial treatments are also important as they may indicate inadequate treatment, misdiagnosis, or incorrect identification of potential pathogens, which can lead to the escalation of care [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref11">11</xref>].</p><p>Data science can provide actionable evidence for effective clinical intervention in pediatric diseases in the future [<xref ref-type="bibr" rid="ref12">12</xref>] and can reduce inequality in health care [<xref ref-type="bibr" rid="ref13">13</xref>]. Also, using big data and machine learning (ML) technologies is promising for childhood pneumonia in low- and middle-income countries (LMICs), especially patient-risk stratification for developing severe disease and mortality [<xref ref-type="bibr" rid="ref14">14</xref>]. Because of their flexibility and high accuracy, ML models are used in medicine in the fields of prediction (prognostics) and classification (diagnostics) [<xref ref-type="bibr" rid="ref12">12</xref>]. Additionally, the use of ML offers great promise for decision support in managing community-acquired pneumonia (CAP) in children, as demonstrated in recent studies. These include predicting intensive care unit needs [<xref ref-type="bibr" rid="ref15">15</xref>], low-cost and noninvasive diagnostics for childhood pneumonia in resource-limited settings [<xref ref-type="bibr" rid="ref16">16</xref>], supporting pathogen identification at admission only using basic clinical and laboratory features [<xref ref-type="bibr" rid="ref11">11</xref>], and using natural language processing with ML for supporting clinical decisions on radiology reports [<xref ref-type="bibr" rid="ref17">17</xref>].</p><p>It has been seen that the vast majority of data science studies on pneumonia aims to provide diagnostic support to the physician by processing radiological images [<xref ref-type="bibr" rid="ref18">18</xref>]. However, diagnostic utilities are mostly unavailable in LMICs and primary care units. Therefore, physicians need prognostic support algorithms that distinguish between serious and nonserious cases without using advanced diagnostic equipment.</p><p>We aimed to develop an ML-based clinical decision support tool for childhood pneumonia that can be used by non&#x2013;intensive care physicians, particularly those working in LMICs, in predicting the escalation of care and thereby ensuring the effective diagnosis and treatment of pneumonia, which is one of the 2025 goals of the WHO [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref3">3</xref>].</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Case Definition and Patient Selection</title><p>Our study included pediatric patients who received inpatient treatment at Hacettepe University Medical School, a large, urban, tertiary, academic medical center in Ankara, T&#x00FC;rkiye, between January 2014 and April 2020. The center serves a diverse range of pediatric patients from both urban and rural areas across the country, including those requiring advanced multidisciplinary care as well as those with less severe conditions. All patients were diagnosed with CAP based on the most recent IMCI guidelines, which provide a structured clinical framework focused on clinical features rather than advanced imaging or laboratory results [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Patients younger than 28 days of age (neonatal age), those older than 18 years, and those who had been hospitalized within the last 14 days were excluded.</p><p>The medical records of 437 patients were retrospectively examined by pediatricians, who encoded the candidate features from unstructured admission notes based on the IMCI guidelines (<xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>). These variables were chosen based on their clinical value in clinical decision-making and their availability in primary care.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Candidate features: clinical variables.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Clinical variables</td><td align="left" valign="bottom">Description</td></tr></thead><tbody><tr><td align="left" valign="top">Age</td><td align="left" valign="top">Age in months at the time of admission</td></tr><tr><td align="left" valign="top">Weight (<italic>z</italic> score)</td><td align="left" valign="top">Standardized score based on Turkish children reference values [<xref ref-type="bibr" rid="ref20">20</xref>], indirectly reflecting nutritional status</td></tr><tr><td align="left" valign="top">Gender</td><td align="left" valign="top">Biological sex (male or female)</td></tr><tr><td align="left" valign="top">Complaint period</td><td align="left" valign="top">Duration (days) from symptom onset to admission</td></tr><tr><td align="left" valign="top">Comorbidity</td><td align="left" valign="top">Presence of any significant underlying medical conditions, including congenital disorders, genetic syndromes, neuromuscular diseases, and chronic respiratory or cardiac issues</td></tr><tr><td align="left" valign="top">Recent antibiotics usage</td><td align="left" valign="top">Prescribed oral antibiotic use within the 14 days before admission, suggesting an inadequately treated infection or failure to respond initial care</td></tr><tr><td align="left" valign="top">Fever</td><td align="left" valign="top">Presence of elevated body temperature at admission</td></tr><tr><td align="left" valign="top">Cough</td><td align="left" valign="top">A key respiratory symptom at admission</td></tr><tr><td align="left" valign="top">Loss of appetite</td><td align="left" valign="top">Sign of systemic illness, reflecting impact on the patient&#x2019;s well-being</td></tr><tr><td align="left" valign="top">Respiratory distress</td><td align="left" valign="top">Presence of shortness of breath, rapid breathing (tachypnea), nasal flaring, or chest wall retractions at initial examination</td></tr><tr><td align="left" valign="top">Abnormal lung sounds</td><td align="left" valign="top">Auscultatory findings (eg, crackles or wheezing), indicative of pulmonary pathology at initial examination</td></tr><tr><td align="left" valign="top">Hypoxia</td><td align="left" valign="top">SaO<sub>2</sub><sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> measured by pulse oximetry; hypoxia is defined as SaO<sub>2</sub> below 92% at initial examination</td></tr><tr><td align="left" valign="top">Level of care severity</td><td align="left" valign="top">Primary outcome; whether the patient requires pneumonia care at a tertiary care unit, including PICU<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> admission or respiratory support (oxygenation or ventilation), at any point during the hospital stay</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>SaO<sub>2</sub>: peripheral blood oxygen saturation.</p></fn><fn id="table1fn2"><p><sup>b</sup>PICU: pediatric intensive care unit.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Candidate features: laboratory variables.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Laboratory variables</td><td align="left" valign="top">Unit</td></tr></thead><tbody><tr><td align="left" valign="top">Hemoglobin</td><td align="left" valign="top">Grams per deciliter (g/dL)</td></tr><tr><td align="left" valign="top">Leukocytes</td><td align="left" valign="top">Cells per liter (&#x00D7;10<sup>6</sup>/L)</td></tr><tr><td align="left" valign="top">Lymphocytes</td><td align="left" valign="top">Cells per liter (&#x00D7;10<sup>6</sup>/L)</td></tr><tr><td align="left" valign="top">Neutrophils</td><td align="left" valign="top">Cells per liter (&#x00D7;10<sup>6</sup>/L)</td></tr><tr><td align="left" valign="top">Platelets</td><td align="left" valign="top">Cells per liter (&#x00D7;10<sup>9</sup>/L)</td></tr><tr><td align="left" valign="top">C-reactive protein</td><td align="left" valign="top">Milligrams per liter (mg/L)</td></tr><tr><td align="left" valign="top">Albumin</td><td align="left" valign="top">Grams per deciliter (g/dL)</td></tr><tr><td align="left" valign="top">Sodium</td><td align="left" valign="top">Milliequivalents per liter (mEq/L)</td></tr><tr><td align="left" valign="top">Aspartate aminotransferase</td><td align="left" valign="top">Units per liter (U/L)</td></tr><tr><td align="left" valign="top">Alanine aminotransferase</td><td align="left" valign="top">Units per liter (U/L)</td></tr></tbody></table></table-wrap><p>The primary outcome was the &#x201C;level of care severity,&#x201D; scaled as severe or nonsevere. This categorization was made by physician-encoders based on whether the patient required referral to a tertiary care unit, using medical notes during the hospital stay. Children classified as severe included those admitted to the pediatric intensive care unit or those who required oxygenation or ventilation support at any time during the hospital stay.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>This study&#x2019;s design and procedures were approved by the Hacettepe University Clinical Research Ethics Committee with protocol GO-20/1182. Since this study is a retrospective analysis using previously collected data, informed consent was not required as per the ethics committee&#x2019;s approval. All data used in this study were deidentified before analysis to ensure participant privacy and confidentiality. No compensation was provided to participants, as this study did not involve direct human participant recruitment.</p></sec><sec id="s2-3"><title>Study Population</title><p>This study included 437 hospitalized patients with CAP, categorized into nonsevere (n=133, 30.4%) and severe cases (n=304, 69.6%). Demographic and clinical candidate variables, along with laboratory indices, were collected. Group comparisons were made using the Mann-Whitney <italic>U</italic> test for continuous variables and the <italic>&#x03C7;</italic><sup>2</sup> test for categorical variables, with significance set at <italic>P</italic>&#x003C;.05. A summary of these characteristics and statistical comparisons are provided in <xref ref-type="table" rid="table3">Table 3</xref>.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Characteristics of the study population by level of care severity (N=437).</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Candidate variables</td><td align="left" valign="bottom">Nonsevere (n=133, 30.4%)</td><td align="left" valign="bottom">Severe (n=304, 69.6%)</td><td align="left" valign="bottom">Test statistic (<italic>df</italic>)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Age (months), median (IQR)</td><td align="left" valign="top">44 (13 to 98)</td><td align="left" valign="top">23 (7 to 64.5)</td><td align="left" valign="top">16,602<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top">Weight (<italic>z</italic> scores), median (IQR)</td><td align="left" valign="top">&#x2212;0.57 (&#x2212;1.4 to 0.45)</td><td align="left" valign="top">&#x2212;0.7 (&#x2212;2.5 to 0.4)</td><td align="left" valign="top">17,784<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.045</td></tr><tr><td align="left" valign="top">Complaint period (days), median (IQR)</td><td align="left" valign="top">4 (2 to 7)</td><td align="left" valign="top">4 (2 to 7)</td><td align="left" valign="top">19,274<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.44</td></tr><tr><td align="left" valign="top" colspan="3">Gender, n (%)</td><td align="left" valign="top">0.05<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.83</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">68 (30.9)</td><td align="left" valign="top">152 (69.1)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">65 (30)</td><td align="left" valign="top">152 (70)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">Comorbidity, n (%)</td><td align="left" valign="top">85 (28.7)</td><td align="left" valign="top">211 (71.3)</td><td align="left" valign="top">1.28<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> (1)</td><td align="left" valign="top">.26</td></tr><tr><td align="left" valign="top">Recent antibiotic usage, n (%)</td><td align="left" valign="top">40 (26.3)</td><td align="left" valign="top">112 (73.7)</td><td align="left" valign="top">1.87<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> (1)</td><td align="left" valign="top">.17</td></tr><tr><td align="left" valign="top">Fever, n (%)</td><td align="left" valign="top">100 (32.3)</td><td align="left" valign="top">210 (67.7)</td><td align="left" valign="top">1.68<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> (1)</td><td align="left" valign="top">.20</td></tr><tr><td align="left" valign="top">Cough, n (%)</td><td align="left" valign="top">115 (31.3)</td><td align="left" valign="top">253 (68.8)</td><td align="left" valign="top">0.50<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> (1)</td><td align="left" valign="top">.48</td></tr><tr><td align="left" valign="top">Loss of appetite, n (%)</td><td align="left" valign="top">37 (32)</td><td align="left" valign="top">80 (68)</td><td align="left" valign="top">0.11<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> (1)</td><td align="left" valign="top">.74</td></tr><tr><td align="left" valign="top">Respiratory distress, n (%)</td><td align="left" valign="top">43 (17.1)</td><td align="left" valign="top">208 (82.9)</td><td align="left" valign="top">49.30<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> (1)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Abnormal lung sounds, n (%)</td><td align="left" valign="top">102 (26.9)</td><td align="left" valign="top">277 (73.1)</td><td align="left" valign="top">16.70<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> (1)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Hypoxia, n (%)</td><td align="left" valign="top">20 (7.7)</td><td align="left" valign="top">240 (92.3)</td><td align="left" valign="top">156.82<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> (1)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Hemoglobin (g/dL), median (IQR)</td><td align="left" valign="top">11.6 (10.4 to 12.9)</td><td align="left" valign="top">11.6 (10.6 to 12.6)</td><td align="left" valign="top">20,022<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.87</td></tr><tr><td align="left" valign="top">Leukocytes (&#x00D7;10<sup>6</sup>/L), median (IQR)</td><td align="left" valign="top">9900 (6800 to 14,600)</td><td align="left" valign="top">10,950 (8050 to 15,850)</td><td align="left" valign="top">17,837<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.05</td></tr><tr><td align="left" valign="top">Lymphocytes (&#x00D7;10<sup>6</sup>/L), median (IQR)</td><td align="left" valign="top">2300 (1400 to 3700)</td><td align="left" valign="top">2800 (1900 to 4400)</td><td align="left" valign="top">17,039<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.01</td></tr><tr><td align="left" valign="top">Neutrophils (&#x00D7;10<sup>6</sup>/L), median (IQR)</td><td align="left" valign="top">5285 (2700 to 9200)</td><td align="left" valign="top">6500 (3650 to 10,900)</td><td align="left" valign="top">17,645<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.045</td></tr><tr><td align="left" valign="top">Platelets (&#x00D7;10<sup>9</sup>/L), median (IQR)</td><td align="left" valign="top">310 (225 to 386)</td><td align="left" valign="top">317.5 (230.5 to 425)</td><td align="left" valign="top">19,399<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.50</td></tr><tr><td align="left" valign="top">C-reactive protein (mg/L), median (IQR)</td><td align="left" valign="top">2.06 (0.79 to 7.67)</td><td align="left" valign="top">2.06 (0.83 to 7.35)</td><td align="left" valign="top">19,842<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.76</td></tr><tr><td align="left" valign="top">Albumin (g/dL), median (IQR)</td><td align="left" valign="top">3.9 (3.73 to 4.2)</td><td align="left" valign="top">3.9 (3.4 to 4.2)</td><td align="left" valign="top">17,121<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.01</td></tr><tr><td align="left" valign="top">Sodium (mEq/L), median (IQR)</td><td align="left" valign="top">136 (135 to 138)</td><td align="left" valign="top">136 (134 to 138)</td><td align="left" valign="top">19,657<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.64</td></tr><tr><td align="left" valign="top">Aspartate aminotransferase (U/L), median (IQR)</td><td align="left" valign="top">35 (26 to 42)</td><td align="left" valign="top">35 (28 to 50)</td><td align="left" valign="top">18,382<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.13</td></tr><tr><td align="left" valign="top">Alanine aminotransferase (U/L), median (IQR)</td><td align="left" valign="top">17 (12 to 26)</td><td align="left" valign="top">18 (13 to 29)</td><td align="left" valign="top">18,457<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">.15</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>Mann-Whitney <italic>U</italic> test.</p></fn><fn id="table3fn2"><p><sup>b</sup>Chi-square test.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-4"><title>Data Preprocessing</title><p>Data preprocessing, analysis, visualization, and model setup were conducted using Python (version 3.12; Python Software Foundation). We used Python libraries such as <italic>Pandas</italic>, <italic>NumPy</italic>, <italic>Matplotlib</italic>, <italic>Seaborn</italic>, and <italic>Plotly</italic> for exploratory data analysis. For model development, the <italic>PyCaret</italic> library was used, which includes an unsupervised anomaly detection module to identify and handle anomalous data points. <italic>PyCaret</italic> also offers various preprocessing modules to iteratively handle missing data using the light gradient boosting machine (LightGBM) algorithm. In this method, missing values were treated as dependent variables and predicted based on other available features, minimizing bias. Individual feature weights were applied during this process. Specifically, of the 415 cases, the following features had missing values: C-reactive protein (n=34, 8.2%), albumin (n=10, 2.4%), sodium (n=8, 1.9%), aspartate aminotransferase (n=16, 3.9%), and alanine aminotransferase (n=16, 3.9%). For numerical data, min-max scaling was applied, while categorical data were processed using one-hot encoding. These preprocessing steps ensured the dataset was well prepared for model training and validation.</p></sec><sec id="s2-5"><title>Handling the Imbalanced Dataset</title><p>The balance of the dataset was assessed using Shannon entropy, yielding a value of 0.7, which indicates an imbalanced dataset. To address this, we applied Synthetic Minority Oversampling Technique (SMOTE)&#x2013;Tomek, a refined variation of the widely recognized SMOTE. This approach combines oversampling of the minority class with the removal of overlapping samples from the majority class through Tomek links. So, the ratio of samples becomes 1:1. The <italic>Imblearn</italic> library was used for implementing data oversampling.</p><p>The dataset was split into two sets using the <italic>train_test_split</italic> method of the <italic>SciKit-Learn</italic> library. In the beginning, we allocated 5% of the general dataset as test data in order to prevent data leakage. The remaining 95% was split into training (352/415, 85%) and validation (63/415, 15%) sets.</p></sec><sec id="s2-6"><title>Algorithms</title><p><italic>PyCaret</italic> provides efficient implementations of state-of-the-art algorithms and is reusable among scientific disciplines. We used the <italic>PyCaret</italic> classifier module for classification, which includes the following models: ridge classifier, linear discriminant analysis, na&#x00EF;ve Bayes, extra tree classifier, extreme gradient boosting (XGBoost), random forest, gradient boosting classifier, LightGBM, CatBoost classifier, logistic regression, k-neighbors classifier, decision tree, AdaBoost classifier, quadratic discriminant analysis, support vector machine with linear kernel, and dummy classifier.</p><p>In our work, we considered 10-fold cross-validation. While developing our model with <italic>PyCaret</italic> tools, we implemented the tuning function using the <italic>Tune-Sklearn</italic> library and the <italic>hyper-band</italic> optimization algorithm to obtain a set of best-performing parameters. For ensembling, we also used <italic>PyCaret</italic> classifier ensemble, stack, and blender methods. Ensembling methods have strong evidence that they can significantly enhance the accuracy of classifications [<xref ref-type="bibr" rid="ref21">21</xref>]. After the optimization of parameters, in the last phase, we used the most common ensemble methods provided by the <italic>PyCaret</italic> library to further improve our model&#x2019;s performance (<xref ref-type="fig" rid="figure1">Figure 1</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>The experimental setup: in this figure, we illustrate the experimental process of our models. Initially, we cleaned the data by identifying 5% of cases as abnormal data using unsupervised learning. We then split the data into a train set (85%) and a validation set (15%) using the <italic>PyCaret</italic> classifier model. The base model with the highest AUC-ROC value was the RF algorithm. Subsequently, we determined the optimal number of features as 18 using RFECV and selected the top 18 features based on Shapley values. We then balanced the dataset using the SMOTE-Tomek method and developed high-performing models. After optimizing the hyperparameters, we selected the best-performing model and created new models by using ensemble methods. In parallel, we developed a new model using only clinical findings for clinical prediction. AdaBoost: AdaBoost classifier; AUC-ROC: area under the receiver operator characteristic curve; CatBoost: CatBoost classifier; DT: decision tree; Dummy: dummy classifier; ET: extra tree classifier; GBC: gradient boosting classifier; KNN: k-neighbors classifier; LDA: linear discriminant analysis; LightGBM: light gradient boosting machine; LR: logistic regression; NB: na&#x00EF;ve Bayes; QDA: quadratic discriminant analysis; RF: random forest; RFECV: recursive feature elimination with cross-validation; Ridge: ridge classifier; SMOTE: Synthetic Minority Oversampling Technique; SVM: support vector machine linear kernel classifier; XGBoost: extreme gradient boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="xmed_v6i1e57719_fig01.png"/></fig></sec><sec id="s2-7"><title>Feature Selection and Data-Reducing Methods</title><p>Feature selection is a process of one-by-one evaluation to determine which features are effective on the results within the dataset. Irrelevant or partially relevant features can negatively impact ML model performance and make the ML model learn based on irrelevant features. These methods are aimed at eliminating irrelevant features and keeping the strong features to reduce the dimension of the dataset. Recursive feature elimination is a feature selection method that fits a model and removes the irrelevant features until the specified number of features is reached. Recursive feature elimination with cross-validation (RFECV) aims to select the optimal number of features using permutation importance and recursive feature elimination. In this study, we used the <italic>RFECV</italic> module from <italic>yellowbrick</italic> library for selecting the optimum feature number. The Shapley additive explanations (SHAP) method is an innovative tool for explaining ML decision-making processes for datasets. The goal of the SHAP method is to present and explain the prediction with respect to the contribution of each feature to the predicted value. In RFECV, the features are ranked by a permutation importance measure. The SHAP algorithm was used for feature selection (<xref ref-type="fig" rid="figure2">Figure 2</xref>), as it provides more consistent and accurate importance values compared to the permutation approach. Ultimately, RFECV algorithms showed that 18 parameters are sufficient to explain nearly 90% of variances. Overall, 13 clinical and 5 laboratory variables were selected according to their SHAP values (<xref ref-type="fig" rid="figure2">Figure 2</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Feature selection: SHAP values are presented for the random forest classifier model with the highest AUC-ROC score in the dataset before feature selection, using the <italic>SHAP</italic> library&#x2019;s <italic>plot_summary</italic> module. The y-axis shows the importance of each feature, with the most important feature at the top and the least important at the bottom. The colors represent the contribution of each feature to the model&#x2019;s prediction. For example, features that have a large positive contribution to the prediction are shown in a warm color (eg, red), while features that have a large negative contribution are shown in a cool color (eg, blue). In this example, hypoxia is the most important attribute in the plot. The presence of hypoxia (hypoxia=1) causes the model to move closer to the target class, while its absence causes the model to move away from the target class. This predicts that hypoxia is an aggravating factor, while high levels of albumin have a protective effect for the target class. In summary, hypoxia is an adverse factor, and high albumin levels are protective. ALT: alanine aminotransferase; AST: aspartate aminotransferase; AUC-ROC: area under the receiver operator characteristic curve; CRP: C-reactive protein; SHAP: Shapley additive explanations.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="xmed_v6i1e57719_fig02.png"/></fig></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Study Population Characteristics</title><p>A comparison of the demographic and clinical characteristics between the nonsevere and severe groups is presented in <xref ref-type="table" rid="table3">Table 3</xref>. Of the 437 patients, 304 (69.6%) met the primary outcome, requiring the escalation of care. Patients in the severe care group were significantly younger, with a median age of 23 months compared to 44 months in the nonsevere level of care group (<italic>P</italic>=.003). Additionally, the severe group had lower weight <italic>z</italic> scores (<italic>P</italic>=.045).</p><p>Key clinical differences included higher rates of respiratory distress (208/304, 82.9% vs 43/133, 17.1%; <italic>P</italic>&#x003C;.001), abnormal lung sounds (277/304, 73.1% vs 102/133, 26.9%; <italic>P</italic>&#x003C;.001), and hypoxia (240/304, 92.3% vs 20/133, 7.7%; <italic>P</italic>&#x003C;.001) in the severe group. In terms of laboratory findings, the severe group had higher leukocyte counts (<italic>P</italic>=.005), neutrophil counts (<italic>P</italic>=.045), and lymphocyte counts (<italic>P</italic>=.001). Albumin levels were slightly lower in the severe group (<italic>P</italic>=.01). No significant differences were observed between the groups in gender distribution (<italic>P</italic>=.83), comorbidities (<italic>P</italic>=.26), recent antibiotic use (<italic>P</italic>=.17), or C-reactive protein levels (<italic>P</italic>=.76).</p></sec><sec id="s3-2"><title>Model Performances</title><p>In this section, we present a comparison of the performance of 16 different algorithms for raw and preprocessed datasets. We used various evaluation metrics such as accuracy, area under the receiver operator characteristic curve (AUC-ROC), recall, precision, <italic>F</italic><sub>1</sub>-score, Cohen &#x03BA;, and Matthews correlation coefficient to assess model performance. To analyze model performance, all prediction experiments were conducted using 10-fold cross-validation. Subsequently, the models were optimized, and their performances were evaluated on a balanced dataset using SMOTE-Tomek and feature selection. The performances of the three models with the highest performance (CatBoost, XGBoost, and LightGBM) were evaluated by applying hyperparameter optimization and ensemble methods. <xref ref-type="table" rid="table4">Table 4</xref> compares the results obtained with CatBoost, XGBoost, and LightGBM among the optimized and nonoptimized results, as well as the results of the combinations with the highest performance from the basic ensembling methods (ensembling, blending, and stacking methods). The highest AUC-ROC value was achieved by using optimized LightGBM as the meta-model in the stacking method.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Comparative performance of machine learning models for the escalation of care prediction. Italicized values represent the highest scores for each column.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom">AUC-ROC<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="left" valign="bottom">AUC-PRC<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup></td><td align="left" valign="bottom">Recall</td><td align="left" valign="bottom">Precision</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="bottom">Cohen &#x03BA;</td><td align="left" valign="bottom">MCC<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">CatBoost<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup></td><td align="left" valign="top">0.77</td><td align="left" valign="top">0.85</td><td align="left" valign="top">0.94</td><td align="left" valign="top">0.75</td><td align="left" valign="top">0.91</td><td align="left" valign="top">0.82</td><td align="left" valign="top">0.52</td><td align="left" valign="top">0.54</td></tr><tr><td align="left" valign="top">LightGBM<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup><sup>,<xref ref-type="table-fn" rid="table4fn6">f</xref></sup></td><td align="left" valign="top">0.80</td><td align="left" valign="top">0.87</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.79</td><td align="left" valign="top">0.92</td><td align="left" valign="top">0.85</td><td align="left" valign="top">0.58</td><td align="left" valign="top">0.59</td></tr><tr><td align="left" valign="top">XGBoost<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup><sup>,<xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td><td align="left" valign="top">0.77</td><td align="left" valign="top">0.83</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.72</td><td align="left" valign="top"><italic>0.94</italic></td><td align="left" valign="top">0.82</td><td align="left" valign="top">0.54</td><td align="left" valign="top">0.57</td></tr><tr><td align="left" valign="top">Ensembling<sup><xref ref-type="table-fn" rid="table4fn8">h</xref></sup></td><td align="left" valign="top">0.77</td><td align="left" valign="top">0.86</td><td align="left" valign="top">0.95</td><td align="left" valign="top">0.72</td><td align="left" valign="top"><italic>0.94</italic></td><td align="left" valign="top">0.82</td><td align="left" valign="top">0.54</td><td align="left" valign="top">0.57</td></tr><tr><td align="left" valign="top">Stacking<sup><xref ref-type="table-fn" rid="table4fn9">i</xref></sup></td><td align="left" valign="top">0.80</td><td align="left" valign="top"><italic>0</italic>.88</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.79</td><td align="left" valign="top">0.92</td><td align="left" valign="top">0.85</td><td align="left" valign="top">0.58</td><td align="left" valign="top">0.59</td></tr><tr><td align="left" valign="top">Blending-1<sup><xref ref-type="table-fn" rid="table4fn10">j</xref></sup></td><td align="left" valign="top">0.77</td><td align="left" valign="top">0.86</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.75</td><td align="left" valign="top">0.91</td><td align="left" valign="top">0.82</td><td align="left" valign="top">0.52</td><td align="left" valign="top">0.57</td></tr><tr><td align="left" valign="top">Blending-2<sup><xref ref-type="table-fn" rid="table4fn11">k</xref></sup></td><td align="left" valign="top"><italic>0</italic>.85</td><td align="left" valign="top">0.84</td><td align="left" valign="top">0.96</td><td align="left" valign="top"><italic>0</italic>.95</td><td align="left" valign="top">0.85</td><td align="left" valign="top"><italic>0.90</italic></td><td align="left" valign="top"><italic>0.63</italic></td><td align="left" valign="top"><italic>0.64</italic></td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>AUC-ROC: area under the receiver operating characteristic curve.</p></fn><fn id="table4fn2"><p><sup>b</sup>AUC-PRC: area under the precision-recall curve.</p></fn><fn id="table4fn3"><p><sup>c</sup>MCC: Matthews correlation coefficient.</p></fn><fn id="table4fn4"><p><sup>d</sup>The performance of unoptimized CatBoost.</p></fn><fn id="table4fn5"><p><sup>e</sup>LightGBM: light gradient boosting machine.</p></fn><fn id="table4fn6"><p><sup>f</sup>The performance values obtained after optimization of XGBoost and LightGBM.</p></fn><fn id="table4fn7"><p><sup>g</sup>XGBoost: extreme gradient boosting.</p></fn><fn id="table4fn8"><p><sup>h</sup>The performance of the optimized LightGBM ensembling method, which achieved the highest results among CatBoost, XGBoost, and LightGBM algorithms.</p></fn><fn id="table4fn9"><p><sup>i</sup>The performance of the model with optimized LightGBM as a meta-model in the stacking method, as it showed the highest performance.</p></fn><fn id="table4fn10"><p><sup>j</sup>The combination of optimized LightGBM and XGBoost with higher performance in the blending method.</p></fn><fn id="table4fn11"><p><sup>k</sup>Using the top-5, highest-ranked clinical features, the peak performance was realized by using a method that incorporated the optimized CatBoost, LightGBM, and XGBoost models.</p></fn></table-wrap-foot></table-wrap><p>In addition to the metrics reported in <xref ref-type="table" rid="table4">Table 4</xref>, we evaluated the performance of the <italic>Blending-2</italic> model using the precision-recall curve metric, which is particularly useful for imbalanced datasets. The precision-recall curve plot for this model, using the top-5 ranked clinical features, is provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The model achieved a strong average precision-recall score of 0.96, further highlighting its robustness in handling imbalanced data.</p></sec><sec id="s3-3"><title>Feature Importance</title><p>The optimized LightGBM in the model, developed with balanced and feature-selected data, was responsible for the attainment of the highest performance. Upon evaluation of clinical features according to SHAP values, a ranking was established based on their feature importance scores, with the highest score being garnered by the top-5 clinical features (hypoxia, respiratory distress, age, <italic>z</italic> score of weight for age, and antibiotic usage before admission; <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). The application of a workflow using these 5 features, as done previously, resulted in the highest accuracy performance (84%), which was achieved through the use of the ensemble method, incorporating the blending method of the optimized CatBoost, LightGBM, and XGBoost models.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><p>Pneumonia, the leading cause of childhood mortality, is also one of the most common causes of hospitalization [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. It remains a significant global health burden, particularly in children aged &#x003C;5 years, where timely and accurate clinical management is crucial for reducing mortality [<xref ref-type="bibr" rid="ref8">8</xref>]. While prevention strategies are well documented, the clinical challenge lies in efficiently identifying patients who require escalated care. In this study, we present a contemporary approach to building an ML-based, prognostic care referral decision support tool that assists primary care physicians in determining where the case should be managed with an accuracy of more than 80%.</p><p>Today, there is widespread knowledge of the prevention, diagnosis, treatment, and management of complications in CAP, but due to resource limitations, it is not possible for all physicians and patients to benefit from this [<xref ref-type="bibr" rid="ref14">14</xref>]. Recent advancements in medical informatics have the potential to reduce health care disparities and empower physicians in resource-limited settings [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref15">15</xref>], offering new hope for identifying high-risk populations and preventing mortality where current methods fall short.</p><p>The recent COVID-19 pandemic has impacted several medical fields, including the disruption of research practices by shifting researchers&#x2019; focus and patient recruitment [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>] and significantly reducing the incidence of non&#x2013;COVID-19 pneumonia by preventing transmission [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref27">27</xref>]. In the current postpandemic state, non&#x2013;COVID-19 childhood pneumonia remains a global health concern, especially in resource-limited settings according to the most recent reports [<xref ref-type="bibr" rid="ref2">2</xref>], with respiratory infections likely to rise again as pandemic measures have already been eased [<xref ref-type="bibr" rid="ref28">28</xref>]. Now, focusing back to reducing the mortality of CAP is critical to ensure pediatric pneumonia care benefits from recent advancements that COVID-19 provided [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. This study, built primarily on prepandemic cases, provides a foundational context for future studies on CAP using ML in the postpandemic era.</p><p>Since March 2020, a substantial amount of data about COVID-19 have been published, including COVID-19&#x2013;related artificial intelligence studies focused on pneumonia diagnosis by radiological findings [<xref ref-type="bibr" rid="ref31">31</xref>]. However, pneumonia diagnosis is clinical, and routine chest radiographs are not necessary for the confirmation diagnosis [<xref ref-type="bibr" rid="ref32">32</xref>] and do not improve outcomes [<xref ref-type="bibr" rid="ref33">33</xref>]. In addition, chest radiography can be used only in inpatient settings to identify complications or evaluate response to treatment.</p><p>Although strong diagnostic support algorithms have been published in pneumonia-related studies in recent years, there is still a need for prognostic studies for pneumonia management [<xref ref-type="bibr" rid="ref31">31</xref>]. Determining the severity of a disease or predicting its prognosis answers essential questions of physicians in medical decision-making, such as &#x201C;Where should it be treated? Outpatient? ICU?&#x201D; &#x201C;Which therapy should I start? How long should I give it?&#x201D; and &#x201C;When should I discharge the patient? When should I call for control?&#x201D; There are several studies and guidelines in the literature for severity assessment and prognosis prediction of pneumonia [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. For the majority, mortality and the development of complications were the primary outcomes, and clinical, radiological, and laboratory variables are the key predictors. Yet, there is a limited number of studies predicting required referral to tertiary care based on basic clinical and laboratory features available in primary care settings [<xref ref-type="bibr" rid="ref15">15</xref>].</p><p>This study reviewed important pneumonia prognostic predictors of children hospitalized in a major academic medical center. The primary outcome of interest was the level of care severity, classified as severe or nonsevere based on the need for pediatric intensive care unit admission or oxygen/ventilation support. The main objective of this study was not only to build the best model but also to answer the primary care physician&#x2019;s question: &#x201C;Where should the case be managed?&#x201D; Our model demonstrated promising predictive accuracy, with an AUC-ROC exceeding 0.85 and an accuracy of 77% to 88% (<xref ref-type="table" rid="table4">Table 4</xref>). The key clinical features identified&#x2014;hypoxia, respiratory distress, age, <italic>z</italic> score of weight for age, and complaint period (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>)&#x2014;align with existing clinical guidelines, which emphasize the importance of respiratory and nutritional status in predicting disease severity [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref36">36</xref>].</p><p>In this study, we used SMOTE-Tomek, a method proven effective in medical tasks, to address class imbalance without losing valuable clinical information [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>], which was essential given the significantly imbalanced and small sample&#x2013;sized dataset. Additionally, we used RFECV and SHAP, both of which have been established as robust methods in previous studies [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>], for feature selection. These techniques not only improved our model&#x2019;s performance but also allowed us to isolate the most clinically significant features (<xref ref-type="fig" rid="figure2">Figure 2</xref>, also see <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>), enabling clinicians to decide using their own skills without involving additional diagnostic tools.</p><p>The clinical application of a prognostic care decision model is particularly relevant in settings where early and accurate escalation of care is needed. For example, by focusing on these top-5 clinical features or using a decision support tool like ours, even less experienced primary care physicians could assess risk and anticipate tertiary care referrals without advanced diagnostics. Additionally, in emergency settings, these tools could assist in triaging patients to prioritize those needing immediate respiratory support or mechanical ventilation, allowing earlier interventions and more effective resource allocation&#x2014;crucial for LMICs&#x2014;potentially reducing morbidity and mortality.</p><p>One significant limitation of this study is its reliance on data from a single tertiary hospital (Hacettepe University), which may limit generalizability. While the dataset includes patients referred from both urban and rural areas, the focus on a tertiary center introduces a selection bias, as most cases represent severe care levels (304/437, 69.6%). This is likely because less severe CAP cases are managed in primary or secondary care, not referred to tertiary centers, limiting the model&#x2019;s applicability in less severe cases. Additionally, the relatively small sample size of 437 patients limits the model&#x2019;s generalizability, as larger datasets are typically needed to optimize ML models and ensure robust performance across diverse populations. Expanding the dataset to include patients from multiple centers, especially primary and secondary care institutions, could improve the model&#x2019;s generalizability and applicability. Lastly, the retrospective nature of the data and the missing time frames of tertiary care unit transfers may not fully capture real-time clinical decision-making or the urgency of care decisions.</p><p>In conclusion, this study demonstrates the feasibility of developing an ML-based prognostic decision support tool for childhood pneumonia referral, with an accuracy of 77% to 88%. Incorporating foundational clinical skills for key prognostic predictors with advanced data science methods holds promise for improving pneumonia outcomes by accurately predicting the need for the escalation of care.</p></sec></body><back><ack><p>During the preparation of this work, the authors used OpenAI GPT-4o [<xref ref-type="bibr" rid="ref41">41</xref>] to restructure sentences for enhanced readability, as they are not native English speakers. After using this tool/service, the authors reviewed and edited the content as needed and took full responsibility for the content of the publication.</p></ack><fn-group><fn fn-type="con"><p>OS contributed to the creation of the work plan, interpretation of statistical analysis and machine learning algorithms, coinvestigation of the literature, and writing the revised manuscript. ITA contributed to the building of machine learning algorithms, coinvestigation of the literature, and writing the results and methods. SBC contributed to scanning patients from the hospital electronic health record system and encoding the attributes of the patients&#x2019; data in the case report form (&#x201C;Human Encoder-1&#x201D;). BK contributed to the scanning patients from the hospital electronic health record system and encoding the attributes of the patients&#x2019; data in the case report form (&#x201C;Human Encoder-2&#x201D;). AFD contributed to the building of the machine learning algorithms and optimizing the dataset. MZU contributed to the coding of advanced statistical and machine learning algorithms, and the creation of the clinical decision support system interface. YO contributed to the creation of the work plan, interpretation of statistical analysis, and gathering the team of investigators.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUC-ROC</term><def><p>area under the receiver operator characteristic curve</p></def></def-item><def-item><term id="abb2">CAP</term><def><p>community-acquired pneumonia</p></def></def-item><def-item><term id="abb3">IMCI</term><def><p>Integrated Management of Childhood Illness</p></def></def-item><def-item><term id="abb4">LightGBM</term><def><p>light gradient boosting machine</p></def></def-item><def-item><term id="abb5">LMIC</term><def><p>low- and middle-income country</p></def></def-item><def-item><term id="abb6">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb7">RFECV</term><def><p>recursive feature elimination with cross-validation</p></def></def-item><def-item><term id="abb8">SHAP</term><def><p>Shapley additive explanations</p></def></def-item><def-item><term id="abb9">SMOTE</term><def><p>Synthetic Minority Oversampling Technique</p></def></def-item><def-item><term id="abb10">WHO</term><def><p>World Health Organization</p></def></def-item><def-item><term id="abb11">XGBoost</term><def><p>extreme gradient boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="web"><article-title>Pneumonia in children</article-title><source>World Health Organization</source><year>2022</year><month>11</month><day>11</day><access-date>2024-10-01</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/news-room/fact-sheets/detail/pneumonia">https://www.who.int/news-room/fact-sheets/detail/pneumonia</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>United Nations Inter-Agency Group for Child Mortality Estimation</collab></person-group><article-title>Levels and trends in child mortality, report 2023</article-title><source>UNICEF</source><year>2024</year><month>03</month><day>12</day><access-date>2024-10-01</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://data.unicef.org/resources/levels-and-trends-in-child-mortality-2024/">https://data.unicef.org/resources/levels-and-trends-in-child-mortality-2024/</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Qazi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Aboubaker</surname><given-names>S</given-names> </name><name name-style="western"><surname>MacLean</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Ending preventable child deaths from pneumonia and diarrhoea by 2025. development of the integrated Global Action Plan for the Prevention and Control of Pneumonia and Diarrhoea</article-title><source>Arch Dis Child</source><year>2015</year><month>02</month><volume>100 Suppl 1</volume><fpage>S23</fpage><lpage>S28</lpage><pub-id pub-id-type="doi">10.1136/archdischild-2013-305429</pub-id><pub-id pub-id-type="medline">25613963</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sazawal</surname><given-names>S</given-names> </name><name name-style="western"><surname>Black</surname><given-names>RE</given-names> </name><collab>Pneumonia Case Management Trials Group</collab></person-group><article-title>Effect of pneumonia case management on mortality in neonates, infants, and preschool children: a meta-analysis of community-based trials</article-title><source>Lancet Infect Dis</source><year>2003</year><month>09</month><volume>3</volume><issue>9</issue><fpage>547</fpage><lpage>556</lpage><pub-id pub-id-type="doi">10.1016/s1473-3099(03)00737-0</pub-id><pub-id pub-id-type="medline">12954560</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shah</surname><given-names>SN</given-names> </name><name name-style="western"><surname>Bachur</surname><given-names>RG</given-names> </name><name name-style="western"><surname>Simel</surname><given-names>DL</given-names> </name><name name-style="western"><surname>Neuman</surname><given-names>MI</given-names> </name></person-group><article-title>Does this child have pneumonia?: the rational clinical examination systematic review</article-title><source>JAMA</source><year>2017</year><month>08</month><day>1</day><volume>318</volume><issue>5</issue><fpage>462</fpage><lpage>471</lpage><pub-id pub-id-type="doi">10.1001/jama.2017.9039</pub-id><pub-id pub-id-type="medline">28763554</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>World Health Organization</collab></person-group><article-title>Handbook: IMCI integrated management of childhood illness</article-title><source>World Health Organization</source><year>2005</year><comment><ext-link ext-link-type="uri" xlink:href="https://iris.who.int/handle/10665/42939">https://iris.who.int/handle/10665/42939</ext-link></comment></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ferdous</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ahmed</surname><given-names>S</given-names> </name><name name-style="western"><surname>Das</surname><given-names>SK</given-names> </name><etal/></person-group><article-title>Pneumonia mortality and healthcare utilization in young children in rural Bangladesh: a prospective verbal autopsy study</article-title><source>Trop Med Health</source><year>2018</year><month>05</month><day>25</day><volume>46</volume><fpage>17</fpage><pub-id pub-id-type="doi">10.1186/s41182-018-0099-4</pub-id><pub-id pub-id-type="medline">29875615</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shaima</surname><given-names>SN</given-names> </name><name name-style="western"><surname>Alam</surname><given-names>T</given-names> </name><name name-style="western"><surname>Bin Shahid</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Prevalence, predictive factors, and outcomes of respiratory failure in children with pneumonia admitted in a developing country</article-title><source>Front Pediatr</source><year>2022</year><month>05</month><day>4</day><volume>10</volume><fpage>841628</fpage><pub-id pub-id-type="doi">10.3389/fped.2022.841628</pub-id><pub-id pub-id-type="medline">35601439</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sonego</surname><given-names>M</given-names> </name><name name-style="western"><surname>Pellegrin</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Becker</surname><given-names>G</given-names> </name><name name-style="western"><surname>Lazzerini</surname><given-names>M</given-names> </name></person-group><article-title>Risk factors for mortality from acute lower respiratory infections (ALRI) in children under five years of age in low and middle-income countries: a systematic review and meta-analysis of observational studies</article-title><source>PLoS One</source><year>2015</year><month>01</month><day>30</day><volume>10</volume><issue>1</issue><fpage>e0116380</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0116380</pub-id><pub-id pub-id-type="medline">25635911</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McAllister</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Shi</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Global, regional, and national estimates of pneumonia morbidity and mortality in children younger than 5 years between 2000 and 2015: a systematic analysis</article-title><source>Lancet Glob Health</source><year>2019</year><month>01</month><volume>7</volume><issue>1</issue><fpage>e47</fpage><lpage>e57</lpage><pub-id pub-id-type="doi">10.1016/S2214-109X(18)30408-X</pub-id><pub-id pub-id-type="medline">30497986</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chang</surname><given-names>TH</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>SR</given-names> </name><etal/></person-group><article-title>Clinical characteristics of hospitalized children with community-acquired pneumonia and respiratory infections: Using machine learning approaches to support pathogen prediction at admission</article-title><source>J Microbiol Immunol Infect</source><year>2023</year><month>08</month><volume>56</volume><issue>4</issue><fpage>772</fpage><lpage>781</lpage><pub-id pub-id-type="doi">10.1016/j.jmii.2023.04.011</pub-id><pub-id pub-id-type="medline">37246060</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bennett</surname><given-names>TD</given-names> </name><name name-style="western"><surname>Callahan</surname><given-names>TJ</given-names> </name><name name-style="western"><surname>Feinstein</surname><given-names>JA</given-names> </name><etal/></person-group><article-title>Data science for child health</article-title><source>J Pediatr</source><year>2019</year><month>05</month><volume>208</volume><fpage>12</fpage><lpage>22</lpage><pub-id pub-id-type="doi">10.1016/j.jpeds.2018.12.041</pub-id><pub-id pub-id-type="medline">30686480</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name><name name-style="western"><surname>P&#x00E9;rez-Stable</surname><given-names>EJ</given-names> </name><name name-style="western"><surname>Bourne</surname><given-names>PE</given-names> </name><etal/></person-group><article-title>Big data science: opportunities and challenges to address minority health and health disparities in the 21st century</article-title><source>Ethn Dis</source><year>2017</year><month>04</month><day>20</day><volume>27</volume><issue>2</issue><fpage>95</fpage><lpage>106</lpage><pub-id pub-id-type="doi">10.18865/ed.27.2.95</pub-id><pub-id pub-id-type="medline">28439179</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sheikh</surname><given-names>M</given-names> </name><name name-style="western"><surname>Jehan</surname><given-names>F</given-names> </name></person-group><article-title>Using big data for risk stratification of childhood pneumonia in low-income and middle-income countries (LMICs): challenges and opportunities</article-title><source>EBioMedicine</source><year>2021</year><month>12</month><volume>74</volume><fpage>103740</fpage><pub-id pub-id-type="doi">10.1016/j.ebiom.2021.103740</pub-id><pub-id pub-id-type="medline">34916165</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>TH</given-names> </name><etal/></person-group><article-title>Evaluation of the need for intensive care in children with pneumonia: machine learning approach</article-title><source>JMIR Med Inform</source><year>2022</year><month>01</month><day>27</day><volume>10</volume><issue>1</issue><fpage>e28934</fpage><pub-id pub-id-type="doi">10.2196/28934</pub-id><pub-id pub-id-type="medline">35084358</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kanwal</surname><given-names>K</given-names> </name><name name-style="western"><surname>Khalid</surname><given-names>SG</given-names> </name><name name-style="western"><surname>Asif</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zafar</surname><given-names>F</given-names> </name><name name-style="western"><surname>Qurashi</surname><given-names>AG</given-names> </name></person-group><article-title>Diagnosis of community-acquired pneumonia in children using photoplethysmography and machine learning-based classifier</article-title><source>Biomed Signal Process Control</source><year>2024</year><month>01</month><volume>87</volume><fpage>105367</fpage><pub-id pub-id-type="doi">10.1016/j.bspc.2023.105367</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Smith</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Spann</surname><given-names>A</given-names> </name><name name-style="western"><surname>McCoy</surname><given-names>AB</given-names> </name><etal/></person-group><article-title>Natural language processing and machine learning to enable clinical decision support for treatment of pediatric pneumonia</article-title><source>AMIA Annu Symp Proc</source><year>2020</year><month>01</month><day>25</day><volume>2020</volume><fpage>1130</fpage><lpage>1139</lpage><pub-id pub-id-type="medline">33936489</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zech</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Badgeley</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Costa</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Titano</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Oermann</surname><given-names>EK</given-names> </name></person-group><article-title>Variable generalization performance of a deep learning model to detect pneumonia in chest radiographs: a cross-sectional study</article-title><source>PLoS Med</source><year>2018</year><month>11</month><day>6</day><volume>15</volume><issue>11</issue><fpage>e1002683</fpage><pub-id pub-id-type="doi">10.1371/journal.pmed.1002683</pub-id><pub-id pub-id-type="medline">30399157</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gera</surname><given-names>T</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>D</given-names> </name><name name-style="western"><surname>Garner</surname><given-names>P</given-names> </name><name name-style="western"><surname>Richardson</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sachdev</surname><given-names>HS</given-names> </name></person-group><article-title>Integrated management of childhood illness (IMCI) strategy for children under five</article-title><source>Cochrane Database Syst Rev</source><year>2016</year><month>06</month><day>22</day><volume>2016</volume><issue>6</issue><fpage>CD010123</fpage><pub-id pub-id-type="doi">10.1002/14651858.CD010123.pub2</pub-id><pub-id pub-id-type="medline">27378094</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Neyzi</surname><given-names>O</given-names> </name><name name-style="western"><surname>Bundak</surname><given-names>R</given-names> </name><name name-style="western"><surname>G&#x00F6;k&#x00E7;ay</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Reference values for weight, height, head circumference, and body mass index in Turkish children</article-title><source>J Clin Res Pediatr Endocrinol</source><year>2015</year><month>12</month><volume>7</volume><issue>4</issue><fpage>280</fpage><lpage>293</lpage><pub-id pub-id-type="doi">10.4274/jcrpe.2183</pub-id><pub-id pub-id-type="medline">26777039</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mahajan</surname><given-names>P</given-names> </name><name name-style="western"><surname>Uddin</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hajati</surname><given-names>F</given-names> </name><name name-style="western"><surname>Moni</surname><given-names>MA</given-names> </name></person-group><article-title>Ensemble learning for disease prediction: a review</article-title><source>Healthcare (Basel)</source><year>2023</year><month>06</month><day>20</day><volume>11</volume><issue>12</issue><fpage>1808</fpage><pub-id pub-id-type="doi">10.3390/healthcare11121808</pub-id><pub-id pub-id-type="medline">37372925</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jain</surname><given-names>S</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Arnold</surname><given-names>SR</given-names> </name><etal/></person-group><article-title>Community-acquired pneumonia requiring hospitalization among U.S. children</article-title><source>N Engl J Med</source><year>2015</year><month>02</month><day>26</day><volume>372</volume><issue>9</issue><fpage>835</fpage><lpage>845</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1405870</pub-id><pub-id pub-id-type="medline">25714161</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shao</surname><given-names>JH</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>KH</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>SH</given-names> </name></person-group><article-title>COVID-19-related disruptions in implementation of a randomized control trial: an autoethnographic report</article-title><source>Appl Nurs Res</source><year>2023</year><month>08</month><volume>72</volume><fpage>151698</fpage><pub-id pub-id-type="doi">10.1016/j.apnr.2023.151698</pub-id><pub-id pub-id-type="medline">37423680</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sohrabi</surname><given-names>C</given-names> </name><name name-style="western"><surname>Mathew</surname><given-names>G</given-names> </name><name name-style="western"><surname>Franchi</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Impact of the coronavirus (COVID-19) pandemic on scientific research and implications for clinical academic training - a review</article-title><source>Int J Surg</source><year>2021</year><month>02</month><volume>86</volume><fpage>57</fpage><lpage>63</lpage><pub-id pub-id-type="doi">10.1016/j.ijsu.2020.12.008</pub-id><pub-id pub-id-type="medline">33444873</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kuitunen</surname><given-names>I</given-names> </name><name name-style="western"><surname>Artama</surname><given-names>M</given-names> </name><name name-style="western"><surname>M&#x00E4;kel&#x00E4;</surname><given-names>L</given-names> </name><name name-style="western"><surname>Backman</surname><given-names>K</given-names> </name><name name-style="western"><surname>Heiskanen-Kosma</surname><given-names>T</given-names> </name><name name-style="western"><surname>Renko</surname><given-names>M</given-names> </name></person-group><article-title>Effect of social distancing due to the COVID-19 pandemic on the incidence of viral respiratory tract infections in children in Finland during early 2020</article-title><source>Pediatr Infect Dis J</source><year>2020</year><month>12</month><volume>39</volume><issue>12</issue><fpage>e423</fpage><lpage>e427</lpage><pub-id pub-id-type="doi">10.1097/INF.0000000000002845</pub-id><pub-id pub-id-type="medline">32773660</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Changing clinical characteristics of pediatric inpatients with pneumonia during COVID-19 pandamic: a retrospective study</article-title><source>Ital J Pediatr</source><year>2024</year><month>04</month><day>23</day><volume>50</volume><issue>1</issue><fpage>84</fpage><pub-id pub-id-type="doi">10.1186/s13052-024-01651-8</pub-id><pub-id pub-id-type="medline">38650007</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>C</given-names> </name></person-group><article-title>Pediatric non-COVID-19 community-acquired pneumonia in COVID-19 pandemic</article-title><source>Int J Gen Med</source><year>2021</year><month>10</month><day>27</day><volume>14</volume><fpage>7165</fpage><lpage>7171</lpage><pub-id pub-id-type="doi">10.2147/IJGM.S333751</pub-id><pub-id pub-id-type="medline">34737611</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lastrucci</surname><given-names>V</given-names> </name><name name-style="western"><surname>Bonaccorsi</surname><given-names>G</given-names> </name><name name-style="western"><surname>Forni</surname><given-names>S</given-names> </name><etal/></person-group><article-title>The indirect impact of COVID-19 large-scale containment measures on the incidence of community-acquired pneumonia in older people: a region-wide population-based study in Tuscany, Italy</article-title><source>Int J Infect Dis</source><year>2021</year><month>08</month><volume>109</volume><fpage>182</fpage><lpage>188</lpage><pub-id pub-id-type="doi">10.1016/j.ijid.2021.06.058</pub-id><pub-id pub-id-type="medline">34216731</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Latif</surname><given-names>S</given-names> </name><name name-style="western"><surname>Usman</surname><given-names>M</given-names> </name><name name-style="western"><surname>Manzoor</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Leveraging data science to combat COVID-19: a comprehensive review</article-title><source>IEEE Trans Artif Intell</source><year>2020</year><month>09</month><day>2</day><volume>1</volume><issue>1</issue><fpage>85</fpage><lpage>103</lpage><pub-id pub-id-type="doi">10.1109/TAI.2020.3020521</pub-id><pub-id pub-id-type="medline">37982070</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>H</given-names> </name></person-group><article-title>Global research trends in pediatric COVID-19: a bibliometric analysis</article-title><source>Front Public Health</source><year>2022</year><month>02</month><day>16</day><volume>10</volume><fpage>798005</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2022.798005</pub-id><pub-id pub-id-type="medline">35252087</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chumbita</surname><given-names>M</given-names> </name><name name-style="western"><surname>Cill&#x00F3;niz</surname><given-names>C</given-names> </name><name name-style="western"><surname>Puerta-Alcalde</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Can artificial intelligence improve the management of pneumonia</article-title><source>J Clin Med</source><year>2020</year><month>01</month><day>17</day><volume>9</volume><issue>1</issue><fpage>248</fpage><pub-id pub-id-type="doi">10.3390/jcm9010248</pub-id><pub-id pub-id-type="medline">31963480</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bradley</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Byington</surname><given-names>CL</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>SS</given-names> </name><etal/></person-group><article-title>The management of community-acquired pneumonia in infants and children older than 3 months of age: clinical practice guidelines by the Pediatric Infectious Diseases Society and the Infectious Diseases Society of America</article-title><source>Clin Infect Dis</source><year>2011</year><month>10</month><volume>53</volume><issue>7</issue><fpage>e25</fpage><lpage>e76</lpage><pub-id pub-id-type="doi">10.1093/cid/cir531</pub-id><pub-id pub-id-type="medline">21880587</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Harris</surname><given-names>M</given-names> </name><name name-style="western"><surname>Clark</surname><given-names>J</given-names> </name><name name-style="western"><surname>Coote</surname><given-names>N</given-names> </name><etal/></person-group><article-title>British Thoracic Society guidelines for the management of community acquired pneumonia in children: update 2011</article-title><source>Thorax</source><year>2011</year><month>10</month><volume>66 Suppl 2</volume><fpage>ii1</fpage><lpage>23</lpage><pub-id pub-id-type="doi">10.1136/thoraxjnl-2011-200598</pub-id><pub-id pub-id-type="medline">21903691</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dean</surname><given-names>P</given-names> </name><name name-style="western"><surname>Florin</surname><given-names>TA</given-names> </name></person-group><article-title>Factors associated with pneumonia severity in children: a systematic review</article-title><source>J Pediatric Infect Dis Soc</source><year>2018</year><month>12</month><day>3</day><volume>7</volume><issue>4</issue><fpage>323</fpage><lpage>334</lpage><pub-id pub-id-type="doi">10.1093/jpids/piy046</pub-id><pub-id pub-id-type="medline">29850828</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Araya</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lovera</surname><given-names>D</given-names> </name><name name-style="western"><surname>Zarate</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Application of a prognostic scale to estimate the mortality of children hospitalized with community-acquired pneumonia</article-title><source>Pediatr Infect Dis J</source><year>2016</year><month>04</month><volume>35</volume><issue>4</issue><fpage>369</fpage><lpage>373</lpage><pub-id pub-id-type="doi">10.1097/INF.0000000000001018</pub-id><pub-id pub-id-type="medline">26629871</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Williams</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Grijalva</surname><given-names>CG</given-names> </name><etal/></person-group><article-title>Predicting severe pneumonia outcomes in children</article-title><source>Pediatrics</source><year>2016</year><month>10</month><volume>138</volume><issue>4</issue><fpage>e20161019</fpage><pub-id pub-id-type="doi">10.1542/peds.2016-1019</pub-id><pub-id pub-id-type="medline">27688362</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Zeng</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>B</given-names> </name><name name-style="western"><surname>Wei</surname><given-names>F</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>L</given-names> </name></person-group><article-title>Effective prediction of three common diseases by combining SMOTE with Tomek links technique for imbalanced medical data</article-title><conf-name>2016 IEEE International Conference of Online Analysis and Computing Science (ICOACS)</conf-name><conf-date>May 28-29, 2016</conf-date><conf-loc>Chongqing, China</conf-loc><fpage>225</fpage><lpage>228</lpage><pub-id pub-id-type="doi">10.1109/ICOACS.2016.7563084</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>R</given-names> </name><name name-style="western"><surname>Greenstein</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Fackler</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Bergmann</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bembea</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Winslow</surname><given-names>RL</given-names> </name></person-group><article-title>Prediction of impending septic shock in children with sepsis</article-title><source>Crit Care Explor</source><year>2021</year><month>06</month><day>15</day><volume>3</volume><issue>6</issue><fpage>e0442</fpage><pub-id pub-id-type="doi">10.1097/CCE.0000000000000442</pub-id><pub-id pub-id-type="medline">34151278</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Akhtar</surname><given-names>F</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Pei</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Rajput</surname><given-names>A</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Q</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Hung</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yen</surname><given-names>N</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>JW</given-names> </name></person-group><article-title>Optimal features subset selection for large for gestational age classification using GridSearch based recursive feature elimination with cross-validation scheme</article-title><source>Frontier Computing: Theory, Technologies and Applications (FC 2019). Lecture Notes in Electrical Engineering, vol 551</source><year>2020</year><publisher-name>Springer</publisher-name><fpage>63</fpage><lpage>71</lpage><pub-id pub-id-type="doi">10.1007/978-981-15-3250-4_8</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Man</surname><given-names>X</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>EP</given-names> </name></person-group><article-title>The best way to select features? comparing MDA, LIME, and SHAP</article-title><source>J Financ Data Sci Winter</source><year>2021</year><volume>3</volume><issue>1</issue><fpage>127</fpage><lpage>139</lpage><pub-id pub-id-type="doi">10.3905/jfds.2020.1.047</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="web"><article-title>GPT-4o</article-title><source>OpenAI</source><access-date>2025-02-12</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://platform.openai.com/docs/models/gpt-4o">https://platform.openai.com/docs/models/gpt-4o</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Precision-recall curve (PRC) for the blending model with top 5 features.</p><media xlink:href="xmed_v6i1e57719_app1.png" xlink:title="PNG File, 21 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Shapley additive explanations (SHAP) values forward selection method.</p><media xlink:href="xmed_v6i1e57719_app2.png" xlink:title="PNG File, 386 KB"/></supplementary-material></app-group></back></article>