Development of a Multi-Model Ensemble Tool for Early Prediction of 48-Hour Respiratory Failure Risk in CAP Patients

preprint OA: closed CC-BY-4.0
📄 Open PDF Full text JSON View at publisher
Full text 54,283 characters · extracted from preprint-html · click to expand
Development of a Multi-Model Ensemble Tool for Early Prediction of 48-Hour Respiratory Failure Risk in CAP Patients | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Development of a Multi-Model Ensemble Tool for Early Prediction of 48-Hour Respiratory Failure Risk in CAP Patients Yali Xu , Shubin Guo , Ying Chen , Andong Li , Qi Lyu , Xue Mei doi: https://doi.org/10.1101/2025.11.06.25339737 Yali Xu a Department of Emergency Medicine Clinical Research Center, Beijing Chaoyang Hospital Affiliated to Capital Medical University , Beijing, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Shubin Guo a Department of Emergency Medicine Clinical Research Center, Beijing Chaoyang Hospital Affiliated to Capital Medical University , Beijing, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: guoshubin0025{at}163.com mei_xue202507{at}163.com Ying Chen a Department of Emergency Medicine Clinical Research Center, Beijing Chaoyang Hospital Affiliated to Capital Medical University , Beijing, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Andong Li a Department of Emergency Medicine Clinical Research Center, Beijing Chaoyang Hospital Affiliated to Capital Medical University , Beijing, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Qi Lyu a Department of Emergency Medicine Clinical Research Center, Beijing Chaoyang Hospital Affiliated to Capital Medical University , Beijing, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Xue Mei a Department of Emergency Medicine Clinical Research Center, Beijing Chaoyang Hospital Affiliated to Capital Medical University , Beijing, China Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: guoshubin0025{at}163.com mei_xue202507{at}163.com Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Objective To develop a predictive tool capable of early identification of the risk of acute respiratory failure within 48 hours of hospital admission in patients with community-acquired pneumonia (CAP). Method A retrospective cohort of 257 CAP patients (median age: 76.0 years, IQR: 68.0–84.0; 56.4% male) was analyzed, among whom 148 (57.6%) developed respiratory failure within 48 hours. From 55 clinical variables, key predictors were selected using LASSO regression. Predictive models were then constructed using multivariable logistic regression (MLR) and machine learning algorithms including XGBoost, LightGBM, and Random Forest. To address the probability calibration issue of the XGBoost model, Platt scaling was applied. A final ensemble model was built by weighted averaging of the calibrated XGBoost, LightGBM, and MLR models. Feature importance was analyzed using SHAP (SHapley Additive exPlanations), and clinical utility was evaluated via decision curve analysis (DCA) and calibration plots. Result Respiratory rate, TNF-α, IL-1β, heart rate, pleural effusion, and body temperature were identified as the most important predictors. Other key features included total bilirubin, serum calcium, albumin/globulin ratio, and platelet count. The weighted ensemble model outperformed individual models, achieving an AUC of 0.792 on the test set. Conclusion We developed a predictive tool based on multi-model ensemble learning and interpretable machine learning techniques (SHAP), which provides a basis for early risk stratification and prevention of acute respiratory failure in hospitalized CAP patients. 1. Introduction Community-acquired pneumonia (CAP) is defined as an acute infection of the lower respiratory tract involving the lung parenchyma that is acquired outside of hospital settings. It remains one of the top five causes of mortality worldwide [ 1 ]. Despite ongoing advances in diagnostic technologies and antimicrobial therapies, a subset of CAP patients experience rapid disease progression after hospital admission, leading to the development of acute respiratory failure (ARF). This complication significantly complicates clinical management and markedly increases mortality risk. As one of the most common and severe complications of CAP, ARF is a major driver of poor clinical outcomes in these patients [ 2 ]. CAP patients who develop ARF are substantially more likely to require mechanical ventilation [ 3 ], with reported mortality rates reaching up to 50% [ 4 ]. Even among survivors, long-term adverse effects may persist. Hypoxemia associated with respiratory failure increases the risk of neurodegeneration, cognitive impairment [ 5 ], and delirium [ 6 ] in elderly patients, leading to reduced quality of life post-discharge [ 7 ]. Therefore, the early identification of CAP patients at risk of developing ARF during hospitalization is of critical clinical importance. Machine learning (ML) techniques have emerged as powerful tools for analyzing diverse and complex data types, and they are increasingly being applied in predictive healthcare analytics. While traditional risk stratification tools such as the CURB-65 score and the Pneumonia Severity Index (PSI) are widely recommended for CAP assessment, phenotype-based analyses suggest that these scoring systems rely on a limited number of clinical variables and may fail to capture the heterogeneity present in multimodal clinical data [ 4 ]. As a result, these conventional tools may fall short in accurately identifying CAP patients at high risk for ARF, limiting their utility in precision early warning systems. In contrast, ML algorithms are well suited to analyze high-dimensional and complex clinical datasets, as they can capture both linear and nonlinear interactions among variables, thereby uncovering synergistic relationships within the data [ 8 ]. ML-based approaches have shown significant promise in predicting respiratory failure [ 9 ]; however, studies focusing specifically on the early prediction of ARF in CAP patients remain scarce. In this study, we developed clinical prediction models to assess the risk of ARF within the first 48 hours of hospitalization in patients with CAP. We employed logistic regression and five ML algorithms: Extreme Gradient Boosting (XGBoost), Light Gradient Boosting Machine (LightGBM), k-Nearest Neighbors (KNN), Support Vector Machine (SVM), and Random Forest. These models were trained on clinical data collected at the time of hospital admission. To enhance robustness and minimize the bias associated with any single algorithm, we combined the three best-performing models using a weighted ensemble approach. Finally, to improve model interpretability, we utilized SHapley Additive exPlanations (SHAP) to identify and rank the most important predictive features. 2. Materials and Methods 2.1 Study Design and Population This was a retrospective observational study. The study population consisted of patients admitted to the Emergency Department of Beijing Chaoyang Hospital for community-acquired pneumonia (CAP) and subsequently hospitalized between September 2024 and March 2025.Inclusion criteria were as follows:1. Age ≥18 years; 2. Diagnosis consistent with CAP, defined as radiographic evidence of pulmonary infiltrates compatible with pneumonia and at least one acute lower respiratory tract infection symptom or sign: cough, chest pain, dyspnea, fever >38° C, hypothermia <35°C, or abnormal breath sounds not explained by other causes;3. Hospitalization for ≥48 hours after admission through the emergency department due to CAP.Exclusion criteria included: 1. Pregnancy;2. Presence of respiratory failure prior to admission;3. Hospitalization primarily due to other more severe internal medical conditions not related to pneumonia;4. Death within 48 hours of admission;5. Presence of primary or metastatic malignancies involving the lungs or pleura;6. Concurrent malignancy undergoing active treatment. 2.2 Data Collection Clinical data were collected from the hospital’s electronic medical records system, including: (1)Baseline characteristics:age, sex; (2) Vital signs at admission:heart rate, respiratory rate, temperature, systolic and diastolic blood pressure, and mental status; (3) Comorbidities:chronic pulmonary diseases, hypertension, coronary artery disease, cerebrovascular disease, congestive heart failure, renal dysfunction, myocardial infarction, diabetes, and history of malignancy (excluding respiratory system malignancies); (4) Laboratory tests:levels of transaminases, lactate dehydrogenase, triglycerides, total bilirubin, direct and indirect bilirubin, albumin, globulin, creatinine, blood urea nitrogen, serum sodium, potassium, calcium, phosphorus, lactate, serum glucose, N-terminal pro-brain natriuretic peptide (NT-proBNP), D-dimer, total white blood cell count, neutrophil percentage, red blood cell count, red cell distribution width, hemoglobin, platelet count, and albumin-to-globulin ratio; (5) Inflammatory and cytokine markers:C-reactive protein (CRP), procalcitonin (PCT); cytokines included tumor necrosis factor-α (TNF-α), interleukin-1β (IL-1β), IL-6, IL-8, and IL-10; (6) Radiographic findings: presence of pleural effusion on chest imaging. 2.3 Outcome Definition The primary outcome was the development of respiratory failure within 48 hours of hospital admission. Respiratory failure was defined by meeting at least one of the following criteria:1. Documentation of respiratory failure (including “respiratory failure” or “acute respiratory failure”) in the clinical records; 2. Arterial blood gas analysis showing PaO₂ ≤ 60 mmHg or an acute increase in PaCO₂ ≥ 45 mmHg within 48 hours of admission; 3. Clinical records indicating the use of high-flow oxygen therapy or mechanical ventilation. 2.4 Data Preprocessing Samples with >20% missing data were excluded. For variables with missing values, multiple imputation was performed using the ‘mice’ package (version 3.17.0) in R. Outliers in clinical and laboratory data—such as vital signs and biochemical values—were retained, as they may hold significant clinical meaning. Some lab test results that exceeded detectable limits were recorded in the electronic system using symbols such as “>” or “ 50pg/mL). Since such symbolic values cannot be processed by machine learning algorithms, we replaced these values with the respective maximum or minimum detectable limit values. 2.5 Model Development and Validation We employed several supervised learning algorithms to construct predictive models: multivariable logistic regression (MLR), k-nearest neighbors (KNN), support vector machine (SVM), extreme gradient boosting (XGBoost), random forest (RF), and Light Gradient Boosting Machine (LightGBM). Patients were randomly divided into a training set and a test set at a 7:3 ratio. Ten-fold cross-validation was used during model training to prevent overfitting and enhance generalizability. Model performance was assessed using the area under the receiver operating characteristic curve (AUROC), and clinical utility was evaluated through decision curve analysis (DCA).Additionally, we developed an ensemble model by averaging the three top-performing models on the test set using a weighted approach. This ensemble strategy was intended to reduce bias introduced by the inherent limitations of any single algorithm and improve prediction performance for respiratory failure. 3. Statistical Analysis All data processing and statistical analyses were performed using R software (version 4.1.3). Categorical variables were expressed as counts and percentages (N, %) and compared between groups using the chi-square test. For continuous variables, the distribution was first assessed for normality. Normally distributed variables were presented as mean (standard deviation (SD))and compared using the t-test. Non-normally distributed variables were reported as median and interquartile range (IQR: Q1-Q3) and analyzed using the Mann–Whitney U test. A p-value < 0.05 was considered statistically significant. 4. Results 4.1 Baseline Characteristics A total of 257 patients met the inclusion and exclusion criteria and were included in the final analysis for predicting the risk of acute respiratory failure (ARF) within 48 hours of admission for community-acquired pneumonia (CAP). The median age was 76.0 years (IQR: 68.0–84.0), and 145 (56.4%) were male. Among them, 148 patients (57.6%) developed ARF within 48 hours of admission. Baseline characteristics are summarized in Table 1 . View this table: View inline View popup Table 1. Baseline characteristics. Regarding vital signs, patients in the ARF group (positive group) had a significantly higher respiratory rate than those in the non-ARF group (negative group) (21.0 vs. 18.0 breaths/min, p < 0.001), and heart rate was also significantly higher in the ARF group (103.5 vs. 91.0 beats/min, p < 0.001). In laboratory parameters, the ARF group had significantly higher levels of lactate dehydrogenase (268 vs. 232 U/L, p = 0.025), lower levels of immunoglobulin (26.85 vs. 28.00 g/L, p = 0.050), and elevated D-dimer (1.36 vs. 0.90 mg/L, p = 0.036). Inflammatory markers including IL-1β (5.67 vs. 2.44 pg/mL, p < 0.001) and TNF-α (3.40 vs. 1.16 pg/mL, p < 0.001) were significantly higher in the ARF group. No significant differences were observed between the two groups regarding baseline comorbidities. 4.2 Model Development To identify key predictive features associated with acute respiratory failure (ARF) within 48 hours of admission, Least Absolute Shrinkage and Selection Operator (LASSO) regression was applied to all candidate variables ( Figure 1A and 1B ). LASSO addresses multicollinearity and prevents overfitting by penalizing less informative variables, effectively shrinking their coefficients toward zero. At the optimal regularization parameter (λ = 0.045), LASSO selected eight features: respiratory rate, tumor necrosis factor-α (TNF-α), pleural effusion, temperature, interleukin-1 β (IL-1β), heart rate, total bilirubin, and interleukin-8 (IL-8). These features were then entered into a multivariable logistic regression (MLR) model to adjust for potential confounders. The final MLR model retained six predictors: respiratory rate, TNF-α, pleural effusion, temperature, IL-1β, and heart rate. Download figure Open in new tab Figure 1A. illustrates the variation in binomial deviance across different levels of regularization strength (Log(λ)) during lasso regression model training using 10-fold cross-validation. The red dots represent the mean deviance at each λ value, while the grey error bars indicate the corresponding standard errors. The blue dashed line marks the X value that minimizes the mean deviance {lambda.min = 0.045), indicating the model with the optimal performance on the validation set. Download figure Open in new tab Figure 1B. Coefficient paths in Lasso regression under varying values of the regularization parameter λ, with the x-axis representing the logarithm of λ (Log Lambda). Each curve corresponds to the trajectory of a predictor’s coefficient as λ changes. As λ increases (moving leftward), more coefficients aregradually shrunk toward zero. To leverage the ability of machine learning (ML) algorithms to capture complex nonlinear interactions among variables, we trained five ML models using the full feature set: k-nearest neighbors (KNN), support vector machine (SVM), extreme gradient boosting (XGBoost), Light Gradient Boosting Machine (LightGBM), and random forest (RF). Model performance in both training and test datasets is presented in Figure 2A and 2B . Download figure Open in new tab Figure 2A. ROC Curves for Different Models on the Training Set. This figure shows the Receiver Operating Characteristic (ROC) curves for six classification models evaluated on the training set. The x-axis represents 1 – specificity (false positive rate), and the y-axis represents sensitivity (true positive rate). Each colored curve corresponds to a specific model, with the Area Under the ROC Curve (AUROC) values listed in the legend. The models with the highest performance were Random Forest (AUROC = 0.945), SVM (AUROC = 0.929), and XGBoost (AUROC = 0.858). Download figure Open in new tab Figure 2B displays the ROC curves of each model evaluated on the test set. Compared to the training results, all models showed a decrease in AUROC values on the test set, which is a common occurrence when assessing model generalization. Among them, LightGBM (AUROC = 0. 786), XGBoost (AUROC = 0. 781), and multiple logistic regression (MLR, AUROC = 0. 771) achieved the best performance. The reductions in AUROC for these models were all less than 10%compared to their corresponding training set values, indicating good model fitting. In the training set, the top-performing models were Random Forest (AUROC = 0.945), followed by SVM (AUROC = 0.929), and XGBoost (AUROC = 0.858). In the test set, performance declines were less than 10% for all models, suggesting good generalizability. The best-performing models in the test set were LightGBM (AUROC = 0.786), XGBoost (AUROC = 0.781), and MLR (AUROC = 0.771). To evaluate the clinical utility of these models across different risk thresholds, decision curve analysis (DCA) was performed on the top three models in the test set ( Figure 3A ). Across most threshold ranges, all three models demonstrated superior net benefit compared to the “treat all” and “treat none” strategies, with comparable performance among the models, thereby supporting their utility in risk-based clinical decision-making. Download figure Open in new tab Figure 3A. This figure illustrates the standardized net benefit of multiple logistic regression (MLR), XGBoost, and LightGBM across a range of high-risk threshold probabilities. The x-axis represents the threshold for classifying individuals as high risk, with the corresponding cost-benefit ratios shown below. The y-axis shows the standardized net benefit. The “All” curve assumes all individuals are treated as high risk, while the “None” line indicates no individuals are treated. Across most ranges of risk thresholds, the net benefits of all three models exceed those of the “All” and “None” strategies, andtheir net benefit curves are generally similar. Download figure Open in new tab Figure 3B The plot shows the calibration performance of the LightGBM, XGBoost, and multiple logistic regression (MLR) models, comparing predicted probabilities with observed event rates. The x-axis represents the predicted probability of an event, while the y-axis indicates the actual observed event rate. The dashed diagonal line represents perfect calibration, where predicted probabilities exactly match observed outcomes. The MLR and LightGBM models demonstrate better agreement between predicted and observed probabilities on the test set, indicating superior calibration. In contrast, the XGBoost model shows noticeable deviation in the high-probability range, suggesting potential overestimationin those regions. Download figure Open in new tab Figure 3C. Calibration performance of the original XGBoost model (orange) and the Platt-scaled XGBoost model (blue) across different predicted probability intervals. After Platt scaling, the calibration of XGBoostl improved notably across all probability ranges, with the blue curve aligning more closely with the ideal calibration line. Calibration performance was assessed by plotting calibration curves for the LightGBM, MLR, and XGBoost models ( Figure 3B ). The MLR and LightGBM models exhibited relatively smooth and well-aligned calibration curves. In contrast, the XGBoost model showed greater variability and substantial deviations, particularly in the high predicted probability range. To correct calibration bias in the XGBoost model, post hoc calibration was performed using Platt scaling—a logistic regression-based method. Because tree-based ensemble models such as XGBoost are prone to overfitting, especially in small datasets, Platt scaling helps by fitting a logistic function to the predicted scores. The recalibrated XGBoost model demonstrated a notably improved calibration curve, particularly in high-risk predictions, aligning more closely with the ideal reference line ( Figure 3C ), thereby reducing overprediction. Based on these findings, LightGBM, MLR, and the calibrated XGBoost model were selected for ensemble modeling using a weighted averaging strategy. This approach was motivated by several considerations:First, each model contributes distinct strengths. Tree-based models (LightGBM and XGBoost) excel at capturing nonlinear relationships, while MLR offers high interpretability and robust performance with linear associations.By combining models of different types, the ensemble captures a broader range of data patterns and compensates for the individual limitations of each method.Ensemble learning also enhances robustness against performance degradation caused by distributional shifts.Finally, given the relatively small sample size, a simple weighted averaging method was chosen to reduce computational complexity and mitigate overfitting, while maintaining strong predictive performance. The weighted ensemble model was constructed by integrating predictions from LightGBM, MLR, and the recalibrated XGBoost model. Figure 4A presents the receiver operating characteristic (ROC) curves for the ensemble and its three constituent models. The ensemble achieved an AUROC of 0.792 (95% CI: 0.682– 0.897), with an accuracy of 0.75 (95% CI: 0.637–0.842), sensitivity of 0.813, specificity of 0.705, positive predictive value (PPV) of 0.667, and negative predictive value (NPV) of 0.838. Calibration performance of the ensemble and base models is shown in Figure 4B . A comparison of predictive performance metrics across all four models on the test set is provided in Table 2 . Download figure Open in new tab Figure 4A. ROC curve comparison of the ensemble model and base models on the test set. The plot displays the receiver operating characteristic (ROC) curves for LightGBM (purple), multiple logistic regression (MLR, green), Platt-calibrated XGBoost (blue), and their ensemble model (red). The ensemble model (red curve) outperforms each individual model overall, with an AUC of 0.792. Download figure Open in new tab Figure 4B. Calibration curve comparison of the ensemble model and base models on the test set. The figure shows the observed event rates across different predicted probability intervals for the ensemble model (red), LightGBM (purple), multiple logistic regression (MLR, green), and Platt-calibrated XGBoost (blue). The ensemble model demonstrates better or comparable calibration performance across multiple probability intervals compared to the individual models. View this table: View inline View popup Table 2. Performance of the ARF risk prediction models in the CAP testing Cohort. 4.3 Model Interpretability To improve the interpretability of the ensemble model and identify key features associated with the onset of acute respiratory failure (ARF) within 48 hours of hospital admission in patients with community-acquired pneumonia (CAP), SHapley Additive exPlanations (SHAP) values were calculated. SHAP values offer both individual-level interpretability and global insights into feature importance and the directional impact of each variable on model predictions. By ranking the mean absolute SHAP values, we identified the top ten most influential features contributing to the ensemble model’s predictions, as illustrated in Figure 5A. Respiratory rate was the most important predictor, followed by tumor necrosis factor-α (TNF-α), interleukin-1β (IL-1β), heart rate, and pleural effusion. Additional key features included body temperature, total bilirubin, serum calcium, albumin-to-globulin ratio, and platelet count. A SHAP beeswarm plot (Figure 5B) visualizes the distribution of SHAP values for the top 10 features, showing their influence on individual predictions. Higher SHAP values reflect a stronger positive contribution to the predicted risk of ARF, while lower SHAP values indicate a negative association. An increased respiratory rate was consistently linked to higher SHAP values, significantly elevating the predicted ARF risk—highlighting its role as a crucial early warning sign. Similarly, elevated levels of TNF-α and IL-1β were strongly associated with increased risk, suggesting that heightened inflammatory activity may play a central role in the pathogenesis of early respiratory failure. Elevated heart rate, body temperature, and the presence of pleural effusion also contributed positively to the predicted likelihood of ARF. 5. Discussion In this study, we developed and validated a multi-model, weighted ensemble prediction tool to assess the risk of acute respiratory failure (ARF) within 48 hours of hospital admission in patients with community-acquired pneumonia (CAP). By integrating XGBoost, LightGBM, and multivariable logistic regression—with post hoc calibration applied to the XGBoost model—the ensemble approach achieved superior predictive performance (AUC = 0.792), consistent calibration, and strong clinical decision-support capabilities. Additionally, interpretability was enhanced using SHapley Additive exPlanations (SHAP), which improved the model’s transparency and clinical applicability. Based on an in-depth analysis of our findings, several key conclusions can be drawn. The ensemble model outperformed individual base learners in terms of both accuracy and robustness. By leveraging the complementary strengths of different algorithms and balancing feature-level biases, the weighted ensemble approach improved overall predictive capability. Respiratory rate emerged as the most important predictor of ARF in CAP patients, followed by the inflammatory markers tumor necrosis factor-α (TNF-α) and interleukin-1β (IL-1β). Elevated respiratory rate, along with increased levels of TNF-α and IL-1β, was positively associated with ARF risk. Other relevant predictors included heart rate, pleural effusion, and body temperature, whereas total bilirubin, serum calcium, albumin-to-globulin ratio (AGR), and platelet count contributed less to model prediction. Our findings regarding the predictive importance of respiratory rate and heart rate are consistent with prior studies. In our cohort, patients who developed ARF had significantly higher respiratory rates (21.0 vs. 18.0 breaths/min, p < 0.001) and heart rates (103.5 vs. 91.0 bpm, p < 0.001) compared to those without ARF. Lyu et al. employed machine learning models to predict ARF in critically ill pneumonia patients in the ICU and similarly identified respiratory rate as a key feature [ 10 ]. Wang et al. developed a model for early ARF prediction in septic patients and also confirmed respiratory rate as an independent risk factor [ 11 ]. Elevated respiratory rate is often a compensatory response to hypoxemia, and a high rate at admission may serve as an early warning sign of oxygen deficiency. Bendavid et al. likewise found that both respiratory and heart rates were significant predictors of ARF in patients with COVID-19 [ 12 ]. In our study, TNF-α and IL-1β also emerged as critical inflammatory biomarkers associated with ARF risk. TNF-α is a potent pro-inflammatory cytokine that is activated early during infection and regulates a wide range of immune responses, including apoptosis, fever induction, and acute-phase protein synthesis. Lee et al. reported significantly higher TNF-α levels in both serum and bronchoalveolar lavage fluid (BALF) among ICU patients with fatal CAP compared to survivors, underscoring its association with disease severity and mortality [ 13 ]. Bacci et al. further validated these findings, noting elevated TNF-α concentrations in patients requiring mechanical ventilation, those with acute kidney injury (AKI), ICU admission, high CRB scores, and early mortality (<7 days) [ 14 ]. Similarly, IL-1β plays a central role in acute inflammatory responses and has shown promise as a prognostic biomarker. Secreted by macrophages, dendritic cells, and endothelial cells, IL-1β promotes immune cell recruitment and amplifies local inflammation through the stimulation of other cytokines. While Lee et al. did not observe significant differences in overall IL-1β levels between survivors and non-survivors, elevated BALF IL-1β concentrations were found in CAP patients with ARDS who did not survive, suggesting its role in localized pulmonary inflammation [ 13 ]. Bacci et al. also linked IL-1β with ARDS and early mortality, particularly in patients with high CRB scores [ 14 ]. Moreover, IL-1β has been associated with CAP-related complications such as pleural effusion and systemic inflammatory response syndrome (SIRS) [ 15 ]. A pediatric study also demonstrated that high IL-1β levels were associated with the need for pleural drainage in cases of pneumonia [ 16 ]. Collectively, these findings support the utility of IL-1β as a potential early biomarker for ARF risk stratification in CAP. Pleural effusion has long been recognized as a critical factor influencing clinical outcomes in patients with community-acquired pneumonia (CAP). As a common complication of pneumonia, pleural effusion is associated with adverse outcomes, including prolonged hospital stays [ 18 ], increased risk of respiratory failure, and a higher likelihood of requiring mechanical ventilation [ 12 , 17 – 20 ]. It often reflects extensive pleural involvement, leading to lung compression and impaired expansion, thereby increasing the likelihood of ARF. In hypoxemic patients, pleural effusion can exacerbate oxygenation impairment. Notably, pleural effusion frequently precedes significant declines in oxygenation indices, providing a potential window for early risk identification. Additional predictors identified in our analysis included body temperature, total bilirubin (TBIL), serum calcium, albumin-to-globulin ratio (AGR), and platelet count. Fever represents a host defense response that can enhance immune function [ 21 ]; however, excessive hyperthermia may adversely affect the cardiovascular, respiratory, and nervous systems and has been associated with increased mortality [ 22 ]. High fever (≥39.5°C) has been linked to poorer outcomes, likely due to increased metabolic demand, cardiovascular stress, and elevated oxygen consumption [ 23 ]. TBIL, a commonly used marker of liver function, also possesses antioxidant and anti-inflammatory properties. Nonetheless, elevated TBIL levels have been associated with worse outcomes in patients with sepsis, COVID-19, and other critical illnesses [ 24 – 26 ]. High TBIL may reflect impaired hepatic clearance, systemic inflammation, increased apoptosis, and oxidative stress, all of which can contribute to pulmonary injury and the development of ARF [ 27 , 28 ]. Abnormal serum calcium levels have been associated with poor prognosis and increased mortality in various conditions [ 29 – 33 ]. Hypocalcemia may lead to ARF through mechanisms such as muscle weakness, laryngospasm, or bronchospasm, whereas severe hypercalcemia can result in somnolence, confusion, or coma, ultimately precipitating respiratory failure [ 30 ]. Albumin and globulin, as major plasma proteins, reflect nutritional and immune status, respectively[ 34 ]. The albumin-to-globulin ratio (AGR) is considered a more robust prognostic indicator than either component alone. Abnormal AGR has been associated with unfavorable outcomes in several clinical contexts [ 35 – 37 ], and it may serve as an independent predictor of prognosis in both pneumonia and ARF [ 38 , 39 ]. Our analysis also revealed that elevated platelet counts were significantly associated with an increased risk of ARF. Excessive platelet activation can promote thrombosis, reduce pulmonary perfusion, and contribute to respiratory failure [ 40 ]. High platelet counts may reflect underlying systemic inflammation and coagulation imbalance, both of which are implicated in ARF pathogenesis. In CAP—particularly in pneumococcal infections—platelet activation has also been linked to cardiovascular complications such as myocardial infarction and stroke [ 41 ]. Despite the promising results, several limitations must be acknowledged. First, this was a retrospective, single-center study conducted at Beijing Chaoyang Hospital, which may introduce selection bias. The relatively small sample size (n = 257) and geographic limitation may reduce the generalizability of our findings. Second, the analysis was restricted to clinical data collected within the first 48 hours of admission, without longitudinal follow-up. As a result, dynamic changes in clinical status—such as treatment response or evolving vital signs—were not captured. Third, the model was only internally validated; external validation using larger, multi-center datasets is necessary to confirm its reliability and broader applicability. 6. Conclusion This study developed a multi-model ensemble-based clinical prediction tool to evaluate the risk of acute respiratory failure (ARF) within 48 hours of hospital admission in patients with community-acquired pneumonia (CAP). Model interpretability based on SHAP (SHapley Additive exPlanations) highlighted the pivotal roles of clinical features such as respiratory rate, inflammatory markers (TNF-α and IL-1β), and heart rate in predicting ARF. The proposed model is well-suited for early risk stratification and personalized decision support in hospitalized CAP patients. 7. Declarations Abbreviations: T, temperature; SBP, systolic blood pressure; DBP, diastolic blood pressure; Lac, lactate; AST, aspartate aminotransferase; ALT, alanine aminotransferase; LDH, lactate dehydrogenase; TG, triglycerides; TBIL, total bilirubin; DBIL, direct bilirubin; Alb, albumin; Glb, globulin; BUN, blood urea nitrogen; Na, serum sodium; K, serum potassium; Ca, serum calcium; P, serum phosphorus; Glu, glucose; Nt_BNP, N-terminal pro-brain natriuretic peptide; PT, prothrombin time; APTT, activated partial thromboplastin time; INR, international normalized ratio; WBC, white blood cell count; NEUT%, neutrophil percentage; RBC, red blood cell count; HCT, hematocrit; Hb, hemoglobin; Plt, platelet count; AG_Ratio, albumin-to-globulin ratio; CRP, C-reactive protein; PCT, procalcitonin; IL, interleukin; TNF, tumor necrosis factor; GCS, Glasgow Coma Scale.MLR:multivariable logistic regression model.LightGBM:Light Gradient Boosting Machine.Cal_XGBoost:calibrated Extreme Gradient Boosting.AUROC:area under the receiver operating characteristic curve.PPV: positive predictive value.NPV: negative predictive value. Ethics approval and consent to participate The study has been approved by the Ethics Committee of Beijing Chaoyang Hospital, affiliated with Capital Medical University. Based on the committee’s review, the research uses only anonymized data and does not involve direct human participation. Therefore, the Ethics Committee has waived the requirement for written informed consent. The study adheres to the ethical principles outlined in the Declaration of Helsinki. Consent for publication Not Applicable. Availability of data and materials The datasets used and analysed during the current study available from the corresponding author on reasonable request. Competing Interests No conflict of interest is declared by all the authors. Funding Not Applicable. Authors’ contributions YLX Contributed to data curation, conceptualization, data analysis, and manuscript writing. YC and QL Contributed to methodology and data curation. ADL Contributed to methodology. XM reviewed the initial draft. SBG Supervised and reviewed the manuscript. All authors approved the final manuscript and are responsible for its content. Data Availability The datasets used and analysed during the current study available from the corresponding author on reasonable request. Acknowledgements The authors would like to thank all those who contributed to the completion of this work. References 1. ↵ GBD 2016 Lower Respiratory Infections Collaborators . Estimates of the global, regional, and national morbidity, mortality, and aetiologies of lower respiratory infections in 195 countries, 1990-2016: a systematic analysis for the Global Burden of Disease Study 2016 . Lancet Infect Dis . 2018 ; 18 ( 11 ): 1191 – 1210 . doi: 10.1016/S1473-3099(18)30310-4 OpenUrl CrossRef PubMed 2. ↵ Vanoni NM , Carugati M , Borsa N , et al. Management of Acute Respiratory Failure Due to Community-Acquired Pneumonia: A Systematic Review . Med Sci (Basel ). 2019 ; 7 ( 1 ): 10 . doi: 10.3390/medsci7010010 OpenUrl CrossRef PubMed 3. ↵ Woodhead M , Welch CA , Harrison DA , Bellingan G , Ayres JG . Community-acquired pneumonia on the intensive care unit: secondary analysis of 17,869 cases in the ICNARC Case Mix Programme Database . Crit Care . 2006 ; 10 Suppl 2( Suppl 2 ): S1 . doi: 10.1186/cc4927 OpenUrl CrossRef 4. ↵ Aliberti S , Dela Cruz CS , Amati F , Sotgiu G , Restrepo MI . Community-acquired pneumonia . Lancet . 2021 ; 398 ( 10303 ): 906 – 919 . doi: 10.1016/S0140-6736(21)00630-9 OpenUrl CrossRef PubMed 5. ↵ McMorris T , Hale BJ , Barwood M , Costello J , Corbett J . Effect of acute hypoxia on cognition: A systematic review and meta-regression analysis . Neurosci Biobehav Rev . 2017 ; 74 (Pt A ): 225 – 232 . doi: 10.1016/j.neubiorev.2017.01.019 OpenUrl CrossRef PubMed 6. ↵ Gong F , Ai Y , Zhang L , Peng Q , Zhou Q , Gui C . Relationship between PaO2/FiO2 and delirium in intensive care: A cross-sectional study . J Intensive Med . 2023 ; 3 ( 1 ): 73 – 78 . doi: 10.1016/j.jointm.2022.08.002 OpenUrl CrossRef PubMed 7. ↵ Brummel NE , Balas MC , Morandi A , Ferrante LE , Gill TM , Ely EW . Understanding and reducing disability in older adults following critical illness . Crit Care Med . 2015 ; 43 ( 6 ): 1265 – 1275 . doi: 10.1097/CCM.0000000000000924 OpenUrl CrossRef PubMed 8. ↵ Hosni M , Abnane I , Idri A , Carrillo de Gea JM , Fernández Alemán JL . Reviewing ensemble classification methods in breast cancer . Comput Methods Programs Biomed . 2019 ; 177 : 89 – 112 . doi: 10.1016/j.cmpb.2019.05.019 OpenUrl CrossRef PubMed 9. ↵ Wong AKI , Cheung PC , Kamaleswaran R , Martin GS , Holder AL . Machine Learning Methods to Predict Acute Respiratory Failure and Acute Respiratory Distress Syndrome . Front Big Data . 2020 ; 3 : 579774 . doi: 10.3389/fdata.2020.579774 OpenUrl CrossRef PubMed 10. ↵ Lyu G , Nakayama M . Prediction of respiratory failure risk in patients with pneumonia in the ICU using ensemble learning models . PLoS One . 2023 ; 18 ( 9 ): e0291711 . doi: 10.1371/journal.pone.0291711 OpenUrl CrossRef PubMed 11. ↵ Wang B , Chen J , Wang M . Establishment and validation of a predictive model for respiratory failure within 48 h following admission in patients with sepsis: a retrospective cohort study . Front Physiol . 2023 ; 14 : 1288226 . doi: 10.3389/fphys.2023.1288226 OpenUrl CrossRef PubMed 12. ↵ Bendavid I , Statlender L , Shvartser L , et al. A novel machine learning model to predict respiratory failure and invasive mechanical ventilation in critically ill patients suffering from COVID-19 . Sci Rep . 2022 ; 12 ( 1 ): 10573 . doi: 10.1038/s41598-022-14758-x OpenUrl CrossRef 13. ↵ Lee YL , Chen W , Chen LY , et al. Systemic and bronchoalveolar cytokines as predictors of in-hospital mortality in severe community-acquired pneumonia . J Crit Care . 2010 ; 25 ( 1 ): 176 .e7-13. doi: 10.1016/j.jcrc.2009.05.002 OpenUrl CrossRef 14. ↵ Bacci MR , Leme RCP , Zing NPC , et al. IL-6 and TNF-α serum levels are associated with early death in community-acquired pneumonia patients . Braz J Med Biol Res . 2015 ; 48 ( 5 ): 427 – 432 . doi: 10.1590/1414-431X20144402 OpenUrl CrossRef PubMed 15. ↵ San José ME , Ferreiro L , Soneira ME , et al. Utility of measurement of interleukin-1ß and interleukin-8 in the diagnosis of complicated parapneumonic pleural effusions . Am J Clin Pathol . 2014 ; 142 ( 4 ): 467 – 473 . doi: 10.1309/AJCPDC7PS8TIPBXP OpenUrl CrossRef PubMed 16. ↵ Korkmaz MF , Güzel A , Açıkgöz M , Okuyucu A , Alaçam H . Reliability of Pro-adrenomedullin and Interleukin 1β in Predicting Severity of Community-Acquired Pneumonia in Pediatric Patients . Ann Clin Lab Sci . 2018 ; 48 ( 1 ): 81 – 89 . OpenUrl Abstract / FREE Full Text 17. ↵ Fine MJ , Auble TE , Yealy DM , et al. A prediction rule to identify low-risk patients with community-acquired pneumonia . N Engl J Med . 1997 ; 336 ( 4 ): 243 – 250 . doi: 10.1056/NEJM199701233360402 OpenUrl CrossRef PubMed Web of Science 18. ↵ Fimognari FL , De Vincentis A , Arone A , Baffa Bellucci F , Ricchio R , Antonelli Incalzi R . Clinical outcomes and phenotypes of respiratory failure in older subjects admitted to an acute care geriatric hospital ward . Intern Emerg Med . 2024 ; 19 ( 5 ): 1359 – 1367 . doi: 10.1007/s11739-024-03625-4 OpenUrl CrossRef PubMed 19. Wang Y , Huang L , Qian J , et al. Clinical profile and risk factors for respiratory failure in children with Mycoplasma pneumoniae infection . Biomol Biomed . Published online January 22, 2025 . doi: 10.17305/bb.2024.11641 OpenUrl CrossRef 20. ↵ Kim SH , Lee E , Song ES , Lee YY . Clinical Significance of Pleural Effusion in Mycoplasma pneumoniae Pneumonia in Children . Pathogens . 2021 ; 10 ( 9 ): 1075 . doi: 10.3390/pathogens10091075 OpenUrl CrossRef PubMed 21. ↵ Young PJ , Saxena M , Beasley R , et al. Early peak temperature and mortality in critically ill patients with or without infection . Intensive Care Med. Published online January 31 , 2012 . doi: 10.1007/s00134-012-2478-3 OpenUrl CrossRef 22. ↵ Greer DM , Funk SE , Reaven NL , Ouzounelli M , Uman GC . Impact of fever on outcome in patients with stroke and neurologic injury: a comprehensive meta-analysis . Stroke . 2008 ; 39 ( 11 ): 3029 – 3035 . doi: 10.1161/STROKEAHA.108.521583 OpenUrl Abstract / FREE Full Text 23. ↵ Marcusohn E , Gibory I , Miller A , Lipsky AM , Neuberger A , Epstein D . The association between the degree of fever as measured in the emergency department and clinical outcomes of hospitalized adult patients . Am J Emerg Med . 2022 ; 52 : 92 – 98 . doi: 10.1016/j.ajem.2021.11.045 OpenUrl CrossRef PubMed 24. ↵ Zhai R , Sheu CC , Su L , et al. Serum bilirubin levels on ICU admission are associated with ARDS development and mortality in sepsis . Thorax . 2009 ; 64 ( 9 ): 784 – 790 . doi: 10.1136/thx.2009.113464 OpenUrl Abstract / FREE Full Text 25. Yang ZX , Lv XL , Yan J . Serum Total Bilirubin Level Is Associated With Hospital Mortality Rate in Adult Critically Ill Patients: A Retrospective Study . Front Med (Lausanne ). 2021 ; 8 : 697027 . doi: 10.3389/fmed.2021.697027 OpenUrl CrossRef PubMed 26. ↵ Ding ZY , Li GX , Chen L , et al. Association of liver abnormalities with in-hospital mortality in patients with COVID-19 . J Hepatol . 2021 ; 74 ( 6 ): 1295 – 1302 . doi: 10.1016/j.jhep.2020.12.012 OpenUrl CrossRef PubMed 27. ↵ Strnad P , Tacke F , Koch A , Trautwein C . Liver - guardian, modifier and target of sepsis . Nat Rev Gastroenterol Hepatol . 2017 ; 14 ( 1 ): 55 – 66 . doi: 10.1038/nrgastro.2016.168 OpenUrl CrossRef PubMed 28. ↵ Ruan Z , Li D , Chen X , Qiu Z . Association of serum total bilirubin and potential predictors with mortality in acute respiratory failure: A retrospective cohort study . Heart Lung . 2023 ; 57 : 12 – 18 . doi: 10.1016/j.hrtlng.2022.08.006 OpenUrl CrossRef PubMed 29. ↵ Tao RJ , Luo XL , Xu W , et al. Viral infection in community acquired pneumonia patients with fever: a prospective observational study . J Thorac Dis . 2018 ; 10 ( 7 ): 4387 – 4395 . doi: 10.21037/jtd.2018.06.33 OpenUrl CrossRef PubMed 30. ↵ Dai J , Guo Y , Zhou Q , Duan XJ , Shen J , Zhang X . The relationship between red cell distribution width, serum calcium ratio, and in-hospital mortality among patients with acute respiratory failure: A retrospective cohort study of the MIMIC-IV database . Medicine (Baltimore ). 2024 ; 103 ( 15 ): e37804 . doi: 10.1097/MD.0000000000037804 OpenUrl CrossRef PubMed 31. Bennouar S , Cherif AB , Kessira A , Bennouar DE , Abdi S . Vitamin D Deficiency and Low Serum Calcium as Predictors of Poor Prognosis in Patients with Severe COVID-19 . J Am Coll Nutr . 2021 ; 40 ( 2 ): 104 – 110 . doi: 10.1080/07315724.2020.1856013 OpenUrl CrossRef 32. Zhao J , Liu M , Yu D , Zhang Y . Serum calcium and mortality in pediatric pneumonia patients admitted to the PICU: a retrospective cohort study . Sci Rep . 2024 ; 14 ( 1 ): 18683 . doi: 10.1038/s41598-024-69885-4 OpenUrl CrossRef PubMed 33. ↵ Fatima J , Shukla V , Siddiqi Z , Kumar D , Mateen S , Gupta AB . Correlation of Serum Calcium with Severity and Outcomes in Patients of COVID-19 Pneumonia . J Family Med Prim Care . 2024 ; 13 ( 4 ): 1421 – 1427 . doi: 10.4103/jfmpc.jfmpc_1595_23 OpenUrl CrossRef PubMed 34. ↵ Yang D , Shen J , Huang H , et al. Elevated Albumin to Globulin Ratio on Day 7 is Associated with Improved Function Outcomes in Acute Ischemic Stroke Patients with Intravenous Thrombolysis . J Inflamm Res . 2022 ; 15 : 2695 – 2705 . doi: 10.2147/JIR.S347026 OpenUrl CrossRef PubMed 35. ↵ Peng F , Sun L , Chen T , et al. Albumin-globulin ratio and mortality in patients on peritoneal dialysis: a retrospective study . BMC Nephrol . 2020 ; 21 ( 1 ): 51 . doi: 10.1186/s12882-020-1707-1 OpenUrl CrossRef PubMed 36. Choe H , Kamono E , Abe K , et al. Accuracy of Albumin, Globulin, and Albumin-Globulin Ratio for Diagnosing Periprosthetic Joint Infection: A Systematic Review and Meta-Analysis . J Clin Med . 2023 ; 12 ( 24 ): 7512 . doi: 10.3390/jcm12247512 OpenUrl CrossRef PubMed 37. ↵ Roberts WS , Delladio W , Price S , Murawski A , Nguyen H . The efficacy of albumin-globulin ratio to predict prognosis in cancer patients . Int J Clin Oncol . 2023 ; 28 ( 9 ): 1101 – 1111 . doi: 10.1007/s10147-023-02380-4 OpenUrl CrossRef PubMed 38. ↵ Ulloque-Badaracco JR , Mosquera-Rojas MD , Hernandez-Bustamante EA , Alarcón-Braga EA , Herrera-Añazco P , Benites-Zapata VA . Prognostic value of albumin-to-globulin ratio in COVID-19 patients: A systematic review and meta-analysis . Heliyon . 2022 ; 8 ( 5 ): e09457 . doi: 10.1016/j.heliyon.2022.e09457 OpenUrl CrossRef 39. ↵ Chen L , Xu M , Huang Q , Liu Y , Ren W . Clinical significance of albumin to globulin ratio among patients with stroke-associated pneumonia . Front Nutr . 2022 ; 9 : 970573 . doi: 10.3389/fnut.2022.970573 OpenUrl CrossRef PubMed 40. ↵ Zamani Rarani F , Zamani Rarani M , Hamblin MR , Rashidi B , Hashemian SMR , Mirzaei H . Comprehensive overview of COVID-19-related respiratory failure: focus on cellular interactions . Cell Mol Biol Lett . 2022 ; 27 ( 1 ): 63 . doi: 10.1186/s11658-022-00363-3 OpenUrl CrossRef PubMed 41. ↵ Feldman C , Anderson R . Platelets and Their Role in the Pathogenesis of Cardiovascular Events in Patients With Community-Acquired Pneumonia . Front Immunol . 2020 ; 11 : 577303 . doi: 10.3389/fimmu.2020.577303 OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted November 09, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Development of a Multi-Model Ensemble Tool for Early Prediction of 48-Hour Respiratory Failure Risk in CAP Patients Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Development of a Multi-Model Ensemble Tool for Early Prediction of 48-Hour Respiratory Failure Risk in CAP Patients Yali Xu , Shubin Guo , Ying Chen , Andong Li , Qi Lyu , Xue Mei medRxiv 2025.11.06.25339737; doi: https://doi.org/10.1101/2025.11.06.25339737 Share This Article: Copy Citation Tools Development of a Multi-Model Ensemble Tool for Early Prediction of 48-Hour Respiratory Failure Risk in CAP Patients Yali Xu , Shubin Guo , Ying Chen , Andong Li , Qi Lyu , Xue Mei medRxiv 2025.11.06.25339737; doi: https://doi.org/10.1101/2025.11.06.25339737 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Emergency Medicine Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (300) Cardiovascular Medicine (4435) Dentistry and Oral Medicine (444) Dermatology (382) Emergency Medicine (608) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1509) Epidemiology (15229) Forensic Medicine (30) Gastroenterology (1124) Genetic and Genomic Medicine (6600) Geriatric Medicine (668) Health Economics (997) Health Informatics (4536) Health Policy (1368) Health Systems and Quality Improvement (1613) Hematology (541) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15916) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (146) Nephrology (667) Neurology (6599) Nursing (346) Nutrition (998) Obstetrics and Gynecology (1144) Occupational and Environmental Health (957) Oncology (3332) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (663) Pediatrics (1693) Pharmacology and Therapeutics (691) Primary Care Research (711) Psychiatry and Clinical Psychology (5447) Public and Global Health (9232) Radiology and Imaging (2198) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (593) Sexual and Reproductive Health (712) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a00aded9edf8ee10',t:'MTc3OTYxMDcxNQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-05-23T02:00:01.238055+00:00
License: CC-BY-4.0