<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e65585</article-id><article-id pub-id-type="doi">10.2196/65585</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Explainable Machine Learning Framework for Dynamic Monitoring of Disease Prognostic Risk: Retrospective Cohort Study</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Ishikawa</surname><given-names>Tetsuo</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff5">5</xref><xref ref-type="aff" rid="aff6">6</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Shinoda</surname><given-names>Masahiro</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Oya</surname><given-names>Megumi</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff6">6</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ashizaki</surname><given-names>Koichi</given-names></name><degrees>BA</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ota</surname><given-names>Shinichiro</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kamachi</surname><given-names>Kenichi</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sakurada</surname><given-names>Kazuhiro</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Kawakami</surname><given-names>Eiryo</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Shinkai</surname><given-names>Masaharu</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Predictive Medicine Special Project, RIKEN Center for Integrative Medical Sciences, RIKEN</institution><addr-line>1-7-22 Suehiro-cho, Tsurumi-ku</addr-line><addr-line>Yokohama</addr-line><country>Japan</country></aff><aff id="aff2"><institution>Department of Extended Intelligence for Medicine, The Ishii-Ishibashi Laboratory, Keio University School of Medicine</institution><addr-line>Tokyo</addr-line><country>Japan</country></aff><aff id="aff3"><institution>Department of Artificial Intelligence Medicine, Graduate School of Medicine, Chiba University</institution><addr-line>Chiba</addr-line><country>Japan</country></aff><aff id="aff4"><institution>Department of Respiratory Medicine, Tokyo Shinagawa Hospital</institution><addr-line>Tokyo</addr-line><country>Japan</country></aff><aff id="aff5"><institution>Collective Intelligence Research Laboratory, Graduate School of Arts and Sciences, The University of Tokyo</institution><addr-line>Tokyo</addr-line><country>Japan</country></aff><aff id="aff6"><institution>Division of Applied Mathematical Science, RIKEN Center for Interdisciplinary Theoretical and Mathematical Sciences, RIKEN</institution><addr-line>Yokohama</addr-line><country>Japan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Sarvestan</surname><given-names>Javad</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Mete</surname><given-names>Ani</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Kasani</surname><given-names>Payam Hosseinzadeh</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Venkatesh</surname><given-names>S</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Eiryo Kawakami, MD, PhD, Predictive Medicine Special Project, RIKEN Center for Integrative Medical Sciences, RIKEN, 1-7-22 Suehiro-cho, Tsurumi-ku, Yokohama, 230-0045, Japan, 81 45-503-7000; <email>eiryo.kawakami@riken.jp</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>7</day><month>8</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e65585</elocation-id><history><date date-type="received"><day>20</day><month>08</month><year>2024</year></date><date date-type="rev-recd"><day>26</day><month>05</month><year>2025</year></date><date date-type="accepted"><day>28</day><month>05</month><year>2025</year></date></history><copyright-statement>&#x00A9; Tetsuo Ishikawa, Masahiro Shinoda, Megumi Oya, Koichi Ashizaki, Shinichiro Ota, Kenichi Kamachi, Kazuhiro Sakurada, Eiryo Kawakami, Masaharu Shinkai. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 7.8.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2025/1/e65585"/><abstract><sec><title>Background</title><p>Patients&#x2019; clinical status often evolves rapidly after an initial diagnosis, with each patient exhibiting a distinct disease trajectory. As a result, static risk scores fall short in supporting timely interventions&#x2014;an issue highlighted by COVID-19, where deaths have stemmed from heterogeneous pathways such as pneumonia, multiorgan failure, or exacerbation of preexisting conditions.</p></sec><sec><title>Objective</title><p>This study aims to propose a dynamic prognostic risk assessment framework based on longitudinal data collected during hospitalization, using COVID-19 as an example. Our aim was to develop and validate an interpretable framework that (1) screens prognosis at admission and (2) dynamically updates mortality risk throughout hospitalization, thereby providing clinicians with early, explainable warnings while minimizing additional cognitive load.</p></sec><sec sec-type="methods"><title>Methods</title><p>In this retrospective study, we extracted electronic medical records of 382 COVID-19 cases treated at Tokyo Shinagawa Hospital between January 27 and September 30, 2020. At admission, gradient boosting decision trees (Light Gradient Boosting Machine) were used to predict the maximum clinical deterioration, including death, based on data available at initial diagnosis. Model performance was evaluated using the area under the receiver operating characteristic curve (AUC). For in-hospital monitoring, random survival forests (RSF) were trained on a longitudinal dataset that combined static demographic characteristics with serially measured vital signs and laboratory results. The model dynamically assessed daily mortality risk by calculating a 7-day cumulative hazard function, with risk scores recalculated each day during hospitalization. RSF accuracy was evaluated in an independent one-third test set using the concordance index (C-index), an integrated Brier score (1-50 days), and mean time-dependent AUC. SurvSHAP(t), an extension of Shapley Additive Explanations, was applied to provide time-dependent explanations of each variable&#x2019;s contribution to the prediction.</p></sec><sec sec-type="results"><title>Results</title><p>The prediction at initial diagnosis showed good agreement with the actual severity outcomes (AUC of 0.717 for predicting hospitalization/severity &#x2265;2; 0.878 for severity &#x2265;3; 0.951 for severity &#x2265;4; 0.952 for severity &#x2265;5; and 0.970 for death/severity=6), although some cases exhibited discrepancies between the predicted and actual prognoses. The dynamic mortality risk assessment during hospitalization using the RSF achieved a test-set C-index of 0.941, an integrated Brier score of 0.315, and a mean time-dependent AUC of 0.936. This dynamic assessment was able to distinguish between dead and surviving patients as early as 1&#x2010;2 weeks before the outcome. Early in hospitalization, C-reactive protein was an important risk factor for mortality; during the middle period, peripheral oxygen saturation (SpO<sub>2</sub>) gained importance; and immediately before death, platelets and &#x03B2;-D-glucan were the primary risk factors.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Integrating static admission triage with daily, explainable RSF predictions enables early identification of patients with COVID-19 at high risk of deterioration. By surfacing phase-specific, actionable predictors, the framework supports timely interventions and more efficient resource allocation. Prospective, multicenter studies are warranted to validate its generalizability and clinical impact.</p></sec></abstract><kwd-group><kwd>COVID-19</kwd><kwd>prognostic modeling</kwd><kwd>electronic health records</kwd><kwd>time-varying biomarkers</kwd><kwd>clinical decision support</kwd><kwd>interpretable AI</kwd><kwd>random survival forests</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>During hospitalization, various adverse events and complications arise from the disease and its treatment, sometimes leading to death [<xref ref-type="bibr" rid="ref1">1</xref>]. Therefore, health care professionals take great care not to overlook signs of deterioration based on blood tests and vital-sign measurements [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. The recent surge in hospital admissions driven by COVID-19 and population aging has intensified this burden [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Predicting patient outcomes and issuing timely alerts can reduce the burden and enable the advanced preparation of scarce medical resources. To frame the scope of this study, we ask a single overarching question: How can clinicians anticipate deterioration early enough to intervene, while minimizing additional cognitive load?</p><p>The task is complicated by the heterogeneity of risk factors and signs of deterioration, which makes uniform risk assessment challenging, even for patients with the same disease [<xref ref-type="bibr" rid="ref6">6</xref>]. Taking COVID-19 as an example, causes of death range from pneumonia to multiorgan failure and exacerbation of preexisting diseases [<xref ref-type="bibr" rid="ref7">7</xref>]. Detecting such diverse paths to deterioration requires a personalized monitoring strategy that tracks multiple prognostic biomarkers over time. This clinical heterogeneity defines the modeling gap that data-driven methods must fill.</p><p>Recent reports indicate that machine learning models using electronic health records can accurately predict individual deterioration and mortality, thereby aiding health care professionals in clinical decision-making [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. However, most existing prognostic models are trained on static snapshots, struggle to generalize across heterogeneous populations, or fail to provide interpretable insights. While deep learning models applied to longitudinal intensive care unit data can assess risks dynamically [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>], their &#x201C;black-box&#x201D; nature restricts bedside adoption [<xref ref-type="bibr" rid="ref12">12</xref>]. Accordingly, the next generation of prognostic tools must be both dynamic and interpretable to earn clinical trust.</p><p>Real-world deployment adds further hurdles: missing data, irregular sampling, inconsistent documentation, and limited computation resources in busy wards. Methods must therefore be accurate, explainable, and robust to data imperfections, while remaining fast enough for routine use. Taken together, limited interpretability, data-quality issues, and computational constraints form a 3-fold barrier that this work seeks to overcome.</p><p>To address these limitations, we leverage random survival forests (RSFs) to capture time-varying trajectories and pair them with SurvSHAP(t), an extension of Shapley Additive Explanations (SHAP) that provides context-specific, time-dependent rationale [<xref ref-type="bibr" rid="ref13">13</xref>]. In contrast to models that assume linear relationships (eg, Cox proportional hazards), RSF flexibly models nonlinear, time-dependent interactions; SurvSHAP(t) embeds explanation directly alongside prediction, closing the trust gap.</p><p>Building on these insights, we first confirm the predictability of prognosis at initial diagnosis with a machine learning model that anticipates the highest COVID-19 severity from baseline data. We then propose a dynamic prognostic-risk framework that continuously updates survival estimates using longitudinal information (<xref ref-type="fig" rid="figure1">Figure 1</xref>) and visualizes the drivers of individual risk. This 2-stage design&#x2014;static triage at admission followed by dynamic risk updates&#x2014;constitutes the narrative arc of the paper.</p><p>We therefore present an interpretable, dynamic prognostic framework designed to enhance clinicians&#x2019; understanding of patient status, enable precise treatment allocation, and optimize the use of medical resources.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Conceptual diagram illustrating the diversity of pathological changes. In this study, we first assess the ability to predict a patient&#x2019;s maximum COVID-19 severity using data from the initial diagnosis. We then introduce a dynamic prognostic risk assessment framework that continuously monitors hospitalized patients based on their longitudinal data. BP: blood pressure; CRP: C-reactive protein; ECMO: extracorporeal membrane oxygenation; GBDT: gradient boosting decision trees; Plt: platelet.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e65585_fig01.png"/></fig></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design, Setting, and Population</title><p>This retrospective cohort study screened 382 patients with COVID-19 treated between January 2020 and September 2020 at the Department of Respiratory Medicine, Tokyo Shinagawa Hospital. Patients aged under 18 years and those with unknown severity changes during hospitalization or clinical outcomes were excluded from the analysis. This included cases in which the prognosis was unclear because of hospital transfer, observation censoring, or insufficient documentation of the time point at which severity changed. Inpatients with a discrepancy of more than 4 days between the date of first diagnosis and the date of admission were excluded from the prognostic screening but were included in the dynamic risk assessment. The included cases were randomly divided into training and test datasets at a 2:1 ratio using a stratified sampling method to preserve the distribution of severity outcomes.</p><p>For risk classification at initial diagnosis, patients who experienced severity changes were included in the dataset. Overall, 201 outpatients and 161 inpatients were included. We extracted data from the electronic medical records, including 84 variables, such as symptoms, background information, and blood and urine biomarkers, for prognostic screening at initial diagnosis (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>For the dynamic prognostic risk assessment framework, the dataset included 182 inpatients with longitudinal data collected during hospitalization. From the electronic medical records, 72 variables, including blood and urine biomarkers, vital signs, and background information during hospitalization, were extracted for dynamic risk assessment (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). The median length of stay for inpatients was 11 days.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>This study was approved by the local institutional review board of RIKEN and Tokyo Shinagawa Hospital (approval number 20-A-06). It was conducted in accordance with the 1964 Declaration of Helsinki and its later amendments, or comparable ethical standards. The requirement for informed consent was waived because of the retrospective nature of the study. All data used in this study were deidentified before analysis. Specifically, any directly identifiable personal information (eg, names, addresses, or medical record numbers) was removed. The deidentification process adhered to relevant institutional and national data protection guidelines. As the data were not anonymized in the strictest sense, but were instead deidentified with safeguards in place, individual participants cannot be readily identified by the investigators.</p></sec><sec id="s2-3"><title>Severity Classification</title><p>We adopted the oxygen-support status scores proposed by Grein et al [<xref ref-type="bibr" rid="ref14">14</xref>] to classify patient severity. The score uses an ordinal scale from 1 to 6 based on the level of oxygenation: (1) discharged or not hospitalized; (2) room air; (3) low-flow oxygen support; (4) noninvasive intervention, including nasal high-flow oxygen therapy or noninvasive positive pressure ventilation; (5) invasive mechanical ventilation or extracorporeal membrane oxygenation (ECMO); and (6) death. In addition to the original score, where 1 indicated discharge status, outpatients were assigned a score of 1.</p></sec><sec id="s2-4"><title>Machine Learning for Prognostic Classification at Initial Diagnosis</title><p>Gradient boosting decision trees (GBDT) [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>] were used to predict the highest severity from data at initial diagnosis. GBDT is related to random forest and uses boosting to enhance predictive performance. Among various GBDT implementations, the Python package (Python Foundation) Light Gradient Boosting Machine (LightGBM; version 4.5.0) was used because of its superior computing speed. We included all variables with less than 15% missing values, given that COVID-19 severity and mortality are influenced by a wide range of factors. Although 265 biomarkers were recorded at the first visit, most were not measured in nonhospitalized patients. To ensure that the selected biomarkers would be applicable across a broad clinical spectrum, we included only laboratory test variables that were routinely measured in both hospitalized and nonhospitalized (outpatient) patients at the time of initial diagnosis. This approach was intended to support early-stage risk prediction and avoid biasing the model toward inpatient-specific features. Biomarkers available in less than 50% of the patient population were excluded to reduce the impact of missing data on model performance, resulting in 53 biomarkers collected from 4 days before to 1 day after the initial diagnosis. Missing values were imputed using the missForest package (version 1.5) in R (R Foundation) [<xref ref-type="bibr" rid="ref17">17</xref>].</p><p>As a preprocessing step, variables with absolute Spearman correlation coefficients of 0.85 or higher in the training data were excluded, retaining only those with the strongest correlation with severity. While this univariate filtering approach does not account for potential multivariate interactions among features, it was adopted to reduce feature redundancy and multicollinearity, which could otherwise impair the stability and efficiency of model training.</p><p>LightGBM hyperparameters were optimized using Bayesian optimization with repeated cross-validation via Optuna version 4.2.1 [<xref ref-type="bibr" rid="ref18">18</xref>]. We applied the best model to the test dataset to obtain predicted probabilities and plotted the corresponding receiver operating characteristic curve. The area under the receiver operating characteristic curve was calculated to evaluate the predictive performance of the initial diagnosis model for each severity classification. To evaluate the importance of variables in the prediction, we used SHAP values [<xref ref-type="bibr" rid="ref13">13</xref>] for the test data. Importantly, when models were developed for different severity subgroups, hyperparameter optimization and SHAP analysis were performed separately for each group to account for subgroup-specific characteristics.</p><p>To validate the advantage of the selected LightGBM model, we initially implemented and evaluated 5 machine learning algorithms for predicting hospital admission (ie, threshold &#x2265;2): LightGBM, random forest, support vector machine, Elastic Net, and decision tree. Among these, LightGBM and random forest demonstrated the highest predictive performance for binary classification (Figure S1 in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> and Table S3 in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). However, random forest required substantially longer training and inference times. Considering the need for computational efficiency and scalability in clinical applications, we selected LightGBM for subsequent analyses involving higher severity cut-offs.</p></sec><sec id="s2-5"><title>Dynamic Risk Assessment of Mortality During Hospitalization</title><p>We used survival models, including Cox proportional hazards models and RSFs [<xref ref-type="bibr" rid="ref19">19</xref>], to evaluate patient mortality risk during hospitalization. The Cox proportional hazards model analyzes time-to-event data and associated predictors under the proportional hazards assumption. To accommodate a large number of predictors, regularized versions of the Cox model were used, including Cox-LASSO (least absolute shrinkage and selection operator) (L1), Cox-Ridge (L2), and Cox ElasticNet (a combination of L1 and L2 penalties).</p><p>To emulate real-time risk assessment, we implemented a dynamic updating mechanism in which the model recalculates cumulative hazard scores on each day of hospitalization. For each patient, the RSF model is applied iteratively at time points <italic>t</italic>, <italic>t</italic>+1, <italic>t</italic>+2, and so on, using only data observed up to the corresponding time. This time-restricted evaluation prevents data leakage from future observations and allows us to assess how well the model performs when used prospectively in a clinical setting. The RSF estimates the cumulative hazard function (CHF) by aggregating the outputs of multiple survival trees constructed using the random forest algorithm. Like random forest, RSF is robust to outliers and enables accurate risk assessment for event occurrence. To dynamically predict mortality risk, 72 variables were used in the analysis, including background factors (eg, age and BMI), as well as biomarkers and vital signs measured over time during hospitalization. We used variables that were measured in most patients (&#x003E;180 patients for biomarkers and &#x003E;150 patients for background and vital information). Missing values were imputed using the last observation carried forward method; if no prior values were available, continuous variables were filled with the median, and categorical variables with the mode. The Python (Python Foundation) package scikit-survival, which includes implementations of Cox and RSF models, was used for the analysis. To evaluate the dynamic risk of mortality, we used the 7-day CHF (ie, the estimated probability of death within 7 days) calculated using the RSF as an index of mortality risk. The 7-day CHF was calculated for each patient on each day of hospitalization.</p><p>The performance of the survival models was evaluated using 3 metrics: concordance index (C-index), integrated Brier score, and mean cumulative/dynamic AUC (mean AUC).</p><p>In clinical practice, it is important to identify the factors that increase the risk of mortality. The variable importance of the RSF models was calculated for the test data using SurvSHAP(t) [<xref ref-type="bibr" rid="ref20">20</xref>], which provides a time-dependent explanation of the survival function predicted using SHAP. SurvSHAP(t) allowed us to determine how each variable affects the survival function at each time point. We obtained the mean aggregated SurvSHAP(t) across all days of hospitalization, which showed how each variable contributed to the prediction for every patient at every time point.</p></sec><sec id="s2-6"><title>Variable Selection for Dynamic Risk Assessment</title><p>To balance clinical applicability with the computational cost of SurvSHAP(t), we performed variable selection during the RSF training process. First, we trained an RSF model using all 72 variables on the training data and calculated permutation importance scores using the implementation in the scikit-learn Python package. The RSF model was then retrained using the top 10 variables with the highest permutation importance.</p><p>Additional technical details of the machine learning implementation not covered in the main text are presented in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Patient Demographics</title><p>The median age of the 382 patients with COVID-19 was 39 years; 233 were male and 149 were female (<xref ref-type="table" rid="table1">Table 1</xref>). Of the 51 inpatients who required oxygen, 30 required low-flow oxygen, 3 needed high-flow oxygen, 8 were treated with invasive ventilation/ECMO, and 10 died.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Baseline characteristics of patients with COVID-19 by severity outcome.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom" colspan="6">Severity outcome of COVID-19</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">1: Not admitted</td><td align="left" valign="bottom">2: Room air</td><td align="left" valign="bottom">3: Oxygen administration</td><td align="left" valign="bottom">4: Noninvasive ventilation</td><td align="left" valign="bottom">5: ECMO<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>/invasive ventilation</td><td align="left" valign="bottom">6: Death</td></tr></thead><tbody><tr><td align="left" valign="top">Number of cases, n</td><td align="left" valign="top">201</td><td align="left" valign="top">130</td><td align="left" valign="top">30</td><td align="left" valign="top">3</td><td align="left" valign="top">8</td><td align="left" valign="top">10</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">Length of stay (days), </named-content>median (range)</td><td align="left" valign="top">N/A<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">10 (2-52)</td><td align="left" valign="top">20 (11-36)</td><td align="left" valign="top">47 (31-48)</td><td align="left" valign="top">39 (25-73)</td><td align="left" valign="top">23 (12-37)</td></tr><tr><td align="left" valign="top">Age (years), median (range)</td><td align="left" valign="top">34 (18-93)</td><td align="left" valign="top">39 (19-98)</td><td align="left" valign="top">59 (30-93)</td><td align="left" valign="top">70 (68-85)</td><td align="left" valign="top">58 (49-75)</td><td align="left" valign="top">79 (50-94)</td></tr><tr><td align="left" valign="top" colspan="7">Sex, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">75 (37)</td><td align="left" valign="top">60 (46)</td><td align="left" valign="top">9 (30)</td><td align="left" valign="top">2 (67)</td><td align="left" valign="top">2 (25)</td><td align="left" valign="top">1 (10)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">126 (63)</td><td align="left" valign="top">70 (54)</td><td align="left" valign="top">21 (70)</td><td align="left" valign="top">1 (33)</td><td align="left" valign="top">6 (75)</td><td align="left" valign="top">9 (90)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>ECMO: extracorporeal membrane oxygenation.</p></fn><fn id="table1fn2"><p><sup>b</sup>N/A: not applicable.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Prognostic Predictability of COVID-19 at Initial Diagnosis</title><p>To evaluate the predictability of COVID-19 prognosis at initial diagnosis, we constructed prognostic models based on the following information available at that time: symptoms, background information, and biomarkers. Using the severity scale defined by Grein et al [<xref ref-type="bibr" rid="ref14">14</xref>], we assigned a score to each patient at initial presentation and, if hospitalized, at subsequent time points. The highest score observed across these time points was used as the outcome to be predicted. The AUCs represent the performance of the model in predicting whether patients would reach each severity threshold during hospitalization: 0.717 for severity &#x2265;2, 0.878 for &#x2265;3, 0.951 for &#x2265;4, 0.952 for &#x2265;5, and 0.970 for 6 (ie, death), as shown in <xref ref-type="fig" rid="figure2">Figure 2A</xref>. When we examined the concordance between the predicted probability and the actual severity outcome, we found that most patients with an actual severity of &#x2265;3 had a high predicted probability of severity of &#x2265;2. By contrast, patients with an actual severity of 1 or 2 showed a wide distribution of predicted probabilities&#x2014;from low to high&#x2014;indicating no clear distinction between the 2 (<xref ref-type="fig" rid="figure2">Figure 2B</xref>, top panel). For the other predictions, the predicted probabilities and actual severity showed good concordance; however, some cases remained where the severity risk was not accurately determined (eg, patients who ultimately had mild disease but were predicted to have a high risk of severe illness; <xref ref-type="fig" rid="figure2">Figure 2B</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Screening for severity prognosis at the initial diagnosis. (A) Receiver operating characteristic curves and the AUC values for prediction models of severity outcomes based on the oxygen-support status score. The 95% CIs for the AUC are shown in parentheses. (B) Box and jitter plots showing the prediction probabilities that test cases exceed the severity threshold (indicated by the dashed line). The center line of the box indicates the median; box limits represent the upper and lower quartiles; whiskers extend to 1.5&#x00D7; the IQR. Each dot represents an individual observation. (C) Variable importance in each predictive model evaluated using SHAP values. Bar plots show the mean absolute SHAP value for each variable across individual patients in the test dataset. (D) Heatmap of symptoms observed at initial diagnosis. Columns represent individual patients, ordered by severity level and sorted to minimize missing values and symptom absence. (E) Box and jitter plots showing the distribution of key continuous variables across severity groups. Plot elements are defined as in panel B. Alb: albumin; ALP: alkaline phosphatase; AMY: amylase; APTT: activated partial thromboplastin time; AUC: area under the receiver operating characteristic curve; Baso-%: basophil %; CK: creatine kinase; Cl: chloride; Cre: creatinine; CRP: C-reactive protein; eGFR-Cre: estimated glomerular filtration rate-creatinine; Eosino-%: eosinophil %; GLU: blood glucose; LDH: lactate dehydrogenase; Lympho-Count: lymphocyte count; MCH: mean corpuscular hemoglobin; MCHC: mean corpuscular hemoglobin concentration; MCV: mean corpuscular volume; Mono-Count: monocyte count; MPV: mean platelet volume; N/A: not available; PDW: platelet distribution width; Plt: platelet; PT: prothrombin time; Neutro-%: neutrophil %; RDW: red cell distribution width; SHAP: Shapley Additive Explanations; T-Bil: total bilirubin; TP: total protein; UA: uric acid; UN: urea nitrogen; WBC: white blood cell; &#x03B3;-GTP: gamma-glutamyl transpeptidase.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e65585_fig02.png"/></fig><p>Subsequently, we evaluated the variable importance of each prediction. The presence of pneumonia was identified as the most important predictor for whether severity would be &#x2265;2 (<xref ref-type="fig" rid="figure2">Figure 2C</xref>, leftmost panel). Most hospitalized patients with a severity of &#x2265;2 showed pneumonia at initial diagnosis, and all patients with a severity of &#x2265;3 had pneumonia (<xref ref-type="fig" rid="figure2">Figure 2D</xref>). Conversely, as the target severity level of prediction increased, the importance of symptoms decreased. Instead, biomarkers such as the lymphocyte count, prothrombin time (PT), C-reactive protein (CRP), creatinine, and amylase levels emerged as the top predictors (<xref ref-type="fig" rid="figure2">Figure 2C</xref>). BMI was also an important factor in predicting whether the severity was &#x2265;4 or &#x2265;5. Age remained an important factor across all severity levels. Among the important predictors, we examined the distribution of age and biomarkers according to actual severity prognosis. Age and BMI were higher in patients with a severity of &#x2265;3 than in others, while biomarkers such as PT, CRP, creatinine, red blood cell volume distribution width, and blood glucose values were higher in patients with a severity of &#x2265;4 (<xref ref-type="fig" rid="figure2">Figure 2E</xref>). Lymphocyte counts, estimated glomerular filtration rate (eGFR)-creatinine, and albumin values were lower in more severe cases than in less severe cases, and platelet counts were particularly low in mortality cases (<xref ref-type="fig" rid="figure2">Figure 2E</xref>). Amylase levels showed a peculiar distribution: they were low in patients with severity levels 4, 5, and 6, but extremely high in some patients with a severity level of 6 (<xref ref-type="fig" rid="figure2">Figure 2E</xref>).</p></sec><sec id="s3-3"><title>Dynamic Mortality Risk Assessment Based on Longitudinal Data During Hospitalization</title><p>Outcome screening based on information from the initial diagnosis was accurate but incomplete. This suggests that a patient&#x2019;s prognosis is not fully determined at the time of diagnosis and may change depending on the disease course and treatment after admission. When we investigated changes in severity status after admission, we found that oxygen administration and noninvasive ventilation were typically initiated within 5 days after admission, whereas invasive ventilation was often introduced more than 5 days after admission; death generally occurred more than 20 days after admission (<xref ref-type="fig" rid="figure3">Figure 3A</xref>). Additionally, many deaths occurred without invasive ventilation (<xref ref-type="fig" rid="figure3">Figure 3A</xref>, top panel). This is likely because most mortality cases involved older adults who were not eligible for invasive ventilation or ECMO, even when their condition deteriorated. These observations suggest that, during the weeks between admission and death or discharge, patients undergo changes in their condition that cannot be fully assessed based on oxygen-support status.</p><p>We then used survival models, including RSF [<xref ref-type="bibr" rid="ref19">19</xref>], to evaluate mortality risk during hospitalization. Initially, we attempted to develop a Cox proportional hazards model using all 72 variables, but the model could not be created due to multicollinearity. Therefore, we developed Cox proportional hazards models with L1 (LASSO), L2 (Ridge), and combined L1+L2 (Elastic Net) penalties. The Cox model achieved the highest performance, as evaluated by the C-index, when the Elastic Net penalty was applied. Its performance was comparable to that of the RSF model using all 72 variables (<xref ref-type="table" rid="table2">Table 2</xref>). When we retrained an RSF model using the top 10 important variables selected during the RSF learning process, as described in the &#x201C;Methods&#x201D; section, the performance improved substantially. We also constructed a Cox model based on the same top 10 variables selected by RSF. Although this model exhibited markedly better performance compared with the regularized Cox model, it did not match the predictive accuracy of the RSF model using the same variables. These findings highlight the critical importance of variable selection in enhancing model performance, as well as the value of accounting for interactions and nonlinear effects&#x2014;factors that the Cox model does not incorporate.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Dynamic mortality risk assessment during hospitalization. (A) Changes in severity status during hospitalization for each severity outcome group. The plot shows how the number of patients receiving procedures such as ventilation or oxygen administration changes over time after admission. (B) Daily mortality risk trajectories for each patient for each day of hospitalization in the test dataset. Mortality risk is shown as the 7-day CHF (ie, the risk of death within 7 days), calculated using the RSF. Filled circles in mortality cases indicate the date of last observation. (C) Daily mortality risk trajectories for each patient for each day of hospitalization in the training dataset. (D) Important variables contributing to the RSF-based mortality prediction. SurvSHAP(t) provides a time-dependent explanation of how each variable influences each patient&#x2019;s CHF. The left panel shows the mean aggregated SurvSHAP(t) for each case, that is, the mean value of aggregated SurvSHAP(t) across all days of hospitalization. Each circle represents the contribution of a variable to the prediction for each patient in the test dataset. The right panel shows the mean absolute value of SurvSHAP(t) across all patients in the test dataset. (E) Mean aggregated SurvSHAP(t) for each case (left), and mean aggregated |SurvSHAP(t)| across all cases (right) in the training dataset. AMY: amylase; Ca: calcium; CHF: cumulative hazard function; CRP: C-reactive protein; Plt: platelets; PT: prothrombin time; RSF: random survival forests; SpO<sub>2</sub>: peripheral oxygen saturation</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e65585_fig03.png"/></fig><p>For all 4 mortality cases in the test dataset, an increase in mortality risk was observed 1&#x2010;2 weeks before the outcome, and the CHF (ie, the estimated probability of death within 7 days) reached approximately 0.3 or higher at the time of death (<xref ref-type="fig" rid="figure3">Figure 3B</xref>). Conversely, in patients recovering from invasive or noninvasive ventilation, the CHF also increased around 1 week after admission, similar to the mortality cases, but then decreased and rarely exceeded 0.2. In mild cases that progressed with oxygen administration or room air, there was little increase in CHF. Similar changes in CHF were observed in the training dataset, which included 6 deaths, suggesting consistency of the predictive model between the training and test datasets (<xref ref-type="fig" rid="figure3">Figure 3C</xref>).</p><p>The average contribution of the variables to the RSF prediction for each patient was evaluated using the mean aggregated SurvSHAP(t). In addition to background factors such as age and BMI, blood test variables measured multiple times during hospitalization, such as platelets, amylase, and &#x03B2;-D-glucan, had the highest importance in mortality prediction (<xref ref-type="fig" rid="figure3">Figure 3D</xref>). Age, amylase level, and platelet count were identified as important predictors of mortality at initial diagnosis. Most of the important variables showed high contributions only in mortality cases; however, some, such as age and BMI, showed a high mean aggregated SurvSHAP(t) even in milder cases, suggesting that they are nonspecific factors. Conversely, important blood test variables such as &#x03B2;-D-glucan, platelets, and calcium (Ca) contributed less in some mortality cases, suggesting heterogeneity of deterioration. In the training data, these predictors also showed high contributions, especially in mortality cases, although there was some shuffling in their rankings (<xref ref-type="fig" rid="figure3">Figure 3E</xref>).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Performance metrics of mortality risk prediction models.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">Concordance index</td><td align="left" valign="bottom">Integrated Brier score</td><td align="left" valign="bottom">Cumulative area under the receiver operating characteristic curve</td></tr></thead><tbody><tr><td align="left" valign="top">Cox-LASSO<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="top">0.715</td><td align="left" valign="top">1.14</td><td align="left" valign="top">0.560</td></tr><tr><td align="left" valign="top">Cox-Ridge</td><td align="left" valign="top">0.595</td><td align="left" valign="top">1.53</td><td align="left" valign="top">0.481</td></tr><tr><td align="left" valign="top">Cox ElasticNet</td><td align="left" valign="top">0.845</td><td align="left" valign="top">1.31</td><td align="left" valign="top">0.731</td></tr><tr><td align="left" valign="top">Random survival forests with all 72 variables</td><td align="left" valign="top">0.843</td><td align="left" valign="top">0.664</td><td align="left" valign="top">0.753</td></tr><tr><td align="left" valign="top">Random survival forests with the top 10 variables</td><td align="left" valign="top"><italic>0.941</italic><sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="top">0.315</td><td align="left" valign="top"><italic>0.936</italic></td></tr><tr><td align="left" valign="top">Cox with the top 10 variables</td><td align="left" valign="top">0.919</td><td align="left" valign="top"><italic>0.272</italic></td><td align="left" valign="top">0.882</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>LASSO: least absolute shrinkage and selection operator.</p></fn><fn id="table2fn2"><p><sup>b</sup>Italicized values indicate the model with the best performance for each indicator.</p></fn></table-wrap-foot></table-wrap><p>We chose the 7-day time frame because it is clinically meaningful in the context of inpatient care, where monitoring and interventions typically follow a weekly cycle. It provides a practical horizon for anticipating deterioration and making timely care decisions. In addition, the 7-day window offered a suitable balance between the number of outcome events and prediction stability during model development. We also evaluated the data over different periods (eg, 1- and 14-day windows). Although the absolute values of the CHFs differed among the 1-, 7-, and 14-day prediction windows, the temporal patterns within each severity group were approximately consistent (see Figure S2 in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>).</p></sec><sec id="s3-4"><title>Rationale for Estimated Mortality Risk in Severe Cases</title><p>For the mortality risk assessment of patients with COVID-19, a machine learning model based on blood markers was proposed in Nature Machine Intelligence (NMI) 2020 [<xref ref-type="bibr" rid="ref21">21</xref>]. This model was built using samples obtained immediately before death or discharge, and lactate dehydrogenase, lymphocytes, and CRP were identified as key features. Mortality risk assessment using a decision tree using these 3 features was proposed in the study to facilitate clinical application (<xref ref-type="fig" rid="figure4">Figure 4A</xref>). After approximately 10 days of hospitalization, the RSF and NMI models showed equivalent performance as measured by accuracy and <italic>F</italic><sub>1</sub>-score. However, immediately following hospitalization, the RSF model outperformed the NMI model, indicating its superiority in early prognostic prediction (<xref ref-type="fig" rid="figure4">Figure 4B and C</xref>).</p><p>To examine the factors contributing to mortality risk over time, we calculated SurvSHAP(t) daily for the severe cases in the test dataset. Patients and time points showed different combinations of factors associated with changes in CHF (<xref ref-type="fig" rid="figure4">Figure 4D</xref>). For example, in young patients #2 and #6, peripheral oxygen saturation (SpO<sub>2</sub>) was associated with an increase in CHF immediately after admission. However, the contribution of SpO<sub>2</sub> decreased following the initiation of ECMO or invasive ventilation. By contrast, in patients #3 and #4, who were both older and not eligible for ECMO or invasive ventilation, the contribution of SpO<sub>2</sub> was higher than 10 days after hospitalization. &#x03B2;-D-glucan showed a greater contribution to mortality risk 1&#x2010;2 weeks before death than at any other time in patients #3, #4, and #6. Platelets had a high contribution in patients #4 and #6, and BMI also contributed to the mortality risk in these patients. Of note, in patient #4, BMI was measured for the first time on day 7, leading to a rapid increase in its contribution on that day. Calcium and blood amylase levels were elevated immediately before death, suggesting electrolyte abnormalities and multiorgan failure. CRP, a major predictor of mortality at initial diagnosis, contributed to risk assessment immediately after hospitalization.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Validation of the RSF model for mortality risk assessment. (A) Mortality risk assessment for COVID-19 based on 3 key predictors identified in a previous study: LDH, lymphocytes, and CRP. (B, C) Comparison of the performance of the RSF model developed in this study with the previously proposed NMI model. Accuracy (B) and <italic>F</italic><sub>1</sub>-score (C) for distinguishing survival and death cases are shown for each day after hospitalization, based on 61 COVID-19 cases in the test dataset. (D) Changes in the RSF-predicted mortality risk during hospitalization, along with daily SurvSHAP(t) of important predictors for severely ill patients in the test dataset. Six representative severe cases are shown, including 2 ECMO survivors and 4 deaths. The daily SurvSHAP(t) values for each variable correspond to changes in RSF mortality risk. The oxygen-support status is displayed between the CHF plot and the aggregated SurvSHAP(t) plot for each variable, as in <xref ref-type="fig" rid="figure3">Figure 3A</xref>: room air is shown in yellow, oxygen administration in light blue, NIV in green, and IMV/ECMO in blue. The light blue and black bars at the top of the graph indicate predictions by the previous NMI model, with light blue for predicted survival and black for predicted death. AMY: amylase; Ca: calcium; CHF: cumulative hazard function; CRP: C-reactive protein; ECMO: extracorporeal membrane oxygenation; IMV: invasive mechanical ventilation; LDH: lactate dehydrogenase; LFNC: low-flow nasal cannula; NIV: noninvasive ventilation; NMI: Nature Machine Intelligence; Plt: platelet; PT: prothrombin time; RA: room air; RSF: random survival forests; SpO<sub>2</sub>: peripheral oxygen saturation.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e65585_fig04.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this study, we developed a framework to assess the prognostic risks of individual patients with COVID-19. Although we were able to predict patient prognosis with reasonable accuracy based on symptoms and blood test results at initial diagnosis, the predicted risk and actual prognosis deviated for some patients, suggesting that prognostic risk may change during hospitalization. Our proposed RSF model demonstrated high performance in predicting in-hospital mortality as a binary outcome, with an <italic>F</italic><sub>1</sub>-score exceeding 0.95 based on daily predictions made immediately after hospitalization (threshold: CHF&#x003E;0.2). Visualization of predictors using SurvSHAP(t) made the model explainable for each patient, with consistent predictors observed in both the training and test datasets. Such a dynamic prognostic framework can provide health care providers with real-time guidance to support clinical decision-making during hospitalization.</p><p>In the prognostic model at initial diagnosis, we did not predefine a single severity cut-off to dichotomize the outcome. Instead, we explored multiple binary classification tasks based on different thresholds (eg, severity&#x2265;1, &#x2265;2,..., &#x2265;5) derived from the original 7-point ordinal outcome scale (0&#x2010;6). This approach was chosen to comprehensively assess how predictive performance varies across different levels of clinical severity and to allow for flexible interpretation depending on the clinical context of interest. The partial predictability of disease progression at the time of initial diagnosis can be explained by key variables. CRP levels were important for identifying moderate and severe cases that may require oxygen administration. There was a clear difference in CRP levels between severity levels 3 and 4, but little difference between severity levels &#x2265;4 (<xref ref-type="fig" rid="figure2">Figure 2E</xref>). The same was observed for eGFR-creatinine and lymphocyte values, with clear distinctions between severity levels 3 and 4, but minimal differences at higher severities. This suggests that inflammation, reflected by CRP and lymphocytes, and renal dysfunction, reflected by eGFR-creatinine, serve as entry points for severe disease; however, further progression in severity and mortality is mainly influenced by other factors. These findings are consistent with previous studies reporting that elevated CRP and decreased lymphocyte count or eGFR are associated with early COVID-19 severity [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. Our results, however, further suggest that the progression to higher severity and mortality is predominantly driven by additional factors beyond these early indicators. Interestingly, creatinine was not ranked among the top 15 features only in the severity prediction model with the threshold &#x2265;3, while it appeared consistently for other thresholds (<xref ref-type="fig" rid="figure2">Figure 2C</xref>). This phenomenon may be attributed to the high degree of information overlap between creatinine and eGFR-creatinine, the latter being a composite measure that incorporates both age and sex and may have provided a more robust signal under this specific threshold. Platelet and amylase levels are the most likely factors associated with the progression of disease severity and mortality, given their importance in prognostic models during hospitalization. Platelet counts were characteristically lower in several mortality cases than in other severe cases, and amylase levels were markedly elevated in some fatal cases (<xref ref-type="fig" rid="figure2">Figure 2E</xref>). Fatal cases characterized by these factors may represent patients in whom signs of poor prognosis are already present at initial diagnosis. However, it should be noted that some deaths did not show such signs at initial diagnosis, making them difficult to distinguish from severe or even mild cases.</p><p>Although the initial diagnosis model demonstrated fair discriminatory ability overall (AUC 0.717 for predicting severity &#x2265;2), its performance remains below the generally accepted threshold for strong clinical utility (eg, &#x2265;0.8), particularly when applied to low-risk patients. While this AUC is clearly better than random chance (AUC 0.5), it may be insufficient for dependable clinical decision-making when used in isolation. The relatively lower performance in low-risk groups suggests that predicting hospital admission based solely on initial laboratory values may be inherently limited, and that more nuanced clinical judgment&#x2014;incorporating symptoms, physical findings, and contextual factors&#x2014;may be necessary in such cases.</p><p>Several RSF predictors that varied early in mortality cases were identified. Platelet and PT values were among the top 10 early predictors in the RSF model for COVID-19 mortality. Patients with COVID-19 are prone to arterial and venous thrombosis, and in severe cases, disseminated intravascular coagulation (DIC) can complicate their condition and lead to death [<xref ref-type="bibr" rid="ref24">24</xref>]. DIC was observed in only 0.6% of COVID-19 survivors, but it occurred frequently in 71.4% of mortality cases [<xref ref-type="bibr" rid="ref22">22</xref>]. Our results support the idea that coagulation abnormalities, which may lead to DIC, are early predictors of COVID-19 mortality. Amylase was also identified as an important predictor of dynamic mortality risk. It is mainly secreted by the pancreas and salivary glands. Previous studies have reported elevated blood amylase levels in patients with severe COVID-19 [<xref ref-type="bibr" rid="ref23">23</xref>]. Blood amylase levels are regulated by the balance between amylase production and clearance; elevated levels suggest damage to the producing tissues or impaired kidney function related to clearance. Such tissue damage may be a key event in the death of patients with COVID-19. Changes in blood cell composition were included among the RSF predictors, but these changes were not specific to patients who died (<xref ref-type="fig" rid="figure4">Figure 4</xref>). Platelets form platelet-neutrophil complexes when activated, which trigger neutrophil release via neutrophil extracellular traps [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. Neutrophilia is not an independent risk factor for mortality but may act as a predisposing factor for DIC, ultimately leading to death. &#x03B2;-D-glucan is not only an indicator of fungal infection but also a marker of sepsis-related gastrointestinal leakage [<xref ref-type="bibr" rid="ref27">27</xref>]. Even in the absence of fungemia or bacteremia, blood &#x03B2;-D-glucan levels during COVID-19 infection can induce neutrophil extracellular traps and may be associated with hypercytokinemia and severe inflammation [<xref ref-type="bibr" rid="ref28">28</xref>]. By integrating these dynamically changing risk factors using RSF, we were able to accurately assess how close each patient was to death at each time point.</p><p>Previous studies have used the approach of building models based on data immediately before outcomes such as death or hospital discharge, and then applying these models to earlier time points to predict prognosis [<xref ref-type="bibr" rid="ref21">21</xref>]. Although this approach can identify factors directly associated with mortality and achieves good predictive accuracy near the outcome, it has not performed well for early prognostic prediction. Even among patients with COVID-19, at least 10 factors are associated with death, and their importance shifts over time: CRP and SpO<sub>2</sub> are more influential in the earlier phases, whereas &#x03B2;-D-glucan, platelets, and calcium become more important just before death. In patients with COVID-19, viral proliferation is considered the primary pathogenic mechanism during the first few days after onset, whereas the inflammatory response and coagulation abnormalities due to host immunity become the dominant factors after the first week [<xref ref-type="bibr" rid="ref29">29</xref>]. This shift necessitates early administration of antiviral drugs and neutralizing antibodies during the initial phase, and the use of steroids and anticoagulation therapy after the first week [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. For effective clinical decision-making based on the phase of hospitalization, it is essential to present mortality risk with distinct, phase-specific rationales.</p><p>Our prognostic framework can be applied to various aspects of disease prevention and treatment. Early prognostic prediction immediately after hospitalization, which screens for potentially severe cases with high sensitivity, can be used to estimate the number of hospital beds and the amount of medical equipment required. Additionally, owing to the recent shortage of hospital beds, the number of patients receiving treatment at home is increasing, and cases of sudden deterioration or death during home care have become a cause for concern. By using the RSF model to identify early signs of mortality risk, it may be possible to reduce deaths during home treatment and ensure safer management outside the hospital. Coagulation factors, which are key predictors in the RSF mortality model, represent potent targets for early intervention. Heparin administration has been reported to improve the prognosis of severe DIC in patients with COVID-19 [<xref ref-type="bibr" rid="ref32">32</xref>]. The RSF model may help determine the appropriate timing for initiating anticoagulation therapy and evaluate treatment effects over time.</p><p>Although our study utilized a retrospective dataset, we designed the model to simulate real-time clinical application by dynamically updating the CHF at each time point during hospitalization (eg, day t, t+1, t+2). At each time point, only clinical data available up to that day were used, thereby emulating real-world scenarios in which patient information accumulates sequentially. The RSF model recalculates risk scores daily, enabling the timely identification of clinical deterioration and supporting dynamic decision-making. This time-updating mechanism reflects the evolving clinical status of patients and is essential for informing appropriate interventions and care adjustments during hospitalization.</p><p>While our framework was developed using data from patients with COVID-19, the underlying approach&#x2014;time-varying survival modeling with interpretable outputs&#x2014;is applicable to other acute or chronic diseases characterized by dynamic clinical trajectories. However, we acknowledge that this generalizability has not yet been empirically validated. Future work should explore its application to other conditions, such as sepsis, pneumonia, or heart failure, using disease-specific datasets to evaluate the framework&#x2019;s adaptability and robustness. To facilitate clinical integration, the model outputs could be embedded into electronic health record systems as real-time dashboards that display individualized risk trajectories and highlight contributing variables. For example, dynamic risk scores and SurvSHAP(t)-based feature summaries could be visualized alongside vital signs or laboratory trends to support triage decisions, early warnings, or escalation of therapy. Although we did not conduct a formal usability study, preliminary feedback from a small group of physicians who viewed the SurvSHAP(t) visualizations suggested that the temporal feature contributions enhanced their understanding of the rationale behind changes in risk over time. Future work should include structured surveys or qualitative interviews to assess how explainability tools influence clinician trust, understanding, and adoption in real-world settings.</p><p>In the interpretation of SurvSHAP(t) values, negative values indicate that a variable contributes to an increase in the predicted cumulative hazard, corresponding to a higher mortality risk. Conversely, positive values suggest a protective effect by lowering the predicted risk. SHAP-based feature importance, measured using both the mean absolute SHAP values (|SHAP|) and the mean aggregated absolute SurvSHAP(t) values, which average patient-level contributions over time, reflects the expected magnitude of each variable&#x2019;s influence on the model output across all observations. This provides insight into how sensitive the model&#x2019;s predictions are to each variable in aggregate and can be considered a model-based global sensitivity analysis method. In other words, a variable with a larger mean (aggregated) absolute SHAP value is expected to induce greater changes in the model&#x2019;s output when perturbed, indicating higher sensitivity to that feature.</p><p>As an additional aspect of sensitivity analysis, we examined the impact of different missing data scenarios. Preliminary results showed that, although prediction performance occasionally improved slightly without imputation, SHAP analysis revealed that the model was leveraging whether certain symptom variables were measured, essentially using the pattern of missingness as a predictive case. This indicates that the missingness mechanism was likely not at random and may have been biasedly associated with patient outcomes. To prevent overfitting to such data collection artifacts and ensure that the model relied on clinically meaningful features rather than exploiting missingness as a proxy, we opted to train all final models on imputed data.</p><p>We recognize that comorbidities may serve as confounders, influencing both predictor variables and patient outcomes. Although comorbidities were included as input features when available, we did not explicitly adjust for them using causal inference frameworks. Future extensions of this work should incorporate structured comorbidity indices (eg, Charlson or Elixhauser indices) and consider techniques such as inverse probability weighting or propensity score adjustment to reduce bias and enhance causal interpretability.</p><p>We designed the model with real-time applicability in mind. To assess its suitability for clinical implementation, we quantified the computation time (Table S3 in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>). In our implementation, the learning and inference times for RSF were approximately 1.89 and 0.25 seconds, respectively. Cox regression required approximately 0.10 seconds for learning and 0.01 seconds for inference, making RSF roughly 20 times slower in both processes. However, the computational times for RSF remain sufficiently short to enable inference in real-world clinical settings and do not present a barrier to real-time clinical application. On the other hand, calculating the contribution of variables to the prediction results using SurvSHAP(t) took approximately 20,000 seconds (ie, over 5 hours) for the test dataset of 828 records. Even when converted to computation time per record, the processing remains substantial and may pose a barrier to its use in actual clinical practice. To support future clinical applications, a more efficient and faster implementation of SurvSHAP(t) is desirable.</p><p>To evaluate potential biases in dynamic mortality predictions across different demographic groups, we conducted subgroup analyses based on sex and age categories, as summarized in <xref ref-type="table" rid="table3">Table 3</xref>. Specifically, we assessed performance in the following subgroups: males only, a younger age group (&#x003C;65 years), and an older age group (&#x2265;75 years). The results indicated a slight decrease in predictive performance among males compared with the overall cohort. By contrast, the younger age group showed a marginal performance improvement, likely reflecting the lower incidence of mortality in this subgroup. Conversely, the older age group exhibited a slight reduction in predictive performance, possibly due to the higher mortality rate in this population. Nonetheless, the performance differences across these subgroups were relatively minor compared with the overall analysis, suggesting that the model does not display substantial bias with respect to sex or age. It should also be noted that our dataset consisted exclusively of Japanese patients, limiting our ability to evaluate predictive fairness across different ethnic groups. We acknowledge this limitation and recognize the need for further validation in more diverse populations.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Performance of mortality prediction in subgroup analyses.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Subgroup</td><td align="left" valign="bottom">Concordance index</td></tr></thead><tbody><tr><td align="left" valign="top">All</td><td align="left" valign="top">0.941</td></tr><tr><td align="left" valign="top">Males only</td><td align="left" valign="top">0.919</td></tr><tr><td align="left" valign="top">Younger age group (&#x003C;65 years)</td><td align="left" valign="top">0.957</td></tr><tr><td align="left" valign="top">Older age group (&#x2265;75 years)</td><td align="left" valign="top">0.864</td></tr></tbody></table></table-wrap><p>This study had several limitations. First, the study cohort was relatively small, and data were obtained from a single hospital. As machine learning model performance and robustness are highly influenced by data size and diversity, our models may be prone to overfitting to this specific cohort. As a result, the identified predictive patterns could lack stability and generalizability when applied to other populations without retraining. Furthermore, the substantial reliance on data imputation to address missing values, particularly for certain biomarkers, introduces an additional layer of potential model instability and overfitting risk, as the models may inadvertently learn patterns from the imputation process itself rather than from true underlying biological signals. Consequently, the model will require updates and rigorous revalidation as the study expands to multiple centers and includes a larger sample size, ideally with efforts to minimize the extent of missing data. Second, we included only patients with COVID-19 diagnosed in 2020. Therefore, it is necessary to evaluate the generalizability of these models, including their applicability to different SARS-CoV-2 variants and the effects of vaccination. Notably, the data used in this study were collected during a period when vaccination was rarely administered, and can thus be considered valuable in representing disease trajectories unaffected by vaccination. Third, the study treated daily records from the same patient as independent data points for training, which presents a technical challenge for RSF. Incorporating the risk estimated on the previous day may enable more accurate predictions.</p><p>To advance the clinical utility and generalizability of the model, we plan to conduct a multicenter study involving hospitals with diverse patient populations and care protocols. This will enable retraining and external validation of the model across different clinical settings. Additionally, we aim to prospectively evaluate the model in a clinical pilot study, focusing on real-time integration, clinician usability, and assessment of treatment impact through interventional trials.</p></sec><sec id="s4-2"><title>Conclusions</title><p>We developed and validated an interpretable 2-model framework to enhance prognostic support for patients with COVID-19. The framework integrates a LightGBM model for predicting disease severity at admission with an RSF model that provides daily mortality risk estimates throughout hospitalization. These complementary models are designed to address distinct clinical needs at different stages of patient care.</p><p>Central to our approach is interpretability through SurvSHAP(t), which identified actionable, phase-specific predictors, such as elevated CRP levels at admission, declining SpO<sub>&#x2082;</sub> during progression, and late-stage indicators such as platelet loss accompanied by elevated &#x03B2;-D-glucan. These time-dependent explanations empower clinicians to anticipate and respond to evolving patient conditions with greater precision.</p><p>By combining early disease stratification with continuous, explainable mortality prediction, our framework facilitates timely interventions and strategic resource allocation. This demonstrates significant potential to improve clinical decision-making in dynamic care environments and may serve as a foundation for managing future infectious disease outbreaks with heterogeneous trajectories, pending prospective multi-institutional validation.</p></sec></sec></body><back><ack><p>We thank Elsevier Language Editing Services for reviewing the manuscript to eliminate grammatical and spelling errors and to ensure adherence to correct scientific English. This study was supported by grants from the Japan Society for the Promotion of Science (JSPS KAKENHI: grants JP20K21837, JP21K02356, and JP25K21344 to TI); the Japan Science and Technology Agency (JST) Moonshot R&#x0026;D Program (grant JPMJMS2025 to EK); the JST CREST Program (grant JPMJCR20H4 to EK); and the Japan Agency for Medical Research and Development (AMED: grants JP21wm0325007, JP20fk0108412, JP20fk0108413, and JP21gm5010003 to EK). The funders had no role in the study design, data collection, data analysis and interpretation, or writing of the manuscript. The authors confirm that no generative artificial intelligence tools were used in the original drafting of the manuscript. During the revision phase only, artificial intelligence&#x2013;based language polishing assistance was obtained from ChatGPT (model o3, OpenAI, 2025), Claude (Sonnet 4, Anthropic, 2025), and Gemini (2.5 Pro, Google, 2025). All suggestions provided by these tools were independently reviewed, fact-checked, and manually edited by the authors before inclusion. The authors remain fully responsible for the accuracy and integrity of the final text. This study was presented as a poster at the 6th Workshop on Virus Dynamics, held in July 2023.</p></ack><notes><sec><title>Data Availability</title><p>The datasets used or analyzed during this study are available from the corresponding author (EK) upon reasonable request. The underlying code and the training/test datasets are not publicly available but may be made available to qualified researchers upon reasonable request from the corresponding author.</p></sec></notes><fn-group><fn fn-type="con"><p>TI, M Shinoda, KS, EK, and M Shinkai designed the study. M Shinoda, KA, SO, KK, and M Shinkai collected the data. TI, MO, and EK conducted the data analysis. All authors contributed to data interpretation, manuscript writing, and critical review, and approved the final version of the manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb2">C-index</term><def><p>concordance index</p></def></def-item><def-item><term id="abb3">CHF</term><def><p>cumulative hazard function</p></def></def-item><def-item><term id="abb4">CRP</term><def><p>C-reactive protein</p></def></def-item><def-item><term id="abb5">DIC</term><def><p>disseminated intravascular coagulation</p></def></def-item><def-item><term id="abb6">ECMO</term><def><p>extracorporeal membrane oxygenation</p></def></def-item><def-item><term id="abb7">eGFR</term><def><p>estimated glomerular filtration rate</p></def></def-item><def-item><term id="abb8">GBDT</term><def><p>gradient boosting decision trees</p></def></def-item><def-item><term id="abb9">LASSO</term><def><p>least absolute shrinkage and selection operator</p></def></def-item><def-item><term id="abb10">LightGBM</term><def><p>Light Gradient Boosting Machine</p></def></def-item><def-item><term id="abb11">NMI</term><def><p>Nature Machine Intelligence</p></def></def-item><def-item><term id="abb12">PT</term><def><p>prothrombin time</p></def></def-item><def-item><term id="abb13">RSF</term><def><p>random survival forests</p></def></def-item><def-item><term id="abb14">SHAP</term><def><p>Shapley Additive Explanation</p></def></def-item><def-item><term id="abb15">SpO<sub>2</sub></term><def><p>peripheral oxygen saturation</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Forster</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Murff</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Peterson</surname><given-names>JF</given-names> </name><name name-style="western"><surname>Gandhi</surname><given-names>TK</given-names> </name><name name-style="western"><surname>Bates</surname><given-names>DW</given-names> </name></person-group><article-title>The incidence and severity of adverse events affecting patients after discharge from the hospital</article-title><source>Ann Intern Med</source><year>2003</year><month>02</month><day>4</day><volume>138</volume><issue>3</issue><fpage>161</fpage><lpage>167</lpage><pub-id pub-id-type="doi">10.7326/0003-4819-138-3-200302040-00007</pub-id><pub-id pub-id-type="medline">12558354</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Odell</surname><given-names>M</given-names> </name><name name-style="western"><surname>Victor</surname><given-names>C</given-names> </name><name name-style="western"><surname>Oliver</surname><given-names>D</given-names> </name></person-group><article-title>Nurses&#x2019; role in detecting deterioration in ward patients: systematic literature review</article-title><source>J Adv Nurs</source><year>2009</year><month>10</month><volume>65</volume><issue>10</issue><fpage>1992</fpage><lpage>2006</lpage><pub-id pub-id-type="doi">10.1111/j.1365-2648.2009.05109.x</pub-id><pub-id pub-id-type="medline">20568317</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mok</surname><given-names>WQ</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Liaw</surname><given-names>SY</given-names> </name></person-group><article-title>Vital signs monitoring to detect patient deterioration: an integrative literature review</article-title><source>Int J Nurs Pract</source><year>2015</year><month>05</month><volume>21 Suppl 2</volume><fpage>91</fpage><lpage>98</lpage><pub-id pub-id-type="doi">10.1111/ijn.12329</pub-id><pub-id pub-id-type="medline">26125576</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Pan</surname><given-names>C</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Management of critically ill patients with COVID-19 in ICU: statement from front-line intensive care experts in Wuhan, China</article-title><source>Ann Intensive Care</source><year>2020</year><month>06</month><day>6</day><volume>10</volume><issue>1</issue><fpage>73</fpage><pub-id pub-id-type="doi">10.1186/s13613-020-00689-1</pub-id><pub-id pub-id-type="medline">32506258</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Adhikari</surname><given-names>NKJ</given-names> </name><name name-style="western"><surname>Fowler</surname><given-names>RA</given-names> </name><name name-style="western"><surname>Bhagwanjee</surname><given-names>S</given-names> </name><name name-style="western"><surname>Rubenfeld</surname><given-names>GD</given-names> </name></person-group><article-title>Critical care and the global burden of critical illness in adults</article-title><source>Lancet</source><year>2010</year><month>10</month><day>16</day><volume>376</volume><issue>9749</issue><fpage>1339</fpage><lpage>1346</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(10)60446-1</pub-id><pub-id pub-id-type="medline">20934212</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Perotte</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ranganath</surname><given-names>R</given-names> </name><name name-style="western"><surname>Hirsch</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Blei</surname><given-names>D</given-names> </name><name name-style="western"><surname>Elhadad</surname><given-names>N</given-names> </name></person-group><article-title>Risk prediction for chronic kidney disease progression using heterogeneous electronic health record data and time series analysis</article-title><source>J Am Med Inform Assoc</source><year>2015</year><month>07</month><volume>22</volume><issue>4</issue><fpage>872</fpage><lpage>880</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocv024</pub-id><pub-id pub-id-type="medline">25896647</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Renu</surname><given-names>K</given-names> </name><name name-style="western"><surname>Prasanna</surname><given-names>PL</given-names> </name><name name-style="western"><surname>Valsala Gopalakrishnan</surname><given-names>A</given-names> </name></person-group><article-title>Coronaviruses pathogenesis, comorbidities and multi-organ damage - a review</article-title><source>Life Sci</source><year>2020</year><month>08</month><day>15</day><volume>255</volume><fpage>117839</fpage><pub-id pub-id-type="doi">10.1016/j.lfs.2020.117839</pub-id><pub-id pub-id-type="medline">32450165</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nielsen</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Thorsen-Meyer</surname><given-names>HC</given-names> </name><name name-style="western"><surname>Belling</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Survival prediction in intensive-care units based on aggregation of long-term disease history and acute physiology: a retrospective study of the Danish National Patient Registry and electronic patient records</article-title><source>Lancet Digit Health</source><year>2019</year><month>06</month><volume>1</volume><issue>2</issue><fpage>e78</fpage><lpage>e89</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(19)30024-X</pub-id><pub-id pub-id-type="medline">33323232</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johnson</surname><given-names>AEW</given-names> </name><name name-style="western"><surname>Ghassemi</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Nemati</surname><given-names>S</given-names> </name><name name-style="western"><surname>Niehaus</surname><given-names>KE</given-names> </name><name name-style="western"><surname>Clifton</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Clifford</surname><given-names>GD</given-names> </name></person-group><article-title>Machine learning and decision support in critical care</article-title><source>Proc IEEE Inst Electr Electron Eng</source><year>2016</year><month>02</month><volume>104</volume><issue>2</issue><fpage>444</fpage><lpage>466</lpage><pub-id pub-id-type="doi">10.1109/JPROC.2015.2501978</pub-id><pub-id pub-id-type="medline">27765959</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Toma&#x0161;ev</surname><given-names>N</given-names> </name><name name-style="western"><surname>Glorot</surname><given-names>X</given-names> </name><name name-style="western"><surname>Rae</surname><given-names>JW</given-names> </name><etal/></person-group><article-title>A clinically applicable approach to continuous prediction of future acute kidney injury</article-title><source>Nature New Biol</source><year>2019</year><month>08</month><volume>572</volume><issue>7767</issue><fpage>116</fpage><lpage>119</lpage><pub-id pub-id-type="doi">10.1038/s41586-019-1390-1</pub-id><pub-id pub-id-type="medline">31367026</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thorsen-Meyer</surname><given-names>HC</given-names> </name><name name-style="western"><surname>Nielsen</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Nielsen</surname><given-names>AP</given-names> </name><etal/></person-group><article-title>Dynamic and explainable machine learning prediction of mortality in patients in the intensive care unit: a retrospective study of high-frequency data in electronic patient records</article-title><source>Lancet Digit Health</source><year>2020</year><month>04</month><volume>2</volume><issue>4</issue><fpage>e179</fpage><lpage>e191</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(20)30018-2</pub-id><pub-id pub-id-type="medline">33328078</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Quinn</surname><given-names>TP</given-names> </name><name name-style="western"><surname>Jacobs</surname><given-names>S</given-names> </name><name name-style="western"><surname>Senadeera</surname><given-names>M</given-names> </name><name name-style="western"><surname>Le</surname><given-names>V</given-names> </name><name name-style="western"><surname>Coghlan</surname><given-names>S</given-names> </name></person-group><article-title>The three ghosts of medical AI: can the black-box present deliver?</article-title><source>Artif Intell Med</source><year>2022</year><month>02</month><volume>124</volume><fpage>102158</fpage><pub-id pub-id-type="doi">10.1016/j.artmed.2021.102158</pub-id><pub-id pub-id-type="medline">34511267</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lundberg</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SI</given-names> </name></person-group><article-title>A unified approach to interpreting model predictions</article-title><conf-name>NIPS&#x2019;17: Proceedings of the 31st International Conference on Neural Information Processing Systems</conf-name><conf-date>Dec 4-9, 2017</conf-date><conf-loc>Long Beach, CA</conf-loc><fpage>4768</fpage><lpage>4777</lpage></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grein</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ohmagari</surname><given-names>N</given-names> </name><name name-style="western"><surname>Shin</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Compassionate use of remdesivir for patients with severe COVID-19</article-title><source>N Engl J Med</source><year>2020</year><month>06</month><day>11</day><volume>382</volume><issue>24</issue><fpage>2327</fpage><lpage>2336</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa2007016</pub-id><pub-id pub-id-type="medline">32275812</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Ke</surname><given-names>G</given-names> </name><name name-style="western"><surname>Meng</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Finley</surname><given-names>T</given-names> </name><etal/></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Guyon</surname><given-names>I</given-names> </name></person-group><article-title>LightGBM: a highly efficient gradient boosting decision tree</article-title><source>Advances in Neural Information Processing Systems</source><year>2017</year><volume>30</volume><publisher-name>Curran Associates, Inc</publisher-name></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Friedman</surname><given-names>JH</given-names> </name></person-group><article-title>Greedy function approximation: A gradient boosting machine</article-title><source>Ann Statist</source><year>2001</year><volume>29</volume><issue>5</issue><fpage>1189</fpage><lpage>1232</lpage><pub-id pub-id-type="doi">10.1214/aos/1013203451</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stekhoven</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>B&#x00FC;hlmann</surname><given-names>P</given-names> </name></person-group><article-title>MissForest--non-parametric missing value imputation for mixed-type data</article-title><source>Bioinformatics</source><year>2012</year><month>01</month><day>1</day><volume>28</volume><issue>1</issue><fpage>112</fpage><lpage>118</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btr597</pub-id><pub-id pub-id-type="medline">22039212</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Akiba</surname><given-names>T</given-names> </name><name name-style="western"><surname>Sano</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yanase</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Optuna: a next-generation hyperparameter optimization framework</article-title><conf-name>Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery &#x0026; Data Mining</conf-name><conf-date>Aug 4-8, 2019</conf-date><conf-loc>Anchorage, AK</conf-loc><fpage>2623</fpage><lpage>2631</lpage><pub-id pub-id-type="doi">10.1145/3292500.333070</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ishwaran</surname><given-names>H</given-names> </name><name name-style="western"><surname>Kogalur</surname><given-names>UB</given-names> </name><name name-style="western"><surname>Blackstone</surname><given-names>EH</given-names> </name><name name-style="western"><surname>Lauer</surname><given-names>MS</given-names> </name></person-group><article-title>Random survival forests</article-title><source>Ann Appl Stat</source><year>2008</year><month>09</month><volume>2</volume><issue>3</issue><fpage>841</fpage><lpage>860</lpage><pub-id pub-id-type="doi">10.1214/08-AOAS169</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Krzyzi&#x0144;ski</surname><given-names>M</given-names> </name><name name-style="western"><surname>Spytek</surname><given-names>M</given-names> </name><name name-style="western"><surname>Baniecki</surname><given-names>H</given-names> </name><name name-style="western"><surname>Biecek</surname><given-names>P</given-names> </name></person-group><article-title>SurvSHAP(t): time-dependent explanations of machine learning survival models</article-title><source>Knowl Based Syst</source><year>2023</year><month>02</month><volume>262</volume><fpage>110234</fpage><pub-id pub-id-type="doi">10.1016/j.knosys.2022.110234</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yan</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>HT</given-names> </name><name name-style="western"><surname>Goncalves</surname><given-names>J</given-names> </name><etal/></person-group><article-title>An interpretable mortality prediction model for COVID-19 patients</article-title><source>Nat Mach Intell</source><year>2020</year><volume>2</volume><issue>5</issue><fpage>283</fpage><lpage>288</lpage><pub-id pub-id-type="doi">10.1038/s42256-020-0180-7</pub-id><pub-id pub-id-type="medline">32285025</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tang</surname><given-names>N</given-names> </name><name name-style="western"><surname>Li</surname><given-names>D</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>Z</given-names> </name></person-group><article-title>Abnormal coagulation parameters are associated with poor prognosis in patients with novel coronavirus pneumonia</article-title><source>J Thromb Haemost</source><year>2020</year><month>04</month><volume>18</volume><issue>4</issue><fpage>844</fpage><lpage>847</lpage><pub-id pub-id-type="doi">10.1111/jth.14768</pub-id><pub-id pub-id-type="medline">32073213</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>F</given-names> </name><name name-style="western"><surname>Long</surname><given-names>X</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>X</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Z</given-names> </name></person-group><article-title>ACE2 expression in pancreas may cause pancreatic damage after SARS-CoV-2 infection</article-title><source>Clin Gastroenterol Hepatol</source><year>2020</year><month>08</month><volume>18</volume><issue>9</issue><fpage>2128</fpage><lpage>2130</lpage><pub-id pub-id-type="doi">10.1016/j.cgh.2020.04.040</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fraiss&#x00E9;</surname><given-names>M</given-names> </name><name name-style="western"><surname>Logre</surname><given-names>E</given-names> </name><name name-style="western"><surname>Pajot</surname><given-names>O</given-names> </name><name name-style="western"><surname>Mentec</surname><given-names>H</given-names> </name><name name-style="western"><surname>Plantef&#x00E8;ve</surname><given-names>G</given-names> </name><name name-style="western"><surname>Contou</surname><given-names>D</given-names> </name></person-group><article-title>Thrombotic and hemorrhagic events in critically ill COVID-19 patients: a French monocenter retrospective study</article-title><source>Crit Care</source><year>2020</year><month>06</month><day>2</day><volume>24</volume><issue>1</issue><fpage>275</fpage><pub-id pub-id-type="doi">10.1186/s13054-020-03025-y</pub-id><pub-id pub-id-type="medline">32487122</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guo</surname><given-names>L</given-names> </name><name name-style="western"><surname>Rondina</surname><given-names>MT</given-names> </name></person-group><article-title>The era of thromboinflammation: platelets are dynamic sensors and effector cells during infectious diseases</article-title><source>Front Immunol</source><year>2019</year><volume>10</volume><fpage>2204</fpage><pub-id pub-id-type="doi">10.3389/fimmu.2019.02204</pub-id><pub-id pub-id-type="medline">31572400</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kimball</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Obi</surname><given-names>AT</given-names> </name><name name-style="western"><surname>Diaz</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Henke</surname><given-names>PK</given-names> </name></person-group><article-title>The emerging role of NETs in venous thrombosis and immunothrombosis</article-title><source>Front Immunol</source><year>2016</year><volume>7</volume><fpage>236</fpage><pub-id pub-id-type="doi">10.3389/fimmu.2016.00236</pub-id><pub-id pub-id-type="medline">27446071</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Leelahavanichkul</surname><given-names>A</given-names> </name><name name-style="western"><surname>Worasilchai</surname><given-names>N</given-names> </name><name name-style="western"><surname>Wannalerdsakun</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Gastrointestinal leakage detected by serum (1&#x2192;3)-&#x03B2;-D-glucan in mouse models and a pilot study in patients with sepsis</article-title><source>Shock</source><year>2016</year><month>11</month><volume>46</volume><issue>5</issue><fpage>506</fpage><lpage>518</lpage><pub-id pub-id-type="doi">10.1097/SHK.0000000000000645</pub-id><pub-id pub-id-type="medline">27172153</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saithong</surname><given-names>S</given-names> </name><name name-style="western"><surname>Worasilchai</surname><given-names>N</given-names> </name><name name-style="western"><surname>Saisorn</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Neutrophil extracellular traps in severe SARS-CoV-2 infection: a possible impact of LPS and (1&#x2192;3)-&#x03B2;-D-glucan in blood from gut translocation</article-title><source>Cells</source><year>2022</year><month>03</month><day>24</day><volume>11</volume><issue>7</issue><fpage>1103</fpage><pub-id pub-id-type="doi">10.3390/cells11071103</pub-id><pub-id pub-id-type="medline">35406667</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Siddiqi</surname><given-names>HK</given-names> </name><name name-style="western"><surname>Mehra</surname><given-names>MR</given-names> </name></person-group><article-title>COVID-19 illness in native and immunosuppressed states: a clinical-therapeutic staging proposal</article-title><source>J Heart Lung Transplant</source><year>2020</year><month>05</month><volume>39</volume><issue>5</issue><fpage>405</fpage><lpage>407</lpage><pub-id pub-id-type="doi">10.1016/j.healun.2020.03.012</pub-id><pub-id pub-id-type="medline">32362390</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gandhi</surname><given-names>RT</given-names> </name><name name-style="western"><surname>Lynch</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Del Rio</surname><given-names>C</given-names> </name></person-group><article-title>Mild or Moderate COVID-19</article-title><source>N Engl J Med</source><year>2020</year><month>10</month><day>29</day><volume>383</volume><issue>18</issue><fpage>1757</fpage><lpage>1766</lpage><pub-id pub-id-type="doi">10.1056/NEJMcp2009249</pub-id><pub-id pub-id-type="medline">32329974</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Murakami</surname><given-names>N</given-names> </name><name name-style="western"><surname>Hayden</surname><given-names>R</given-names> </name><name name-style="western"><surname>Hills</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Therapeutic advances in COVID-19</article-title><source>Nat Rev Nephrol</source><year>2023</year><volume>19</volume><issue>1</issue><fpage>38</fpage><lpage>52</lpage><pub-id pub-id-type="doi">10.1038/s41581-022-00642-4</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tang</surname><given-names>N</given-names> </name><name name-style="western"><surname>Bai</surname><given-names>H</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>X</given-names> </name><name name-style="western"><surname>Gong</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>D</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>Z</given-names> </name></person-group><article-title>Anticoagulant treatment is associated with decreased mortality in severe coronavirus disease 2019 patients with coagulopathy</article-title><source>J Thromb Haemost</source><year>2020</year><month>05</month><volume>18</volume><issue>5</issue><fpage>1094</fpage><lpage>1099</lpage><pub-id pub-id-type="doi">10.1111/jth.14817</pub-id><pub-id pub-id-type="medline">32220112</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Descriptive statistics of 84 variables&#x2014;including background information, symptoms, and blood and urine test data&#x2014;of patients with COVID-19 for prognostic screening at initial diagnosis.</p><media xlink:href="formative_v9i1e65585_app1.xlsx" xlink:title="XLSX File, 18 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Descriptive statistics of 72 variables&#x2014;including background information, vital signs, and blood and urine test data&#x2014;of patients with COVID-19 for dynamic mortality risk assessment during hospitalization.</p><media xlink:href="formative_v9i1e65585_app2.xlsx" xlink:title="XLSX File, 15 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Receiver operating characteristic curves, confusion matrices, and absolute values of the cumulative hazard functions.</p><media xlink:href="formative_v9i1e65585_app3.pdf" xlink:title="PDF File, 541 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Performance of hospitalization prediction models, including Light Gradient Boosting Machine, random forest, support vector machine, Elastic Net, and decision tree.</p><media xlink:href="formative_v9i1e65585_app4.pdf" xlink:title="PDF File, 120 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Detailed methods covering missing data imputation, hyperparameter optimization, ensemble averaging, evaluation metrics, model selection and interpretability rationale, and clinical justification of selected predictors.</p><media xlink:href="formative_v9i1e65585_app5.pdf" xlink:title="PDF File, 125 KB"/></supplementary-material><supplementary-material id="app6"><label>Multimedia Appendix 6</label><p>Comparison of computation time for training, prediction, and Shapley Additive Explanations&#x2013;based interpretation in survival analysis.</p><media xlink:href="formative_v9i1e65585_app6.pdf" xlink:title="PDF File, 333 KB"/></supplementary-material></app-group></back></article>