<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e67767</article-id><article-id pub-id-type="doi">10.2196/67767</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Web-Based Explainable Machine Learning-Based Drug Surveillance for Predicting Sunitinib- and Sorafenib-Associated Thyroid Dysfunction: Model Development and Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Chan</surname><given-names>Fan-Ying</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ku</surname><given-names>Yi-En</given-names></name><degrees>BSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lie</surname><given-names>Wen-Nung</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Chen</surname><given-names>Hsiang-Yin</given-names></name><degrees>PharmD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Clinical Pharmacy, College of Pharmacy, Taipei Medical University</institution><addr-line>250 Wuxing St, Xinyi Dist</addr-line><addr-line>Taipei</addr-line><country>Taiwan</country></aff><aff id="aff2"><institution>Department of Electrical Engineering, National Chung Cheng University</institution><addr-line>Chiayi</addr-line><country>Taiwan</country></aff><aff id="aff3"><institution>Department of Pharmacy, Wan Fang Hospital, Taipei Medical University</institution><addr-line>Taipei</addr-line><country>Taiwan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Vit</surname><given-names>Abigail Paradise</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Guo</surname><given-names>Lei</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Hsiang-Yin Chen, PharmD, Department of Clinical Pharmacy, College of Pharmacy, Taipei Medical University, 250 Wuxing St, Xinyi Dist, Taipei, 11031, Taiwan, 886 2-2736-1661; <email>shawn@tmu.edu.tw</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>10</day><month>4</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e67767</elocation-id><history><date date-type="received"><day>23</day><month>10</month><year>2024</year></date><date date-type="rev-recd"><day>03</day><month>03</month><year>2025</year></date><date date-type="accepted"><day>04</day><month>03</month><year>2025</year></date></history><copyright-statement>&#x00A9; Fan-Ying Chan, Yi-En Ku, Wen-Nung Lie, Hsiang-Yin Chen. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 10.4.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2025/1/e67767"/><abstract><sec><title>Background</title><p>Unlike one-snap data collection methods that only identify high-risk patients, machine learning models using time-series data can predict adverse events and aid in the timely management of cancer.</p></sec><sec><title>Objective</title><p>This study aimed to develop and validate machine learning models for sunitinib- and sorafenib-associated thyroid dysfunction using a time-series data collection approach.</p></sec><sec sec-type="methods"><title>Methods</title><p>Time series data of patients first prescribed sunitinib or sorafenib were collected from a deidentified clinical research database. Logistic regression, random forest, adaptive Boosting, Light Gradient-Boosting Machine, and Gradient Boosting Decision Tree were used to develop the models. Prediction performances were compared using the accuracy, precision, recall, F1-score, area under the receiver operating characteristic curve, and area under the precision-recall curve. The optimal threshold for the best-performing model was selected based on the maximum F1-score. SHapley Additive exPlanations analysis was conducted to assess feature importance and contributions at both the cohort and patient levels.</p></sec><sec sec-type="results"><title>Results</title><p>The training cohort included 609 patients, while the temporal validation cohort had 198 patients. The Gradient Boosting Decision Tree model without resampling outperformed other models, with area under the precision-recall curve of 0.600, area under the receiver operating characteristic curve of 0.876, and F1-score of 0.583 after adjusting the threshold. The SHapley Additive exPlanations analysis identified higher cholesterol levels, longer summed days of medication use, and clear cell adenocarcinoma histology as the most important features. The final model was further integrated into a web-based application.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This model can serve as an explainable adverse drug reaction surveillance system for predicting sunitinib- and sorafenib-associated thyroid dysfunction.</p></sec></abstract><kwd-group><kwd>thyroid dysfunction</kwd><kwd>machine learning</kwd><kwd>cancer</kwd><kwd>sunitinib</kwd><kwd>sorafenib</kwd><kwd>TKI</kwd><kwd>tyrosine kinase inhibitor</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>Sunitinib- and sorafenib-associated thyroid dysfunction are time-varying and underreported adverse drug reactions (ADR). Despite the efficacy of multitargeted tyrosine kinase inhibitors TKI as first- or second-line therapies for solid and hematologic cancers, thyroid dysfunction&#x2014;especially hypothyroidism&#x2014;may complicate treatment regimens using sunitinib and sorafenib. Although not life-threatening, such adverse events can lead to a suboptimal quality of life, physical discomfort, or the need for thyroid dysfunction treatment [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Incidences of thyroid dysfunction vary from 10%- to 85% for sunitinib and from 6.3% to 27% for sorafenib [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. Hypothyroidism develops late and is prolonged, with onset ranging from 5 to 20 months [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. Due to its high variability and difficulty in predicting, close monitoring and proactive ADR surveillance with machine learning (ML) models may be warranted to manage sunitinib- and sorafenib-associated thyroid dysfunction.</p><p>Incorporating real-time laboratory data can enhance the performance of ML models in predicting thyroid adverse events. Previous studies have demonstrated the effectiveness of ML in predicting thyroid dysfunction, such as amiodarone-induced dysfunction using time-series data collection methods with a robust performance [<xref ref-type="bibr" rid="ref9">9</xref>]. In contrast, predicting immune checkpoint inhibitor-induced adverse thyroid events without continuous laboratory testing resulted in an area under the precision-recall curve (AUPRC) of 0.510 [<xref ref-type="bibr" rid="ref10">10</xref>]. Another study developed a predictive model for immune checkpoint inhibitor-induced adverse thyroid events without detailed time-point data collection, achieving an area under the receiver operating characteristic curve (AUROC) of 0.885 with thyroid-related features [<xref ref-type="bibr" rid="ref11">11</xref>]. However, no studies have focused on predicting thyroid adverse events caused by TKIs such as sunitinib and sorafenib. Adopting timely data collection with detailed clinical biochemical tests to develop thyroid dysfunction surveillance systems can help clinicians timely adjust TKI treatment by balancing risks and benefits.</p><p>Applying model interpretation and web-based applications can alleviate the black-box drawback of ML models and enhance understanding of ADRs. The SHapley Additive exPlanations (SHAP) analysis is a mathematical method that has become increasingly popular for explaining ML models [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. It is based on game theory concepts that calculate feature importance and contributions to predicted outcomes at both population and individual levels [<xref ref-type="bibr" rid="ref15">15</xref>]. Model deployment in web-based or smartphone applications were constructed in recent years to strengthen the scalability of predicting specific diseases or ADRs [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Through a user-friendly interface and explainable model, applications can provide clinicians with a greater understanding and actionable preventive remedies for their patients. These techniques successfully have increased the interpretability and accessibility of ML models to support clinical decision-making.</p><p>The landscape of drug surveillance has experienced notable changes, shifting from passive reporting systems or rules-based alerting systems to active identification of adverse drug events, driven by advancements in electronic health records and artificial intelligence. Traditional methods often rely on spontaneous reporting or rules-based alerting, which may lead to underreporting and delays in identifying ADRs. The ML models, particularly tree-based algorithms, can analyze large-scale clinical data in real time, proactively detecting ADRs and enhancing medication safety at the point of care [<xref ref-type="bibr" rid="ref18">18</xref>]. By continuously collecting and analyzing patient data, ML-driven drug surveillance based on time-series data extraction enables dynamic risk assessment, facilitating early intervention and personalized treatment adjustments. Given the underreported and time-varying nature of thyroid dysfunction, this progressive approach can serve as a valuable tool for predicting ADRs in patients undergoing TKI therapy.</p></sec><sec id="s1-2"><title>Objective</title><p>The objective of this study was to develop and validate progressive ML predictive models for sunitinib- and sorafenib-induced thyroid dysfunction. Five algorithms&#x2014;logistic regression (LR), random forest (RF), Gradient Boosting Decision Tree (GBDT), Light Gradient Boosting Machine (LGBM), and Adaptive Boosting (AdaBoost)&#x2014;were used to construct the models. The specific aims of this study were (1) to use time-series data collected at the baseline, and at 1, 2, 3, 4, 5, 6, 9, 12, 18, 24, 30, and 36 months after the index date to generate predictive models using the five algorithms; (2) to select the best model by comparing the accuracy, precision, recall, F1-score, AUROC, and AUPRC, after adjusting for the optimal threshold; (3) to interpret the best-performing model with a SHAP analysis to analyze feature importance levels and contributions, comparing findings with a previous amiodarone-induced thyroid dysfunction predictive model; and (4) to deploy the best-performing model by constructing a web-based application.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethical Considerations</title><p>This retrospective study used the deidentified Clinical Research Database (CRD) which includes data from Taipei Medical University Hospital, Wan Fang Hospital, and Shuang Ho Hospital of the TMU health care system. Ethical review for this study was waived by the TMU-Joint Institutional Review Board (approval no.: N202202053). As the data had been deidentified, the requirement for informed consent was waived. No compensation was provided to the participants.</p></sec><sec id="s2-2"><title>Study Design and Patient Cohort</title><p>Data from patients who were first prescribed sunitinib or sorafenib from 2013 to 2019 were collected as the derivation (training) cohort, whereas data from patients treated between 2010 and 2012 were collected as a temporal validation (testing) cohort. The data-splitting time point was chosen considering a common proportion of 7:3 for the training and testing cohorts and similar incidences of thyroid dysfunction in both cohorts for better model development and validation. More recent data were used for model training to better reflect current clinical practice, allowing models to be developed with up-to-date treatment patterns and patient characteristics. Patients were excluded if they were younger than 18 years, pregnant, with a history of hypothyroidism, had a diagnosis of thyroid carcinoma, had undergone thyroidectomy, used levothyroxine, or had abnormal thyroid-stimulating hormone (TSH) levels within 1 year before the index date, which was the first day of sunitinib or sorafenib use. Patients were also excluded if they were lost to follow up. Each individual was followed up for 3 years, and data were collected until the end of the study period, loss to follow-up, death, or occurrence of thyroid dysfunction. <xref ref-type="fig" rid="figure1">Figure 1</xref> demonstrates the study design of the proposed models. This study followed the Transparent Reporting of a multivariable prediction model for Individual Prognosis Or Diagnosis&#x2009;+&#x2009;Artificial Intelligence (TRIPOD&#x2009;+&#x2009; AI) reporting guideline [<xref ref-type="bibr" rid="ref19">19</xref>]. Registration was not required, and no separate study protocol was prepared.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Study design of the proposed models. The study process included data collection, data splitting, data preprocessing, feature selection, resampling, model development, model validation, threshold adjustment, model interpretation, and development of a web-based application. AdaBoost: Adaptive Boosting; AUPRC: area under the precision recall curve; AUROC: area under the receiver operating characteristic curve; B-SMT: Oversampling with the Borderline Synthetic Minority Oversampling Technique; CRD: clinical research database; GBDT: Gradient Boosting Decision Tree; LGBM: Light Gradient Boosting Machine; RFECV: Recursive Feature Elimination with Cross-Validation; SMT: Synthetic Minority Oversampling Technique; TMU: Taipei Medical University.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e67767_fig01.png"/></fig></sec><sec id="s2-3"><title>Time-Series Data Collection and Preprocessing</title><p>Variables including patient demographics, cancer-related information, medication use, laboratory tests, coexisting drugs, and comorbidities were collected from the CRD. Patient demographics including age, gender, and cancer-related information were collected once at the baseline. Laboratory tests, medication use, comorbidities, coexisting drugs, weight, and body mass index (BMI) were collected at the baseline, and at 1, 2, 3, 4, 5, 6, 9, 12, 18, 24, 30, and 36 months after the index date (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Reengineering features included calculating the cumulative dose, summed days of medication, duration of sunitinib or sorafenib, and the slope of laboratory tests at recent and previous data collection time points. The number of coexisting thyroid-related drugs was calculated to determine whether the aggregated use of these medications increased the risk of thyroid dysfunction.</p><p>Data preprocessing including missing value imputation and feature scaling was performed to ensure data quality. Features with over 80% missing values, except for the TSH level, were first excluded from the model. Missing values were imputed using multivariate imputation by chained equations [<xref ref-type="bibr" rid="ref20">20</xref>]. If previous data were traceable, missing values, using time-series data collection, were precisely imputed using the last observation carried forward. Missing values in laboratory test slopes were imputed with zero. A feature-scaling method&#x2014;the robust scaler&#x2014;was used to reduce the effect of extreme values of continuous variables. Features were first selected through a literature review and clinical domain knowledge to identify thyroid-related variables. Recursive feature elimination, a feature selection technique that recursively removes the least important features with 5-fold cross-validation was then used, and the AUROC was considered to select optimal features for each model. The codebook and missing rates of each variable in the training and testing set are described in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p></sec><sec id="s2-4"><title>Prediction Outcome</title><p>The predictive outcome of this study was the occurrence of sunitinib- or sorafenib-associated thyroid dysfunction. Patients were defined as a TSH level &#x2265;4 mIU/L, a diagnosis of hypothyroidism with International Classification of Diseases codes (<italic>ICD-9-CM</italic>; <italic>243</italic> or <italic>244</italic> or <italic>ICD-10</italic>; <italic>E02</italic> or <italic>E03)</italic>, or use of levothyroxine (Anatomical Therapeutic Chemical code: H03AA02). These criteria were defined following previous studies that focused on drug-induced thyroid dysfunction [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>].</p></sec><sec id="s2-5"><title>Model Development and Validation</title><p>The study used three resampling strategies and raw data applied to the five algorithms to develop 20 machine learning models. The five algorithms included LR, RF, AdaBoost [<xref ref-type="bibr" rid="ref23">23</xref>], LGBM [<xref ref-type="bibr" rid="ref24">24</xref>], and GBDT [<xref ref-type="bibr" rid="ref25">25</xref>]. Resampling strategies used were random over-sampling (ROS), borderline synthetic minority oversampling technique (B-SMT), and a combination of over- and under-sampling using SMT and Tomek links (STMK). Bayesian optimization with 5-fold cross-validation and the AUPRC were considered for hyperparameter tuning [<xref ref-type="bibr" rid="ref26">26</xref>]. For boosting models, hyperparameters such as learning_rate and n_estimators were optimized to balance convergence speed and model complexity. Specifically, in LGBM, subsample and colsample_bytree were fine-tuned to mitigate overfitting. Key parameters including max_depth, min_samples_split, and min_samples_leaf were adjusted to improve generalization and prevent overfitting for RF. Table S3.1 in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> lists the ranges of hyperparameters used for tuning in each algorithm. Pseudocodes of the model development process are listed in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p><p>A stratified 5-fold cross-validation was first used for internal validation of the training dataset, and the performances of the 20 models were evaluated using the temporal validation cohort. The accuracy, precision, recall, F1-score, AUROC, and AUPRC were the metrics used for evaluating model performance. Model performance was compared and evaluated following the sequence of the highest AUPRC, AUROC value, and F1-score to select the best-performing model.</p></sec><sec id="s2-6"><title>Threshold Adjustment, Model Interpretation, and Web-Based Application</title><p>To optimize the performance of the best-performing model, different thresholds were selected on the PRC based on different percentages of outcome predictions. Five cutoff points were chosen: (1) a high-risk threshold for identifying a lower number of patients potentially at risk; (2) a default threshold of 0.50; (3) an optimal threshold based on the maximum F1-score; (4) an equal threshold where precision, recall, and F1-score were equal, and (5) the low-risk threshold for identifying a higher number of patients potentially at risk. The F1-score, recall, precision, and accuracy were then compared for these 5 thresholds. The best model was further examined by SHAP analysis to explain feature importance and contribution at both the population and individual levels [<xref ref-type="bibr" rid="ref27">27</xref>]. At the population level, SHAP summary plots were used to demonstrate feature importance and how the top-ranked features impacted outcome predictions. On the other hand, SHAP force plots were used to visualize how the features contributed to outcome predictions in specific patients.</p><p>The model was further integrated into a web-based application to increase the accessibility of the model. The Python Flask framework was used to develop the application programming interface. The value of each feature served as input data that were fed back into the model to generate a predictive probability of thyroid dysfunction. The consistency of feature scaling between input data and training data was ensured by applying the same scaling transformation. The input variables with missing values were imputed with the last observation or the same multivariate imputation by chained equations transformation applied during model development to ensure consistency in predictions.</p></sec><sec id="s2-7"><title>Statistical Analysis</title><p>Patient characteristics were evaluated with independent <italic>t</italic> tests or the Wilcoxon rank-sum test for continuous variables, and the <italic>&#x03C7;</italic><sup>2</sup> test or Fisher exact test for categorical variables. A two-sided <italic>P</italic> value &#x003C;.05 was considered statistically significant. Data were analyzed using SAS (version 9.4; SAS Institute), Python (version 3.9.5; Python Software Foundation), and R software (version 4.2.2; R Foundation for Statistical Computing). The statistical significance of the AUPRC was calculated using MedCalc software (version 22.001).</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Patient Characteristics and Multivariate Analysis</title><p>This study enlisted data from 900 patients prescribed sunitinib or sorafenib from initial screening from the CRD. A STROBE (Strengthening The Reporting of Observational Studies in Epidemiology) flowchart of patient selection is described in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>. After applying the exclusion criteria, 807 patients remained. Patient characteristics and multivariate analysis of the training and temporal validation cohorts are listed in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>. The training cohort contained 609 patients, with 52 (8.5%) patients developing thyroid dysfunction, while 16 (8.1%) patients experienced thyroid dysfunction in the temporal validation cohort of 198 patients. There were no significant differences in age or gender in the derivation or temporal validation cohort. Cancer type, histology, aspartate aminotransferase (AST), and bilirubin levels significantly differed (<italic>P</italic>&#x003C;.001) between patients with and those without thyroid dysfunction in the two cohorts.</p></sec><sec id="s3-2"><title>Model Development and Validation</title><p>The total number of features selected by recursive feature elimination were 20, 18, 15, 40, and 20 in GBDT, AdaBoost, LGBM, RF, and LR, respectively. The most frequently selected features were recent laboratory tests including AST, alanine transaminase (ALT), bilirubin, cholesterol, and triglyceride levels. Patient demographics such as age and BMI summed days of medication use, and follow-up duration were also among the top-ranked selected features (<xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>). The optimal hyperparameter subsets selected by Bayesian optimization are listed in Table S3.2 in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p><p><xref ref-type="fig" rid="figure2">Figure 2</xref> shows the model performance based on the AUPRC, AUROC, F1-score, precision, recall, and accuracy in 20 ML models of the temporal validation cohort. Most of the GBDT and AdaBoost models had higher AUPRC values and F1-scores, while recall was higher in the RF and LR models. Of all the ML models, the GBDT without resampling (GBDT_RAW) outperformed the other models, with an AUPRC of 0.600, AUROC of 0.876, and an F1-score of 0.522. The AUPRC of GBDT_RAW (0.600, 95% CI 0.350-0.798) was significantly higher than those of the GBDT_ROS (0.388, 95% CI 0.175&#x2010;0.618; <italic>P</italic>&#x003C;.05), GBDT_BMST (0.300, 95% CI 0.124&#x2010;0.549; <italic>P</italic>&#x003C;.05), and GBDT_STMK (0.346, 95% CI 0.147&#x2010;0.582; <italic>P</italic>&#x003C;.05). <xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref> lists model performances of 5-fold cross-validation with the training cohort and the statistical significance tests of the AUPRC of all the models.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Model performance on temporal validation. The model performance evaluated by the six metrics is demonstrated in a heatmap. Blue and green colors represent higher and lower values, respectively. ROS: random oversampling; BSMT: Oversampling with Borderline Synthetic Minority Oversampling Technique; STMK: Synthetic Minority Oversampling Technique-Tomek Links; GBDT: Gradient Boosting Decision Tree; AdaBoost: Adaptive Boosting; LGBM: Light Gradient Boosting Machine; RF: random forest; LR: logistic regression; AUPRC: area under the precision-recall curve; AUROC: area under the receiver operating characteristic curve.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e67767_fig02.png"/></fig></sec><sec id="s3-3"><title>Threshold Adjustment</title><p><xref ref-type="fig" rid="figure3">Figure 3</xref> shows the five cutoff points on the PRC and the precision, recall, and F1-score at different thresholds of the GBDT_RAW model. Based on different percentages of outcome predictions, cutoff points were 0.851 for identifying the top 1% of patients (2 predictive positive cases, point A &#x2014; high-risk threshold),0.500 for the top 3.5% (7 predictive positive cases, point B &#x2014; default threshold), 0.495 for the top 4% (8 predictive positive cases, point C &#x2014; optimal threshold based on the maximum F1-score), 0.272 for the top 8% (16 predictive positive cases, point D &#x2014; equal threshold), and 0.071 for the top 26% of patients (51 predictive positive cases, point E &#x2014; low-risk threshold). When moving the threshold from 0.500 to 0.851 (point A), the precision increased from 0.875 to 1.000, while recall significantly decreased to 0.125. In contrast, recall significantly increased to 0.750 and the precision decreased to 0.231 when changing the threshold to 0.066 (point E). The precision, recall, and F1-score reached 0.500 when the threshold was adjusted to 0.272 (point D). The optimal threshold of 0.495 (point C) for the GBDT_RAW model was selected based on the maximum F1-score, with a precision of 0.875, recall of 0.438, and F1-score of 0.583.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Threshold adjustment for the GBDT_RAW model. The five cutoff points on the precision-recall curve (A) represent different percentages of outcome predictions, precision, recall, and F1-scores based on different thresholds; (B) ,The X-axis represents the value of the threshold and the Y-axis shows values of the precision, recall, and F1-score.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e67767_fig03.png"/></fig></sec><sec id="s3-4"><title>Model Interpretation</title><p><xref ref-type="fig" rid="figure4">Figure 4</xref> shows model interpretation implemented with the SHAP analysis on the best-performing GBDT_RAW model. The summary plot in <xref ref-type="fig" rid="figure4">Figure 4A</xref> displays that the top five important predictors were the AST level, TG level, follow-up duration, cholesterol level, and albumin level. <xref ref-type="fig" rid="figure4">Figure 4B</xref> shows that patients with lower AST levels, higher cholesterol levels, higher albumin levels, longer durations of medication use, and clear cell adenocarcinoma histology had higher SHAP values for predicting the occurrence of thyroid dysfunction. At the individual level, force plots showed the impacts of features on predicting thyroid dysfunction in two specific patients. <xref ref-type="fig" rid="figure4">Figure 4C</xref> shows a patient with a predictive probability of 0.02, resulting from his AST level of 69 IU/L and the summed days of medications of 62 days, which contributed most negatively to outcome predictions. For a patient with a predictive probability of 0.82 in <xref ref-type="fig" rid="figure4">Figure 4D</xref>, the medication duration of 708 days and clear cell adenocarcinoma served as the most important factors that positively impacted outcome predictions.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Model interpretation with a SHAP analysis for the GBDT_RAW model. At the population level, the summary bar plot (A) Mean SHAP values of all features, and a summary dot plot; (B) shows how each feature impacted the outcome prediction. The x-axis shows SHAP values of all features, and the colors represent the feature values, with red and blue respectively demonstrating higher and lower values. At the individual level, force plots in (C) and (D) show how features contributed to the model output value in each patient. Red and blue arrows represent positive and negative contributions of features, and the length of the arrow shows the magnitude of the impact on outcome predictions. LAB_AST: recent aspartate aminotransferase level; LAB_TG: recent triglyceride level; PRED_DUR: follow-up days; LAB_Cholesterol: recent cholesterol level; LAB_Albumin: recent albumin level; LAB_AST_SLOPE: slope of aspartate aminotransferase level; MED_SUM: sum days of medication; LAB_MCV_SLOPE: slope of mean corpuscular volume; PRE_Hb: previous hemoglobin level; PRE_ALT: previous alanine transaminase level; LAB_MCH: recent mean corpuscular haemoglobin level; LAB_SCr: recent serum creatinine level; LAB_Hct_SLOPE: slope of hematocrit level; MED_DUR: duration of medication; PRE_MCHC: previous mean corpuscular hemoglobin concentration level; LAB_SCr_SLOPE: slope of serum creatinine level; LAB_MCHC_SLOPE: slope of mean corpuscular hemoglobin concentration level.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e67767_fig04.png"/></fig></sec><sec id="s3-5"><title>Web-Based Application</title><p>A web-based application for predicting sunitinib- and sorafenib-associated thyroid dysfunction was developed using the GBDT_RAW model (<xref ref-type="fig" rid="figure5">Figure 5</xref>). The application provides a user-friendly interface by showing 20 features selected by the GBDT model. Values of the features can be filled in with the appropriate units shown in each input box. The model then generates a predictive probability for the risk of sunitinib- or sorafenib-associated thyroid dysfunction. Ultimate predictions for the occurrence of thyroid dysfunction were determined based on thresholds adopted by clinical users.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Web-based application with a user-friendly interface. A web-based application developed using the GBDT_RAW model showing 20 selected features selected and the predictive probability.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e67767_fig05.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study developed explainable ML models by collecting time-series data to predict sunitinib- and sorafenib-associated thyroid dysfunction. The present model allowed ongoing predictions according to the rapidly shifting status of the disease for patients undergoing long-term TKI treatment. The best-performing GBDT without resampling model was optimized by threshold moving strategies to achieve a maximum F1-score. This study further used a SHAP analysis that provided interpretability at both the population and individual levels, identifying key predictors such as AST, cholesterol, and albumin levels. The feature selection process revealed similarities with prior research on amiodarone-induced thyroid dysfunction, supporting the model&#x2019;s potential applicability to other drug-induced thyroid dysfunctions [<xref ref-type="bibr" rid="ref9">9</xref>]. Integrating the model into a web-based application demonstrated its practical utility by allowing real-time risk estimation based on patient-specific data.</p></sec><sec id="s4-2"><title>Time-Series Data Collection</title><p>Time-series data collection in this study had a few advantages for thyroid dysfunction predictions on TKI users as illustrated in <xref ref-type="fig" rid="figure6">Figure 6</xref>. Clinical data at multiple time points in a long-term follow-up period were collected for model building. Time-series data allowed reengineering features by calculating rates of change of laboratory tests at recent and previous time points. The last observation carried forward method using the last value to replace missing data in subsequent time points ensured that missing values were imputed with plausible estimates [<xref ref-type="bibr" rid="ref28">28</xref>]. This time-series data collection closely monitored patients newly prescribed TKI users and those on long-term TKI therapy. The time-series model captured the critical moment of an approaching adverse event for an individual patient, providing oncologists with invaluable information to treat patients on TKIs.</p><p>Identifying thyroid dysfunction was reported to potentially serve as a prognostic indicator for treatment outcomes. Sunitinib and sorafenib respectively demonstrated progression-free survival (PFS) periods of 11 and 5.5 months in patients with renal cell carcinoma [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. Interestingly, studies indicated that patients with thyroid dysfunction had a longer PFS compared to patients with normal thyroid function among sunitinib (11.9 vs 8.8 months) and sorafenib users (19.3 vs 5.5 months) [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. These findings suggest that thyroid dysfunction may not only represent an adverse event but could serve as a marker of enhanced therapeutic response. Leveraging a time-series data collection approach, this study can predict thyroid dysfunction risk while simultaneously identifying patients who may derive greater clinical benefits from sustained TKI therapy. Unlike one-snap data collection which arbitrarily differentiates high-risk patients from a low-risk group, this time-series approach allows high-risk patients to use lifesaving TKIs for a relatively longer grace period which can significantly enhance their survival times. Models with time-series data collection balance the risks and benefits of survival and adverse drug events, bestowing precious survival periods for end-stage cancer patients with reasonable medication safety and improved quality of life.</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Graphic comparison of one-snap and time-series data collection methods. Time-series and one-snap data collection methods were compared. The dashed line represents possible changes in variables during a long-term follow-up period. LOCF: Last Observation Carried Forward</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e67767_fig06.png"/></fig></sec><sec id="s4-3"><title>Best-Performing Model With Threshold Adjustment</title><p>The GBDT_RAW model outperformed other machine learning models in this study, with thresholds adjusted to optimize model performance. The gradient boosting method analyzed nonlinear relationships and handled imbalanced data to predict diagnoses, hospital readmissions, and clinical outcomes [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. During the hyperparameter tuning process, the AUPRC was considered, rather than the F1-score, without adjusting the threshold for imbalanced data [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. The model without resampling outperformed resampling approaches by maintaining high precision, while the sparsity of the minority class in this study probably caused resampling to introduce noise or unrealistic synthetic data, failing to improve recall. The final model then used five cutoff points on the PRC to decide optimal thresholds and percentages of positive predictions. A relatively low threshold can identify all patients at risk but may increase the number of false positives, overwhelming clinicians with numerous warnings to review. On the contrary, choosing a relatively high threshold reduces the number of false positives but increases the chances of missing true positive cases. The selected threshold increased the precision, recall, and F1-score of the model&#x2019;s performance, while considering the relative costs of false positives and false negatives to meet clinical needs [<xref ref-type="bibr" rid="ref37">37</xref>].</p></sec><sec id="s4-4"><title>Model Interpretation and Potential for Model Expansion</title><p>Similar features for predicting drug-induced thyroid dysfunction were selected by the presence of TKIs and a previous amiodarone model built by our research team [<xref ref-type="bibr" rid="ref9">9</xref>]. The feature selection process identified age, BMI, medication duration, summed days of medication, rate of change in serum creatinine levels, and recent mean corpuscular hemoglobin, AST, and cholesterol levels as key predictors of thyroid dysfunction in this study. Interestingly, these same features were also selected in our previous amiodarone model, suggesting their potential relevance across different drug-induced thyroid dysfunction models. Similar features highlight the potential for model expansion to increase generalizability. Top-ranked features identified in this study and their contributions calculated by the SHAP analysis were aligned with clinical domain knowledge. Higher cholesterol levels were found to positively impact predictions, which can be explained by the effect of thyroid function on lipoprotein metabolism [<xref ref-type="bibr" rid="ref38">38</xref>]. The present study also found that longer summed days of medication increased the risk of thyroid dysfunction. This finding was confirmed by a long-term safety study of sunitinib, which showed the frequency of thyroid dysfunction, unlike other adverse events, gradually increased over time [<xref ref-type="bibr" rid="ref39">39</xref>]. The AST level and histology of clear cell carcinoma served as important predictors, which may have resulted from a relatively lower incidence of thyroid dysfunction in patients with hepatocellular carcinoma and renal cell carcinoma.</p></sec><sec id="s4-5"><title>Clinical Implications of Web-Based Drug Surveillance</title><p>ML-based drug surveillance provides a promising tool for predicting and managing thyroid dysfunction caused by TKIs. Traditional clinical decision support systems (CDSS) rely on rule-based alerts for drug interactions or contraindications but often fail to capture the multifactorial nature of drug-induced thyroid dysfunction, which depends on thyroid-related factors [<xref ref-type="bibr" rid="ref40">40</xref>]. AI-driven CDSSs, leveraging ML algorithms, can overcome these limitations by identifying complex patterns in patient data, providing personalized risk assessments, and generating timely alerts for thyroid function monitoring. Deploying such ML models on cloud-based platforms alongside rule-based CDSSs could enhance real-time risk stratification, enabling early detection, intervention, and potential adjustments in therapy to prevent endocrine complications. Further exploration of CDSSs incorporating ML predictions are warranted to improve clinical practice and medication safety [<xref ref-type="bibr" rid="ref40">40</xref>].</p></sec><sec id="s4-6"><title>Limitations</title><p>There are a few limitations of this study. Data were from a single healthcare system and included limited numbers of sunitinib- or sorafenib-treated patients. There were missing data in the diagnosis of comorbidities and medication use. The nature of a retrospective study introduces underestimations of the incidence of thyroid dysfunction. As a result, different features selected by the present model and our previous amiodarone model mainly resulted from features with higher missing rates. Multicenter and multicountry studies for improving model extrapolation are needed before clinical application. Future qualitative research and prospective studies with the involvement of physicians should also be conducted to assess the usability and accessibility of the model for real-world evidence.</p></sec><sec id="s4-7"><title>Conclusions</title><p>This study applied time-series data collection to capture the critical moment of sunitinib- and sorafenib-associated thyroid dysfunction for ADR surveillance. The optimal threshold can balance the precision and recall meeting clinical needs. Feature importance was explained at the population and individual levels. The web-based application increased the model accessibility, allowing clinical users to receive real-time predictions. The comparison of features with amiodarone-induced thyroid dysfunction highlighted the potential for future model expansion.</p></sec></sec></body><back><ack><p>This work was supported by the National Science and Technology Council (NSTC) [grant no. NSTC-113-2320-B-038-057].</p></ack><notes><sec><title>Data Availability</title><p>The data were obtained from the Taipei Medical University clinical research database; this was approved by the Institutional Review Board of Taipei Medical University (TMU-JIRB-N202202053). The data and web-based application are available from the corresponding author upon reasonable requests, subject to appropriate request mechanisms and additional Institutional Review Board approval for personal information protection.</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AdaBoost</term><def><p>Adaptive Boosting</p></def></def-item><def-item><term id="abb2">ADR</term><def><p>adverse drug reaction</p></def></def-item><def-item><term id="abb3">ALT</term><def><p>alanine transaminase</p></def></def-item><def-item><term id="abb4">AST</term><def><p>aspartate aminotransferase</p></def></def-item><def-item><term id="abb5">AUPRC</term><def><p>area under the precision recall curve</p></def></def-item><def-item><term id="abb6">AUROC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb7">CDSS</term><def><p>clinical decision support systems</p></def></def-item><def-item><term id="abb8">CRD</term><def><p>clinical research database</p></def></def-item><def-item><term id="abb9">GBDT </term><def><p>Gradient Boosting Decision Tree</p></def></def-item><def-item><term id="abb10">LGBM</term><def><p>Light Gradient Boosting Machine</p></def></def-item><def-item><term id="abb11">LR</term><def><p>logistic regression</p></def></def-item><def-item><term id="abb12">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb13">RF</term><def><p>random forest</p></def></def-item><def-item><term id="abb14">TKI</term><def><p>tyrosine kinase inhibitor</p></def></def-item><def-item><term id="abb15">TMUH</term><def><p> Taipei Medical University Hospital</p></def></def-item><def-item><term id="abb16">TRIPOD+AI</term><def><p>Transparent reporting of a multivariable prediction model for individual prognosis or diagnosis + artificial intelligence</p></def></def-item><def-item><term id="abb17">TSH</term><def><p>thyroid-stimulating hormone</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Torino</surname><given-names>F</given-names> </name><name name-style="western"><surname>Corsello</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Longo</surname><given-names>R</given-names> </name><name name-style="western"><surname>Barnabei</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gasparini</surname><given-names>G</given-names> </name></person-group><article-title>Hypothyroidism related to tyrosine kinase inhibitors: an emerging toxic effect of targeted therapy</article-title><source>Nat Rev Clin Oncol</source><year>2009</year><month>04</month><volume>6</volume><issue>4</issue><fpage>219</fpage><lpage>228</lpage><pub-id pub-id-type="doi">10.1038/nrclinonc.2009.4</pub-id><pub-id pub-id-type="medline">19333228</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abdel-Rahman</surname><given-names>O</given-names> </name><name name-style="western"><surname>Fouad</surname><given-names>M</given-names> </name></person-group><article-title>Risk of thyroid dysfunction in patients with solid tumors treated with VEGF receptor tyrosine kinase inhibitors: a critical literature review and meta analysis</article-title><source>Expert Rev Anticancer Ther</source><year>2014</year><month>09</month><volume>14</volume><issue>9</issue><fpage>1063</fpage><lpage>1073</lpage><pub-id pub-id-type="doi">10.1586/14737140.2014.929501</pub-id><pub-id pub-id-type="medline">24927771</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Walko</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Aubert</surname><given-names>RE</given-names> </name><name name-style="western"><surname>La-Beck</surname><given-names>NM</given-names> </name><etal/></person-group><article-title>Pharmacoepidemiology of clinically relevant hypothyroidism and hypertension from sunitinib and sorafenib</article-title><source>Oncologist</source><year>2017</year><month>02</month><volume>22</volume><issue>2</issue><fpage>208</fpage><lpage>212</lpage><pub-id pub-id-type="doi">10.1634/theoncologist.2016-0233</pub-id><pub-id pub-id-type="medline">28167571</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vasileiadis</surname><given-names>T</given-names> </name><name name-style="western"><surname>Chrisofos</surname><given-names>M</given-names> </name><name name-style="western"><surname>Safioleas</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kontzoglou</surname><given-names>K</given-names> </name><name name-style="western"><surname>Papazisis</surname><given-names>K</given-names> </name><name name-style="western"><surname>Sdrolia</surname><given-names>A</given-names> </name></person-group><article-title>&#x0399;mpact of sunitinib-induced hypothyroidism on survival of patients with metastatic renal cancer</article-title><source>BMC Cancer</source><year>2019</year><month>04</month><day>30</day><volume>19</volume><issue>1</issue><fpage>407</fpage><pub-id pub-id-type="doi">10.1186/s12885-019-5610-8</pub-id><pub-id pub-id-type="medline">31039771</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Kudelka</surname><given-names>A</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>X</given-names> </name></person-group><article-title>Incidence and risk of hypertension with sorafenib in patients with cancer: a systematic review and meta-analysis</article-title><source>Lancet Oncol</source><year>2008</year><month>02</month><volume>9</volume><issue>2</issue><fpage>117</fpage><lpage>123</lpage><pub-id pub-id-type="doi">10.1016/S1470-2045(08)70003-2</pub-id><pub-id pub-id-type="medline">18221915</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sabatier</surname><given-names>R</given-names> </name><name name-style="western"><surname>Eymard</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Walz</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Could thyroid dysfunction influence outcome in sunitinib-treated metastatic renal cell carcinoma?</article-title><source>Ann Oncol</source><year>2012</year><month>03</month><volume>23</volume><issue>3</issue><fpage>714</fpage><lpage>721</lpage><pub-id pub-id-type="doi">10.1093/annonc/mdr275</pub-id><pub-id pub-id-type="medline">21653681</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Clemons</surname><given-names>J</given-names> </name><name name-style="western"><surname>Gao</surname><given-names>D</given-names> </name><name name-style="western"><surname>Naam</surname><given-names>M</given-names> </name><name name-style="western"><surname>Breaker</surname><given-names>K</given-names> </name><name name-style="western"><surname>Garfield</surname><given-names>D</given-names> </name><name name-style="western"><surname>Flaig</surname><given-names>TW</given-names> </name></person-group><article-title>Thyroid dysfunction in patients treated with sunitinib or sorafenib</article-title><source>Clin Genitourin Cancer</source><year>2012</year><month>12</month><volume>10</volume><issue>4</issue><fpage>225</fpage><lpage>231</lpage><pub-id pub-id-type="doi">10.1016/j.clgc.2012.08.002</pub-id><pub-id pub-id-type="medline">23017335</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jannin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Penel</surname><given-names>N</given-names> </name><name name-style="western"><surname>Ladsous</surname><given-names>M</given-names> </name><name name-style="western"><surname>Vantyghem</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Do Cao</surname><given-names>C</given-names> </name></person-group><article-title>Tyrosine kinase inhibitors and immune checkpoint inhibitors-induced thyroid disorders</article-title><source>Crit Rev Oncol Hematol</source><year>2019</year><month>09</month><volume>141</volume><fpage>23</fpage><lpage>35</lpage><pub-id pub-id-type="doi">10.1016/j.critrevonc.2019.05.015</pub-id><pub-id pub-id-type="medline">31202955</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lu</surname><given-names>YT</given-names> </name><name name-style="western"><surname>Chao</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Chiang</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>HY</given-names> </name></person-group><article-title>Explainable machine learning techniques to predict amiodarone-induced thyroid dysfunction risk: multicenter, retrospective study with external validation</article-title><source>J Med Internet Res</source><year>2023</year><month>02</month><day>7</day><volume>25</volume><fpage>e43734</fpage><pub-id pub-id-type="doi">10.2196/43734</pub-id><pub-id pub-id-type="medline">36749620</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>W</given-names> </name><name name-style="western"><surname>Cho</surname><given-names>YA</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Jo</surname><given-names>AR</given-names> </name><name name-style="western"><surname>Min</surname><given-names>KH</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>KE</given-names> </name></person-group><article-title>Factors associated with thyroid-related adverse events in patients receiving PD-1 or PD-L1 inhibitors using machine learning models</article-title><source>Cancers (Basel)</source><year>2021</year><month>10</month><day>30</day><volume>13</volume><issue>21</issue><fpage>21</fpage><pub-id pub-id-type="doi">10.3390/cancers13215465</pub-id><pub-id pub-id-type="medline">34771631</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Development and validation of a prediction model for thyroid dysfunction in patients during immunotherapy</article-title><source>Endocr Pract</source><year>2024</year><month>10</month><volume>30</volume><issue>10</issue><fpage>943</fpage><lpage>950</lpage><pub-id pub-id-type="doi">10.1016/j.eprac.2024.07.006</pub-id><pub-id pub-id-type="medline">39004306</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Deng</surname><given-names>H</given-names> </name><name name-style="western"><surname>Eftekhari</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Carlin</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Development and validation of an explainable machine learning model for major complications after cytoreductive surgery</article-title><source>JAMA Netw Open</source><year>2022</year><month>05</month><day>2</day><volume>5</volume><issue>5</issue><fpage>e2212930</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2022.12930</pub-id><pub-id pub-id-type="medline">35612856</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Identification and validation of an explainable prediction model of acute kidney injury with prognostic implications in critically ill children: a prospective multicenter cohort study</article-title><source>EClinicalMedicine</source><year>2024</year><month>02</month><volume>68</volume><fpage>102409</fpage><pub-id pub-id-type="doi">10.1016/j.eclinm.2023.102409</pub-id><pub-id pub-id-type="medline">38273888</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jiang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Bo</surname><given-names>L</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Interpretable machine-learning model for real-time, clustered risk factor analysis of sepsis and septic death in critical care</article-title><source>Comput Methods Programs Biomed</source><year>2023</year><month>11</month><volume>241</volume><fpage>107772</fpage><pub-id pub-id-type="doi">10.1016/j.cmpb.2023.107772</pub-id><pub-id pub-id-type="medline">37657148</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Slack</surname><given-names>D</given-names> </name><name name-style="western"><surname>Hilgard</surname><given-names>S</given-names> </name><name name-style="western"><surname>Jia</surname><given-names>E</given-names> </name><name name-style="western"><surname>Singh</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lakkaraju</surname><given-names>H</given-names> </name></person-group><article-title>Fooling LIME and SHAP: adversarial attacks on post hoc explanation methods</article-title><source>Proceedings of the AAAI/ACM Conference on AI, Ethics, and Society</source><year>2020</year><fpage>180</fpage><lpage>186</lpage><pub-id pub-id-type="doi">10.1145/3375627.3375830</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ma</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wan</surname><given-names>X</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>A novel explainable online calculator for contrast-induced AKI in diabetics: A multi-centre validation and prospective evaluation study</article-title><source>J Transl Med</source><year>2023</year><month>07</month><day>31</day><volume>21</volume><issue>1</issue><fpage>517</fpage><pub-id pub-id-type="doi">10.1186/s12967-023-04387-x</pub-id><pub-id pub-id-type="medline">37525240</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mosquera-Lopez</surname><given-names>C</given-names> </name><name name-style="western"><surname>Ramsey</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Roquemen-Echeverri</surname><given-names>V</given-names> </name><name name-style="western"><surname>Jacobs</surname><given-names>PG</given-names> </name></person-group><article-title>Modeling risk of hypoglycemia during and following physical activity in people with type 1 diabetes using explainable mixed-effects machine learning</article-title><source>Comput Biol Med</source><year>2023</year><month>03</month><volume>155</volume><fpage>106670</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.106670</pub-id><pub-id pub-id-type="medline">36803791</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Syrowatka</surname><given-names>A</given-names> </name><name name-style="western"><surname>Song</surname><given-names>W</given-names> </name><name name-style="western"><surname>Amato</surname><given-names>MG</given-names> </name><etal/></person-group><article-title>Key use cases for artificial intelligence to reduce the frequency of adverse drug events: a scoping review</article-title><source>Lancet Digit Health</source><year>2022</year><month>02</month><volume>4</volume><issue>2</issue><fpage>e137</fpage><lpage>e148</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(21)00229-6</pub-id><pub-id pub-id-type="medline">34836823</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Collins</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name><name name-style="western"><surname>Dhiman</surname><given-names>P</given-names> </name><etal/></person-group><article-title>TRIPOD+AI statement: updated guidance for reporting clinical prediction models that use regression or machine learning methods</article-title><source>BMJ</source><year>2024</year><month>04</month><day>16</day><volume>385</volume><fpage>e078378</fpage><pub-id pub-id-type="doi">10.1136/bmj-2023-078378</pub-id><pub-id pub-id-type="medline">38626948</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>van Buuren</surname><given-names>S</given-names> </name><name name-style="western"><surname>Oudshoorn</surname><given-names>CG</given-names> </name></person-group><source>Multivariate Imputation by Chained Equations</source><year>2000</year><publisher-name>Leiden: TNO</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://stefvanbuuren.name/publications/MICE%20V1.0%20Manual%20TNO00038%202000.pdf">https://stefvanbuuren.name/publications/MICE%20V1.0%20Manual%20TNO00038%202000.pdf</ext-link></comment><pub-id pub-id-type="other">90-6743-677-1</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kornelius</surname><given-names>E</given-names> </name><name name-style="western"><surname>Chiou</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>YS</given-names> </name><name name-style="western"><surname>Peng</surname><given-names>CH</given-names> </name><name name-style="western"><surname>Lai</surname><given-names>YR</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>CN</given-names> </name></person-group><article-title>Iodinated contrast media increased the risk of thyroid dysfunction: a 6-year retrospective cohort study</article-title><source>J Clin Endocrinol Metab</source><year>2015</year><month>09</month><volume>100</volume><issue>9</issue><fpage>3372</fpage><lpage>3379</lpage><pub-id pub-id-type="doi">10.1210/JC.2015-2329</pub-id><pub-id pub-id-type="medline">26168278</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Feldt</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sch&#x00FC;ssel</surname><given-names>K</given-names> </name><name name-style="western"><surname>Quinzler</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Incidence of thyroid hormone therapy in patients treated with sunitinib or sorafenib: a cohort study</article-title><source>Eur J Cancer</source><year>2012</year><month>05</month><volume>48</volume><issue>7</issue><fpage>974</fpage><lpage>981</lpage><pub-id pub-id-type="doi">10.1016/j.ejca.2012.01.036</pub-id><pub-id pub-id-type="medline">22382202</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Freund</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Schapire</surname><given-names>RE</given-names> </name></person-group><article-title>Experiments with a new boosting algorithm</article-title><source>ICML&#x2019;96: Proceedings of the Thirteenth International Conference on International Conference on Machine Learning</source><year>1996</year><month>07</month><fpage>148</fpage><lpage>156</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://cseweb.ucsd.edu/~yfreund/papers/boostingexperiments.pdf">https://cseweb.ucsd.edu/~yfreund/papers/boostingexperiments.pdf</ext-link></comment></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Ke</surname><given-names>G</given-names> </name><name name-style="western"><surname>Meng</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Finley</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Lightgbm: A highly efficient gradient boosting decision tree [abstract]</article-title><year>2017</year><access-date>2025-03-31</access-date><conf-name>31st Conference on Neural Information Processing Systems (NIPS 2017)</conf-name><conf-date>Dec 4-9, 2017</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://papers.nips.cc/paper_files/paper/2017/hash/6449f44a102fde848669bdd9eb6b76fa-Abstract.html">https://papers.nips.cc/paper_files/paper/2017/hash/6449f44a102fde848669bdd9eb6b76fa-Abstract.html</ext-link></comment></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Friedman</surname><given-names>JH</given-names> </name></person-group><article-title>Greedy function approximation: A gradient boosting machine</article-title><source>Ann Statist</source><year>2001</year><volume>29</volume><issue>5</issue><fpage>1189</fpage><lpage>1232</lpage><pub-id pub-id-type="doi">10.1214/aos/1013203451</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Snoek</surname><given-names>J</given-names> </name><name name-style="western"><surname>Larochelle</surname><given-names>H</given-names> </name><name name-style="western"><surname>Adams</surname><given-names>RP</given-names> </name></person-group><article-title>Practical bayesian optimization of machine learning algorithms [abstract]</article-title><year>2012</year><conf-name>Advances in neural information processing systems</conf-name><conf-date>Dec 3-6, 2012</conf-date><conf-loc>Lake Tahoe, Nevada</conf-loc><comment><ext-link ext-link-type="uri" xlink:href="https://papers.nips.cc/paper_files/paper/2012/hash/05311655a15b75fab86956663e1819cd-Abstract.html">https://papers.nips.cc/paper_files/paper/2012/hash/05311655a15b75fab86956663e1819cd-Abstract.html</ext-link></comment></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lundberg</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SI</given-names> </name></person-group><article-title>A unified approach to interpreting model predictions</article-title><year>2017</year><access-date>2025-03-31</access-date><conf-name>31st Conference on Neural Information Processing Systems (NIPS 2017)</conf-name><conf-date>Dec 4-9, 2017</conf-date><conf-loc>Long Beach, CA</conf-loc><comment><ext-link ext-link-type="uri" xlink:href="https://proceedings.neurips.cc/paper_files/paper/2017/file/8a20a8621978632d76c43dfd28b67767-Paper.pdf">https://proceedings.neurips.cc/paper_files/paper/2017/file/8a20a8621978632d76c43dfd28b67767-Paper.pdf</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lachin</surname><given-names>JM</given-names> </name></person-group><article-title>Fallacies of last observation carried forward analyses</article-title><source>Clin Trials</source><year>2016</year><month>04</month><volume>13</volume><issue>2</issue><fpage>161</fpage><lpage>168</lpage><pub-id pub-id-type="doi">10.1177/1740774515602688</pub-id><pub-id pub-id-type="medline">26400875</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Escudier</surname><given-names>B</given-names> </name><name name-style="western"><surname>Eisen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Stadler</surname><given-names>WM</given-names> </name><etal/></person-group><article-title>Sorafenib in advanced clear-cell renal-cell carcinoma</article-title><source>N Engl J Med</source><year>2007</year><month>01</month><day>11</day><volume>356</volume><issue>2</issue><fpage>125</fpage><lpage>134</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa060655</pub-id><pub-id pub-id-type="medline">17215530</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Motzer</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Hutson</surname><given-names>TE</given-names> </name><name name-style="western"><surname>Tomczak</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Overall survival and updated results for sunitinib compared with interferon alfa in patients with metastatic renal cell carcinoma</article-title><source>J Clin Oncol</source><year>2009</year><month>08</month><day>1</day><volume>27</volume><issue>22</issue><fpage>3584</fpage><lpage>3590</lpage><pub-id pub-id-type="doi">10.1200/JCO.2008.20.1293</pub-id><pub-id pub-id-type="medline">19487381</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schmidinger</surname><given-names>M</given-names> </name><name name-style="western"><surname>Vogl</surname><given-names>UM</given-names> </name><name name-style="western"><surname>Bojic</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Hypothyroidism in patients with renal cell carcinoma: blessing or curse?</article-title><source>Cancer</source><year>2011</year><month>02</month><day>1</day><volume>117</volume><issue>3</issue><fpage>534</fpage><lpage>544</lpage><pub-id pub-id-type="doi">10.1002/cncr.25422</pub-id><pub-id pub-id-type="medline">20845482</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Silva</surname><given-names>NC da</given-names> </name><name name-style="western"><surname>Albertini</surname><given-names>MK</given-names> </name><name name-style="western"><surname>Backes</surname><given-names>AR</given-names> </name><name name-style="western"><surname>Pena</surname><given-names>G das G</given-names> </name></person-group><article-title>Machine learning for hospital readmission prediction in pediatric population</article-title><source>Comput Methods Programs Biomed</source><year>2024</year><month>02</month><volume>244</volume><fpage>107980</fpage><pub-id pub-id-type="doi">10.1016/j.cmpb.2023.107980</pub-id><pub-id pub-id-type="medline">38134648</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Duan</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Qiu</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Machine learning-based prediction model for distant metastasis of breast cancer</article-title><source>Comput Biol Med</source><year>2024</year><month>02</month><volume>169</volume><fpage>107943</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2024.107943</pub-id><pub-id pub-id-type="medline">38211382</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>May</surname><given-names>SB</given-names> </name><name name-style="western"><surname>Giordano</surname><given-names>TP</given-names> </name><name name-style="western"><surname>Gottlieb</surname><given-names>A</given-names> </name></person-group><article-title>Generalizable pipeline for constructing HIV risk prediction models across electronic health record systems</article-title><source>J Am Med Inform Assoc</source><year>2024</year><month>02</month><day>16</day><volume>31</volume><issue>3</issue><fpage>666</fpage><lpage>673</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocad217</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saito</surname><given-names>T</given-names> </name><name name-style="western"><surname>Rehmsmeier</surname><given-names>M</given-names> </name></person-group><article-title>The precision-recall plot is more informative than the ROC plot when evaluating binary classifiers on imbalanced datasets</article-title><source>PLoS ONE</source><year>2015</year><volume>10</volume><issue>3</issue><fpage>e0118432</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0118432</pub-id><pub-id pub-id-type="medline">25738806</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lipton</surname><given-names>ZC</given-names> </name><name name-style="western"><surname>Elkan</surname><given-names>C</given-names> </name><name name-style="western"><surname>Naryanaswamy</surname><given-names>B</given-names> </name></person-group><article-title>Optimal thresholding of classifiers to maximize F1 measure</article-title><source>Mach Learn Knowl Discov Databases</source><year>2014</year><volume>8725</volume><fpage>225</fpage><lpage>239</lpage><pub-id pub-id-type="doi">10.1007/978-3-662-44851-9_15</pub-id><pub-id pub-id-type="medline">26023687</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rizos</surname><given-names>CV</given-names> </name><name name-style="western"><surname>Elisaf</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Liberopoulos</surname><given-names>EN</given-names> </name></person-group><article-title>Effects of thyroid dysfunction on lipid profile</article-title><source>Open Cardiovasc Med J</source><year>2011</year><volume>5</volume><fpage>76</fpage><lpage>84</lpage><pub-id pub-id-type="doi">10.2174/1874192401105010076</pub-id><pub-id pub-id-type="medline">21660244</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Porta</surname><given-names>C</given-names> </name><name name-style="western"><surname>Gore</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Rini</surname><given-names>BI</given-names> </name><etal/></person-group><article-title>Long-term safety of sunitinib in metastatic renal cell carcinoma</article-title><source>Eur Urol</source><year>2016</year><month>02</month><volume>69</volume><issue>2</issue><fpage>345</fpage><lpage>351</lpage><pub-id pub-id-type="doi">10.1016/j.eururo.2015.07.006</pub-id><pub-id pub-id-type="medline">26215605</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sutton</surname><given-names>RT</given-names> </name><name name-style="western"><surname>Pincock</surname><given-names>D</given-names> </name><name name-style="western"><surname>Baumgart</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Sadowski</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Fedorak</surname><given-names>RN</given-names> </name><name name-style="western"><surname>Kroeker</surname><given-names>KI</given-names> </name></person-group><article-title>An overview of clinical decision support systems: benefits, risks, and strategies for success</article-title><source>NPJ Digit Med</source><year>2020</year><volume>3</volume><fpage>17</fpage><pub-id pub-id-type="doi">10.1038/s41746-020-0221-y</pub-id><pub-id pub-id-type="medline">32047862</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Flynn</surname><given-names>A</given-names> </name></person-group><article-title>Using artificial intelligence in health-system pharmacy practice: finding new patterns that matter</article-title><source>Am J Health Syst Pharm</source><year>2019</year><month>04</month><day>17</day><volume>76</volume><issue>9</issue><fpage>622</fpage><lpage>627</lpage><pub-id pub-id-type="doi">10.1093/ajhp/zxz018</pub-id><pub-id pub-id-type="medline">31361834</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Time-series data collection.</p><media xlink:href="formative_v9i1e67767_app1.docx" xlink:title="DOCX File, 364 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Codebook and missing rates of variables.</p><media xlink:href="formative_v9i1e67767_app2.docx" xlink:title="DOCX File, 24 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Hyperparameters tuning.</p><media xlink:href="formative_v9i1e67767_app3.docx" xlink:title="DOCX File, 21 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Pseudocodes of the model developing process.</p><media xlink:href="formative_v9i1e67767_app4.docx" xlink:title="DOCX File, 18 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Patient selection flowchart.</p><media xlink:href="formative_v9i1e67767_app5.docx" xlink:title="DOCX File, 141 KB"/></supplementary-material><supplementary-material id="app6"><label>Multimedia Appendix 6</label><p>Patient characteristics and multivariate analysis.</p><media xlink:href="formative_v9i1e67767_app6.docx" xlink:title="DOCX File, 23 KB"/></supplementary-material><supplementary-material id="app7"><label>Multimedia Appendix 7</label><p>Feature selection with recursive feature elimination.</p><media xlink:href="formative_v9i1e67767_app7.docx" xlink:title="DOCX File, 21 KB"/></supplementary-material><supplementary-material id="app8"><label>Multimedia Appendix 8</label><p>Model performance of five-fold cross-validation.</p><media xlink:href="formative_v9i1e67767_app8.docx" xlink:title="DOCX File, 24 KB"/></supplementary-material></app-group></back></article>