<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Diabetes</journal-id><journal-id journal-id-type="publisher-id">diabetes</journal-id><journal-id journal-id-type="index">23</journal-id><journal-title>JMIR Diabetes</journal-title><abbrev-journal-title>JMIR Diabetes</abbrev-journal-title><issn pub-type="epub">2371-4379</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v11i1e82635</article-id><article-id pub-id-type="doi">10.2196/82635</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Predictors of Glycemic Response to Sulfonylurea Therapy in Type 2 Diabetes Over 12 Months: Comparative Analysis of Linear Regression and Machine Learning Models</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Garg</surname><given-names>Shilpa</given-names></name><degrees>BTech</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kitchen</surname><given-names>Robert</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gupta</surname><given-names>Ramneek</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Trucco</surname><given-names>Emanuele</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Pearson</surname><given-names>Ewan</given-names></name><degrees>MA, MB, BChir, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Diabetes Endocrinology and Reproductive Biology, School of Medicine, University of Dundee</institution><addr-line>Nethergate, Dundee</addr-line><addr-line>Dundee</addr-line><country>United Kingdom</country></aff><aff id="aff2"><institution>Novo Nordisk</institution><addr-line>Oxford</addr-line><country>United Kingdom</country></aff><aff id="aff3"><institution>Disease Intelligence Pte Ltd</institution><addr-line>10 Anson Road</addr-line><addr-line>Singapore</addr-line><country>Singapore</country></aff><aff id="aff4"><institution>Computing Department, School of Science and Engineering, University of Dundee</institution><addr-line>Dundee</addr-line><country>United Kingdom</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Zhao</surname><given-names>Ruxing</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Low</surname><given-names>Jonathan</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Yagcioglu</surname><given-names>Mert</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Taiwo</surname><given-names>Peter</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Shilpa Garg, BTech, Diabetes Endocrinology and Reproductive Biology, School of Medicine, University of Dundee, Nethergate, Dundee, Dundee, DD14HN, United Kingdom, 44 7443787733; <email>shilpa12370@gmail.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>6</day><month>2</month><year>2026</year></pub-date><volume>11</volume><elocation-id>e82635</elocation-id><history><date date-type="received"><day>19</day><month>08</month><year>2025</year></date><date date-type="rev-recd"><day>08</day><month>12</month><year>2025</year></date><date date-type="accepted"><day>11</day><month>12</month><year>2025</year></date></history><copyright-statement>&#x00A9; Shilpa Garg, Robert Kitchen, Ramneek Gupta, Emanuele Trucco, Ewan Pearson. Originally published in JMIR Diabetes (<ext-link ext-link-type="uri" xlink:href="https://diabetes.jmir.org">https://diabetes.jmir.org</ext-link>), 6.2.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Diabetes, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://diabetes.jmir.org/">https://diabetes.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://diabetes.jmir.org/2026/1/e82635"/><abstract><sec><title>Background</title><p>Sulfonylureas are commonly prescribed for managing type 2 diabetes, yet treatment responses vary significantly among individuals. Although advances in machine learning (ML) may enhance predictive capabilities compared to traditional statistical methods, their practical utility in real-world clinical environments remains uncertain.</p></sec><sec><title>Objective</title><p>This study aimed to evaluate and compare the predictive performance of linear regression models with several ML approaches for predicting glycemic response to sulfonylurea therapy using routine clinical data, and to assess model interpretability using Shapley Additive Explanations (SHAP) analysis as a secondary analysis.</p></sec><sec sec-type="methods"><title>Methods</title><p>A cohort of 7557 individuals with type 2 diabetes who initiated sulfonylurea therapy was analyzed, with all patients followed for 1 year. Linear and logistic regression models were used as baseline comparisons. A range of ML models was trained to predict the continuous change in hemoglobin A<sub>1c</sub> (HbA<sub>1c</sub>) levels and the achievement of HbA<sub>1c</sub> &#x003C;58 mmol/mol at follow-up. These models included random forest, extreme gradient boosting, support vector machines, a conventional feedforward neural network, and Bayesian additive regression trees. Model performance was assessed using standard metrics including <italic>R</italic>&#x00B2; and root mean squared error for regression tasks and area under the receiver operating characteristic for classification. In a subset of 2361 patients, nonfasting connecting peptide (C-peptide) was analyzed as a proxy for &#x03B2;-cell function. SHAP analysis was performed to identify and compare key predictors driving model performance across methods.</p></sec><sec sec-type="results"><title>Results</title><p>All models exhibited similar performance, with no significant advantages of ML techniques over linear regression. For continuous outcomes, Bayesian additive regression trees demonstrated the highest <italic>R</italic>&#x00B2; (0.445) and lowest root mean squared error (0.105), though the differences among models were minimal. For the binary outcome, extreme gradient boosting achieved the highest area under the receiver operating characteristic curve (0.712), with CIs overlapping those of other models. Across all models, baseline HbA<sub>1c</sub> was consistently the primary predictor, explaining the majority of the variance. SHAP analyses confirmed that baseline HbA<sub>1c</sub>, age, BMI, and sex were the most influential predictors. Sensitivity analyses and hyperparameter tuning did not significantly improve model performance. In the C-peptide subset, higher C-peptide levels were associated with greater glycemic improvement (<italic>&#x03B2;</italic>=&#x2212;3.2 mmol/mol per log(C-peptide); <italic>P</italic>&#x003C;.001).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>In this large, population-based cohort, ML models did not outperform traditional regression for predicting glycemic response to sulfonylureas. These findings suggest that limited gains from ML likely reflect an absence of strong nonlinear or high-order interactions in routine clinical data and that available features may not capture sufficient biological heterogeneity for complex models to confer added benefit. The inclusion of a C-peptide subset provides additional mechanistic insight by linking preserved &#x03B2;-cell function with treatment response.</p></sec></abstract><kwd-group><kwd>drug response</kwd><kwd>glycated hemoglobin</kwd><kwd>linear regression</kwd><kwd>machine learning models</kwd><kwd>treatment response prediction</kwd><kwd>type 2 diabetes</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Sulfonylureas are among the most commonly prescribed classes of glucose-lowering medications for individuals with type 2 diabetes. Their cost-effectiveness and accessibility make them particularly valuable in resource-constrained settings [<xref ref-type="bibr" rid="ref1">1</xref>]. However, significant variability exists in glycemic responses among individuals. This variability is influenced by various clinical and biological factors, such as age, kidney function, and genetic predispositions [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Identifying predictors of treatment response is essential for advancing precision medicine approaches and minimizing trial-and-error prescribing practices [<xref ref-type="bibr" rid="ref4">4</xref>].</p><p>Because sulfonylureas lower glucose primarily by stimulating insulin secretion from pancreatic &#x03B2;-cells, the degree of preserved &#x03B2;-cell function, often estimated by circulating connecting peptide (C-peptide) [<xref ref-type="bibr" rid="ref5">5</xref>], may influence treatment response. However, such markers are rarely available in real-world datasets and are not routinely included in prediction studies.</p><p>Machine learning (ML) methods have shown promise in predicting treatment responses more accurately than traditional regression models, particularly due to their ability to handle complex, nonlinear interactions between variables without requiring prespecified assumptions [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. In this context, ML approaches can capture subtle, multidimensional relationships that may be overlooked by traditional models, efficiently process large-scale longitudinal data, and generate data-driven insights that inform treatment selection. ML also offers better integration of diverse data types and improved interpretability through explainable AI, increasing clinical applicability [<xref ref-type="bibr" rid="ref8">8</xref>]. Despite this promise, relatively few studies have focused on modeling glycemic response in diabetes using real-world data [<xref ref-type="bibr" rid="ref9">9</xref>]. This gap in research presents a significant opportunity for further investigation.</p><p>Here, we use sulfonylurea response as an exemplar of diabetes drug response, due to its widespread use and the availability of clinical data. We evaluate and compare the efficacy of 5 ML models, including random forest, support vector machines, extreme gradient boosting (XGBoost), a conventional feedforward neural network (NN), and Bayesian additive regression trees (BART), in predicting the glycemic response to sulfonylureas in patients with type 2 diabetes. These models are compared with standard linear and logistic regression for continuous (change in hemoglobin A<sub>1c</sub> [HbA<sub>1c</sub>]) and binary (achievement of HbA<sub>1c</sub> &#x003C;58 mmol/mol) outcomes. Analyses were conducted using a large real-world cohort from the GoDARTS (Genetics of Diabetes Audit and Research in Tayside Scotland) study, including a biologically informative subset with C-peptide measurements to assess the contribution of &#x03B2;-cell function.</p><p>In addition to comparing predictive performance across models, we conducted a secondary analysis to examine feature contributions using Shapley Additive Explanations (SHAP) [<xref ref-type="bibr" rid="ref10">10</xref>]. This analysis allowed us to determine whether ML-derived feature importance aligns with the predictors identified by traditional regression approaches, providing insight into clinical interpretability and the practical utility of ML for informing treatment choice.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Population</title><p>The data were obtained from the GoDARTS [<xref ref-type="bibr" rid="ref11">11</xref>]. This population-based cohort links prescription, clinical, and laboratory records for individuals with diabetes in Tayside and Fife. The inclusion criteria included patients with type 2 diabetes who initiated sulfonylurea therapy (either as monotherapy or in combination), had a baseline HbA<sub>1c</sub> measurement (defined as the closest value within 183 days before to 7 days after treatment initiation), and a follow-up HbA<sub>1c</sub> measurement after a 1-year period. The 183-day window was selected to balance data availability and clinical relevance. For this analysis, only 2 HbA<sub>1c</sub> values per patient were used, 1 at baseline and 1 at follow-up, in line with the model&#x2019;s aim of predicting glycemic response from initial clinical features.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>Data provision and linkage were carried out by the University of Dundee Health Informatics Centre, with analysis of anonymized data performed in an ISO27001 and Scottish Government&#x2013;accredited secure safe haven. Health Informatics Centre standard operating procedures were reviewed and approved by the National Health Service (NHS) East of Scotland Research Ethics Service (22/ES/0034), and consent for this study was obtained from the NHS Fife Caldicott Guardian. Under these approvals, secondary analysis of anonymised routine healthcare data does not require additional participant consent or compensation.</p></sec><sec id="s2-3"><title>Baseline Predictor Variables</title><p>Baseline clinical features included age, sex, HbA<sub>1c</sub>, BMI, total cholesterol, high-density lipoprotein (HDL) cholesterol, smoking status, systolic blood pressure, alkaline phosphatase, alanine transaminase, serum potassium, serum creatinine, bilirubin, and albumin. These variables were selected based on their availability in routine care and their known or suspected relevance to glycemic outcomes [<xref ref-type="bibr" rid="ref12">12</xref>]. Except for baseline HbA<sub>1c</sub> (as defined above), all measurements were defined as the closest recorded value within 2 years before to 90 days after sulfonylurea initiation.</p><p>To estimate average daily sulfonylurea dose, prescription records were used to extract drug strength and quantity dispensed. Five sulfonylureas were included: gliclazide, glipizide, glimepiride, glibenclamide, and tolbutamide. Each prescription&#x2019;s dose was standardized by dividing the prescribed dose by the drug&#x2019;s maximum recommended daily dose (as per the British National Formulary). This yielded a standardized dose unit, which was then multiplied by the number of tablets prescribed per prescription to calculate the total standardized dose. For each patient, the total dose was summed across all prescriptions, excluding the last one, and divided by treatment duration to derive the average daily dose. This dose was then categorized into low, medium, and high using quartiles.</p></sec><sec id="s2-4"><title>Outcome Definitions</title><p>The primary continuous outcome was defined as the change in glycated hemoglobin (HbA<sub>1c</sub>), measured in millimoles per mole, from baseline (at the time of sulfonylurea initiation) to the follow-up measurement closest to 12 months, within a window of 6-15 months.</p><p>The binary outcome was defined as whether a patient achieved a follow-up HbA<sub>1c</sub> level below 58 mmol/mol.</p></sec><sec id="s2-5"><title>Data Preparation</title><p>To ensure consistency and compatibility with ML models, several preprocessing steps were applied. Continuous variables with skewed distributions underwent log transformation to approximate a normal distribution [<xref ref-type="bibr" rid="ref13">13</xref>], enhancing model stability and reducing the influence of extreme values. Following this, all continuous predictors, including laboratory test results and physiological measurements, were scaled to a range between 0 and 1 using min-max normalization [<xref ref-type="bibr" rid="ref14">14</xref>]. This rescaling placed variables on a uniform scale, which is particularly important for algorithms like NNs that are sensitive to variable magnitudes. Categorical variables (eg, sex, smoking status, treatment group, average daily dose) were converted using one-hot encoding to make them compatible with model inputs.</p></sec><sec id="s2-6"><title>Missing Data Imputation and Collinearity Assessment</title><p>Patients missing either baseline or follow-up HbA<sub>1c</sub> measurements were excluded. For remaining clinical predictors, missingness was below 10% and not clustered within specific individuals. Missing values were imputed using multiple imputation by chained equations [<xref ref-type="bibr" rid="ref15">15</xref>] implemented in R (mice v3.18.0). Five imputed datasets were generated with 50 iterations each, using predictive mean matching for continuous variables. Full details of the imputation model are provided in Section 1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Convergence was assessed using the mean and variance of each variable across iterations and comparing distributions of observed and imputed values. Analyses were performed on pooled estimates derived using Rubin&#x2019;s rules [<xref ref-type="bibr" rid="ref16">16</xref>].</p><p>Collinearity among predictors was evaluated using variance inflation factors (VIFs) [<xref ref-type="bibr" rid="ref17">17</xref>]. Predictors with VIF values greater than 5 were reviewed for redundancy. In our final models, VIFs ranged from 1.06 to 1.5, indicating no meaningful multicollinearity. As a sensitivity check, strongly correlated clinical variables (<italic>r</italic> &#x003E; 0.8) were examined, and when overlap occurred (eg, estimated glomerular filtration rate vs serum creatinine), the variable more routinely and reliably measured in clinical practice (serum creatinine) was retained.</p></sec><sec id="s2-7"><title>Statistical Analysis: Baseline Models</title><p>Initial statistical analyses were conducted using linear regression [<xref ref-type="bibr" rid="ref18">18</xref>] for the continuous outcome and logistic regression for the binary outcome. These models identified baseline associations between clinical predictors and glycemic response to sulfonylurea therapy. Logistic regression estimated the probability of achieving an HbA<sub>1c</sub> &#x003C;58 mmol/mol. Of the 7557 individuals included, 3818 achieved the target, and 3739 did not.</p></sec><sec id="s2-8"><title>Residualization of Baseline HbA<sub>1c</sub></title><p>To disentangle treatment response from baseline glycemia, change in HbA<sub>1c</sub> was regressed on baseline HbA<sub>1c</sub>. The residuals from this model were used as outcomes for ML analyses. This allowed the identification of predictors influencing glycemic response independent of baseline HbA<sub>1c</sub> levels [<xref ref-type="bibr" rid="ref19">19</xref>].</p></sec><sec id="s2-9"><title>ML Models</title><p>Five ML models were implemented, reflecting diverse algorithmic strategies:</p><list list-type="order"><list-item><p>Random forest: An ensemble method that constructs multiple decision trees on bootstrapped data and aggregates their predictions [<xref ref-type="bibr" rid="ref20">20</xref>].</p></list-item><list-item><p>Support vector machines: A kernel-based classifier that establishes an optimal separating hyperplane [<xref ref-type="bibr" rid="ref21">21</xref>].</p></list-item><list-item><p>XGBoost: A boosting technique that sequentially builds trees to minimize residual error [<xref ref-type="bibr" rid="ref22">22</xref>].</p></list-item><list-item><p>NNs: A conventional feedforward NN (multilayer perceptron) trained using resilient backpropagation. Comprising layers of interconnected neurons, NNs excel at modeling complex relationships and require larger datasets and regularization to mitigate overfitting [<xref ref-type="bibr" rid="ref23">23</xref>].</p></list-item><list-item><p>BARTs: A Bayesian ensemble method that combines multiple regression trees and estimates uncertainty in predictions [<xref ref-type="bibr" rid="ref24">24</xref>]. BART is noted for strong performance in clinical applications [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref27">27</xref>].</p></list-item></list></sec><sec id="s2-10"><title>Model Implementation</title><p>For model development, a 2-stage validation framework combining cross-validation and a held-out test set was used. The data were randomly split into a 70% training set and a 30% held-out test set. Within the training set, 10-fold cross-validation [<xref ref-type="bibr" rid="ref18">18</xref>] was used for hyperparameter tuning and model selection to enhance model stability and reduce overfitting. Final performance was evaluated on the held-out test set, which remained unseen during training.</p><p>All analyses were performed in R (version 4.3.0). A detailed description of the packages and functions used for each model is presented in Section 2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, and XGBoost and NN hyperparameters are provided in Sections 3 and 4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, respectively. All preprocessing and modeling code is publicly available on GitHub [<xref ref-type="bibr" rid="ref28">28</xref>].</p></sec><sec id="s2-11"><title>Feature Importance</title><p>To identify the clinical features most strongly influencing model predictions, we assessed feature importance using SHAP values along with the built-in variable importance metrics from each model. SHAP values quantify the contribution of individual predictors to model outputs, enabling transparent, model-agnostic interpretation. Although SHAP can be applied to multiple model types, our results focused on the XGBoost model because it showed optimal predictive performance. SHAP summary plots were generated to visualize the magnitude and direction of feature effects, ranking predictors by their mean absolute SHAP values. Comparative plots across models were generated to visualize predictor impact on treatment response. This unified approach supported consistent evaluation of feature relevance across models and enhanced clinical interpretability.</p></sec><sec id="s2-12"><title>Performance Evaluation</title><p>Model performance was assessed separately for the continuous and binary outcomes. For the continuous outcome, evaluation metrics included root mean squared error (RMSE), mean absolute error, and the coefficient of determination (<italic>R</italic>&#x00B2;), which indicates the proportion of variance in the outcome explained by the model [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>].</p><p>For the binary outcome, performance was evaluated using standard classification metrics: area under the receiver operating characteristic curve (AUC), accuracy, sensitivity (recall), and specificity [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. In the linear regression models, regression coefficients were interpreted to assess the direction and magnitude of each predictor&#x2019;s association with the outcome, while <italic>P</italic> values indicated the statistical significance of these associations. An <italic>R</italic>&#x00B2; value provided an overall measure of model fit, and a <italic>P</italic> value below .05 was considered statistically significant.</p><p>To evaluate differences in performance across models, a resampling-based approach was used to compare their predictive metrics [<xref ref-type="bibr" rid="ref33">33</xref>]. Pairwise comparisons were conducted to assess whether any model significantly outperformed the others.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Cohort Characteristics</title><p>The study included 7557 individuals with type 2 diabetes who initiated sulfonylurea therapy and had both baseline and follow-up HbA<sub>1c</sub> values available. The cohort had a mean age of 63.7 (SD 11.8) years, and 57.9% (n=4377) were male. The mean baseline HbA<sub>1c</sub> was 76.5 (SD 16.7) mmol/mol (<xref ref-type="table" rid="table1">Table 1</xref>).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Baseline demographic and clinical characteristics of the study population.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Clinical variable</td><td align="left" valign="bottom">Sulfonylurea cohort (N=7557)</td></tr></thead><tbody><tr><td align="left" valign="top">Age at therapy initiation (y), mean (SD)</td><td align="left" valign="top">63.7 (11.8)</td></tr><tr><td align="left" valign="top" colspan="2">Sex, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">4377 (57.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">3180 (42.1)</td></tr><tr><td align="left" valign="top" colspan="2">Average daily dose, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Low</td><td align="left" valign="top">1844 (24.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Medium</td><td align="left" valign="top">3822 (50.6)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>High</td><td align="left" valign="top">1891 (25)</td></tr><tr><td align="left" valign="top">Duration of diabetes (y), mean (SD)</td><td align="left" valign="top">4.96 (4.49)</td></tr><tr><td align="left" valign="top" colspan="2">Duration of diabetes, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0&#x2010;1 years</td><td align="left" valign="top">1416 (18.7)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1&#x2010;5 years</td><td align="left" valign="top">3099 (41)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003E;5 years</td><td align="left" valign="top">3042 (40.3)</td></tr><tr><td align="left" valign="top">Time of treatment (mo), mean (SD)</td><td align="left" valign="top">11.4 (2.2)</td></tr><tr><td align="left" valign="top">Time from baseline HbA<sub>1c</sub><sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> measurement to treatment start (d), mean (SD)</td><td align="left" valign="top">21.3 (29.1)</td></tr><tr><td align="left" valign="top">Year of drug start, mean (SD)</td><td align="left" valign="top">2010 (6.12)</td></tr><tr><td align="left" valign="top">BMI (kg/m<sup>2</sup>), mean (SD)</td><td align="left" valign="top">31.3 (6.3)</td></tr><tr><td align="left" valign="top">Total cholesterol (mmol/L), mean (SD)</td><td align="left" valign="top">4.5 (1.2)</td></tr><tr><td align="left" valign="top">HDL<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> cholesterol (mmol/L), mean (SD)</td><td align="left" valign="top">1.2 (0.3)</td></tr><tr><td align="left" valign="top">Serum creatinine (&#x00B5;mol/L), mean (SD)</td><td align="left" valign="top">80.3 (27.4)</td></tr><tr><td align="left" valign="top">Albumin (g/L), mean (SD)</td><td align="left" valign="top">42.2 (4.0)</td></tr><tr><td align="left" valign="top">Bilirubin (&#x00B5;mol/L), mean (SD)</td><td align="left" valign="top">9.9 (5.2)</td></tr><tr><td align="left" valign="top">Alkaline phosphatase (U/L), mean (SD)</td><td align="left" valign="top">89.5 (42.1)</td></tr><tr><td align="left" valign="top">ALT/SGPT<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup> (U/L), mean (SD)</td><td align="left" valign="top">34.2 (24.4)</td></tr><tr><td align="left" valign="top">Potassium (mmol/L), mean (SD)</td><td align="left" valign="top">4.4 (0.4)</td></tr><tr><td align="left" valign="top">Systolic blood pressure, mean (SD)</td><td align="left" valign="top">137 (17.4)</td></tr><tr><td align="left" valign="top" colspan="2">Smoking status, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ever smoked&#x2014;yes</td><td align="left" valign="top">5628 (74.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ever smoked&#x2014;no</td><td align="left" valign="top">1870 (24.7)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ever smoked&#x2014;unknown</td><td align="left" valign="top">59 (0.8)</td></tr><tr><td align="left" valign="top" colspan="2">Therapy group, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mono</td><td align="left" valign="top">2508 (33.2)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dual</td><td align="left" valign="top">4251 (56.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Triple</td><td align="left" valign="top">798 (10.6)</td></tr><tr><td align="left" valign="top" colspan="2">Index of multiple deprivation quintile, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1 (most deprived)</td><td align="left" valign="top">1583 (16.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">1609 (21.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">1497 (19.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">1396 (18.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>5 (least deprived)</td><td align="left" valign="top">1246 (16.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unknown</td><td align="left" valign="top">226 (3.0)</td></tr><tr><td align="left" valign="top" colspan="2">Ethnicity, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>White</td><td align="left" valign="top">5696 (75.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Others/mixed</td><td align="left" valign="top">259 (3.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Missing</td><td align="left" valign="top">1602 (21.2)</td></tr><tr><td align="left" valign="top" colspan="2">Region, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Tayside</td><td align="left" valign="top">5965 (78.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Fife</td><td align="left" valign="top">1592 (21.1)</td></tr><tr><td align="left" valign="top">Baseline HbA<sub>1c</sub> (mmol/mol), mean (SD)</td><td align="left" valign="top">76.5 (16.7)</td></tr><tr><td align="left" valign="top">HbA<sub>1c</sub> outcome (mmol/mol) (treatment HbA<sub>1c</sub>), mean (SD)</td><td align="left" valign="top">61.1 (15.4)</td></tr><tr><td align="left" valign="top">HbA<sub>1c</sub> response (change from baseline; mmol/mol), mean (SD)</td><td align="left" valign="top">&#x2013;15.4 (18)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>HbA<sub>1c</sub>: hemoglobin A<sub>1c</sub>.</p></fn><fn id="table1fn2"><p><sup>b</sup>HDL: high-density lipoprotein.</p></fn><fn id="table1fn3"><p><sup>c</sup>ALT/SGPT: alanine aminotransferase/serum glutamate pyruvate transaminase. </p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Associations Between Clinical Covariates and Treatment Response</title><p>A linear regression model was fit to assess the relationship between clinical variables and the change in HbA<sub>1c</sub>, defined as the difference between baseline HbA<sub>1c</sub> and follow-up values (ie, change=treatment&#x2013;baseline HbA<sub>1c</sub>). A negative change in HbA<sub>1c</sub> indicates a better treatment response to sulfonylureas, while a positive change signifies a worse response. No feature scaling (min-max normalization) was applied to the variables in this model. The model demonstrated satisfactory fit, with an <italic>R</italic>&#x00B2; value of 0.41 and a significant F-statistic (222.2; <italic>P&#x003C;</italic>.001).</p><p>The linear regression analysis identified several clinical variables significantly associated with the change in HbA<sub>1c</sub> among individuals treated with sulfonylureas. Older age and higher baseline HbA<sub>1c</sub> were associated with greater HbA<sub>1c</sub> reductions (negative coefficients), indicating more favorable responses. In contrast, a higher BMI was associated with smaller reductions, suggesting that individuals with higher BMI may struggle to achieve desired glycemic control. Additionally, sex differences indicated that male participants demonstrated slightly better response to sulfonylurea treatment than female participants.</p><p>These associations are illustrated in <xref ref-type="fig" rid="figure1">Figure 1</xref>, which presents a forest plot of the linear regression coefficients and CIs, highlighting the magnitude and direction of each predictor&#x2019;s effect on HbA<sub>1c</sub> change.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Forest plot showing regression coefficients and 95% CIs for predictors of change in hemoglobin A<sub>1c</sub> (HbA<sub>1c</sub>). Points represent model estimates and horizontal lines indicate 95% CIs. ALT: alanine aminotransferase; SGPT: alanine aminotransferase/serum glutamate pyruvate transaminase; T2D: type 2 diabetes. *<italic>P</italic>&#x003C;.05; **<italic>P</italic>&#x003C;.01; ***<italic>P</italic>&#x003C;.001.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="diabetes_v11i1e82635_fig01.png"/></fig></sec><sec id="s3-3"><title>C-Peptide Analysis</title><p>In a subset of 2361 individuals with nonfasting C-peptide data, higher C-peptide levels were strongly associated with greater reductions in HbA<sub>1c</sub> at 12 months (linear regression: <italic>&#x03B2;</italic>=&#x2212;3.2 mmol/mol per log(C-peptide); <italic>P</italic>&#x003C;.001). This finding suggests that preserved endogenous insulin secretion contributes to more favorable treatment outcomes.</p></sec><sec id="s3-4"><title>ML Model Performance for Continuous Outcome</title><p>For the continuous outcome of predicting changes in HbA<sub>1c</sub>, several models were evaluated. The results indicate that the BART model exhibited the lowest RMSE of 0.105 (21%) and the lowest mean absolute error of 0.079 (16.1%), highlighting its effective performance in estimating continuous changes. XGBoost and NNs also performed comparably, with RMSE values of 0.106.</p><p>On the original HbA<sub>1c</sub> scale, this corresponds to an approximate prediction error of 13.8 mmol/mol, comparable to the residual standard error from the linear regression model. Thus, the clinical prediction error was approximately ~14 mmol/mol.</p><p>However, the differences in RMSE and <italic>R</italic><sup>2</sup> across all models were minimal, indicating that while BART performed slightly better, the performance of all models was relatively comparable (<xref ref-type="table" rid="table2">Table 2</xref>). The similar <italic>R</italic><sup>2</sup> and RMSE values further suggest that no single model stands out significantly.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Regression model performance metrics (root mean squared error [RMSE], mean absolute error [MAE], and <italic>R</italic>&#x00B2;) for continuous outcome prediction across all 6 models<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Models</td><td align="left" valign="bottom">RMSE</td><td align="left" valign="bottom">MAE</td><td align="left" valign="bottom"><italic>R</italic><sup>2</sup></td></tr></thead><tbody><tr><td align="left" valign="top">Linear regression</td><td align="left" valign="top">0.106</td><td align="left" valign="top">0.08</td><td align="left" valign="top">0.434</td></tr><tr><td align="left" valign="top">RF<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="top">0.108</td><td align="left" valign="top">0.082</td><td align="left" valign="top">0.424</td></tr><tr><td align="left" valign="top">SVM<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="top">0.106</td><td align="left" valign="top">0.079</td><td align="left" valign="top">0.438</td></tr><tr><td align="left" valign="top">XGBoost<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup></td><td align="left" valign="top">0.106</td><td align="left" valign="top">0.08</td><td align="left" valign="top">0.433</td></tr><tr><td align="left" valign="top">NN<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup></td><td align="left" valign="top">0.106</td><td align="left" valign="top">0.081</td><td align="left" valign="top">0.427</td></tr><tr><td align="left" valign="top">BART<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup></td><td align="left" valign="top">0.105</td><td align="left" valign="top">0.079</td><td align="left" valign="top">0.445</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>RMSE is shown as the normalized values.</p></fn><fn id="table2fn2"><p><sup>b</sup>RF: random forest.</p></fn><fn id="table2fn3"><p><sup>c</sup>SVM: support vector machine.</p></fn><fn id="table2fn4"><p><sup>d</sup>XGBoost: extreme gradient boosting.</p></fn><fn id="table2fn5"><p><sup>e</sup>NN: neural network.</p></fn><fn id="table2fn6"><p><sup>f</sup>BART: Bayesian additive regression trees.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-5"><title>Statistical Comparison of Model Performance</title><p>In addition to reporting standard performance metrics, statistical comparisons were performed using resampling-based techniques. Pairwise comparisons of RMSE and <italic>R</italic>&#x00B2; values across all models showed no statistically significant differences in performance; all ML models, including the linear regression baseline, performed similarly on this dataset.</p></sec><sec id="s3-6"><title>Sensitivity Analysis: Residualized HbA<sub>1c</sub> Change</title><p>A sensitivity analysis was performed to evaluate predictors of HbA<sub>1c</sub> change independent of baseline glycemia. Across all models, the maximum <italic>R</italic><sup>2</sup> value decreased to 0.05, indicating that only ~5% of the residual variance in 12-month HbA<sub>1c</sub> response was explained by routine clinical features after removing the effect of baseline HbA<sub>1c</sub>.</p><p>The performance metrics from this analysis further indicated that the RMSE and <italic>R</italic><sup>2</sup> values remained consistent across most models (<xref ref-type="table" rid="table3">Table 3</xref>). However, XGBoost and BART showed poorer performance, with high RMSE and lower <italic>R</italic><sup>2</sup> values. This likely reflects the fact that these algorithms are better suited for large, high-dimensional, or highly nonlinear datasets, whereas the present dataset may not contain sufficient complexity. This consistency across most models suggests that while some approaches explain marginally more variance in the sensitivity analysis, their predictive accuracy in terms of mean squared error remains stable.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Model performance after adjustment for baseline hemoglobin A<sub>1c</sub> (HbA<sub>1c</sub>) across all 6 models.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Models</td><td align="left" valign="bottom">RMSE<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="bottom">MAE<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td><td align="left" valign="bottom"><italic>R</italic><sup>2</sup></td></tr></thead><tbody><tr><td align="left" valign="top">Linear regression</td><td align="left" valign="top">0.127</td><td align="left" valign="top">0.095</td><td align="left" valign="top">0.054</td></tr><tr><td align="left" valign="top">RF<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="top">0.126</td><td align="left" valign="top">0.095</td><td align="left" valign="top">0.056</td></tr><tr><td align="left" valign="top">SVM<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="left" valign="top">0.128</td><td align="left" valign="top">0.094</td><td align="left" valign="top">0.051</td></tr><tr><td align="left" valign="top">XGBoost<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="left" valign="top">0.230</td><td align="left" valign="top">0.183</td><td align="left" valign="top">0.01</td></tr><tr><td align="left" valign="top">NN<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="top">0.127</td><td align="left" valign="top">0.095</td><td align="left" valign="top">0.053</td></tr><tr><td align="left" valign="top">BART<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup></td><td align="left" valign="top">0.214</td><td align="left" valign="top">0.191</td><td align="left" valign="top">0.021</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>RMSE: root mean squared error.</p></fn><fn id="table3fn2"><p><sup>b</sup>MAE: mean absolute error.</p></fn><fn id="table3fn3"><p><sup>c</sup>RF: random forest.</p></fn><fn id="table3fn4"><p><sup>d</sup>SVM: support vector machine.</p></fn><fn id="table3fn5"><p><sup>e</sup>XGBoost: extreme gradient boosting.</p></fn><fn id="table3fn6"><p><sup>f</sup>NN: neural network.</p></fn><fn id="table3fn7"><p><sup>g</sup>BART: Bayesian additive regression trees.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-7"><title>ML Model Performance for Binary Outcome</title><p>For the binary outcome of predicting achievement of HbA<sub>1c</sub> &#x003C;58 mmol/mol, model performance was assessed using the AUC and accuracy. The XGBoost model achieved the highest AUC (0.712), followed closely by BART (0.710), indicating modest discriminatory ability. Logistic regression performed similarly, with an AUC of 0.702.</p><p>The CIs for all models showed substantial overlap (ranging from 0.681 to 0.724 for logistic regression and 0.692 to 0.733 for XGBoost), indicating that no model demonstrated statistically superior discrimination. Overall, the models were broadly comparable in their ability to distinguish responders from nonresponders.</p><p>Model-level classification metrics are summarized in <xref ref-type="table" rid="table4">Table 4</xref>, and the corresponding ROC curves for all models are shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>, illustrating their similar performance profiles. In <xref ref-type="fig" rid="figure2">Figure 2</xref>, colored curves represent the individual models, visually reinforcing the overlapping AUCs and the absence of meaningful differences in classification performance.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Discrimination and classification performance of binary outcome models.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Models</td><td align="left" valign="bottom">AUC<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> (95% CI)</td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom">Precision</td><td align="left" valign="bottom">Recall</td></tr></thead><tbody><tr><td align="left" valign="top">Logistic regression</td><td align="left" valign="top">0.702 (0.681&#x2010;0.724)</td><td align="left" valign="top">0.654</td><td align="left" valign="top">0.657</td><td align="left" valign="top">0.628</td></tr><tr><td align="left" valign="top">RF<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup></td><td align="left" valign="top">0.708 (0.687&#x2010;0.729)</td><td align="left" valign="top">0.652</td><td align="left" valign="top">0.656</td><td align="left" valign="top">0.628</td></tr><tr><td align="left" valign="top">SVM<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">0.705 (0.684&#x2010;0.727)</td><td align="left" valign="top">0.65</td><td align="left" valign="top">0.656</td><td align="left" valign="top">0.618</td></tr><tr><td align="left" valign="top">XGBoost<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup></td><td align="left" valign="top">0.712 (0.692&#x2010;0.733)</td><td align="left" valign="top">0.646</td><td align="left" valign="top">0.65</td><td align="left" valign="top">0.625</td></tr><tr><td align="left" valign="top">NN<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup></td><td align="left" valign="top">0.699 (0.678&#x2010;0.72)</td><td align="left" valign="top">0.645</td><td align="left" valign="top">0.645</td><td align="left" valign="top">0.636</td></tr><tr><td align="left" valign="top">BART<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup></td><td align="left" valign="top">0.71 (0.689&#x2010;0.731)</td><td align="left" valign="top">0.651</td><td align="left" valign="top">0.652</td><td align="left" valign="top">636</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>AUC: area under the receiver operating characteristic curve.</p></fn><fn id="table4fn2"><p><sup>b</sup>RF: random forest.</p></fn><fn id="table4fn3"><p><sup>c</sup>SVM: support vector machine.</p></fn><fn id="table4fn4"><p><sup>d</sup>XGBoost: extreme gradient boosting.</p></fn><fn id="table4fn5"><p><sup>e</sup>NN: neural network.</p></fn><fn id="table4fn6"><p><sup>f</sup>BART: Bayesian additive regression trees.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Receiver operating characteristic (ROC) curves for binary outcome prediction models. Colors correspond to individual models as shown in the legend. ANN: artificial neural network; AUC: area under the receiver operating characteristic curve; BART: Bayesian additive regression trees; SVM: support vector machine; XGBoost: extreme gradient boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="diabetes_v11i1e82635_fig02.png"/></fig></sec><sec id="s3-8"><title>Feature Importance and SHAP Interpretability</title><p>Feature importance analyses consistently identified baseline HbA<sub>1c</sub> as the most significant predictor across all models. Other variables such as BMI, alanine transaminase, total cholesterol, and systolic blood pressure were also found to be significant, though their rankings varied slightly between algorithms. Across all 5 models, the rankings of key predictors remained largely consistent.</p><p>To further explain feature contributions, a SHAP summary plot derived from the XGBoost model is presented (<xref ref-type="fig" rid="figure3">Figure 3</xref>), offering a more granular view of individual feature effects on model predictions. Baseline HbA<sub>1c</sub> had the highest mean SHAP value (0.063), followed by total cholesterol, duration of diabetes, and age. Higher baseline HbA<sub>1c</sub> values were associated with larger predicted reductions in HbA<sub>1c</sub> (ie, more negative SHAP values), indicating greater expected treatment benefit.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Shapley Additive Explanations (SHAP) summary plot of feature importance in predicting glycemic response. Each dot represents 1 patient. The x-axis indicates the SHAP value (impact on model output). The color gradient reflects feature values (blue=higher values; yellow=lower values). Features are ordered by mean absolute SHAP values, indicating overall contribution to model predictions. ALT/SGPT: alanine aminotransferase/serum glutamate pyruvate transaminase; HbA<sub>1c</sub>: hemoglobin A<sub>1c</sub>; HDL: high-density lipoprotein; T2D: type 2 diabetes.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="diabetes_v11i1e82635_fig03.png"/></fig><p>The SHAP plot further shows that lower total cholesterol values corresponded to more negative SHAP values, suggesting better predicted outcomes, whereas higher cholesterol was linked to reduced response. Similarly, shorter diabetes duration and younger age were associated with more favorable predictions. For the variable sex, blue points represent male participants and yellow points represent female participants; male participants were associated with more negative SHAP values, indicating a better predicted response, compared to female participants, whose SHAP values clustered closer to or above zero.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study compared the predictive performance of traditional regression models and a range of ML algorithms for predicting glycemic response to sulfonylurea therapy in individuals with type 2 diabetes. The primary finding is that, with the dataset used, all models demonstrated comparable predictive performance. No ML approach significantly outperformed standard regression for either the continuous outcome or the binary outcome. These results indicate that, within routinely collected clinical data, the additional algorithmic complexity of ML methods does not necessarily yield superior predictive accuracy. Regression therefore remains a robust and interpretable option for predicting drug response in this context.</p><p>Linear regression analysis revealed that the model explained approximately 43% of the variance in changes to HbA<sub>1c</sub>. In the sensitivity analysis, after adjusting for baseline HbA<sub>1c</sub>, the maximum <italic>R</italic>&#x00B2; across all models dropped to 0.05, indicating that only a small proportion of outcome variability was captured by the remaining routine clinical features. This highlights the need for additional or more informative biomarkers to improve prediction.</p><p>Additionally, only about 50% (n=3818) of the participants achieved glycemic control after 1 year of sulfonylurea therapy, despite the relatively homogeneous clinical characteristics of the cohort. This finding highlights considerable interindividual variability in treatment response, suggesting that additional biological and behavioral factors may shape drug efficacy. Such heterogeneity may reflect differences in pharmacodynamic sensitivity, medication adherence, &#x03B2;-cell reserve, and underlying insulin resistance. BMI and HDL were considered indirect proxies of insulin resistance, as higher BMI is typically associated with greater insulin resistance, whereas higher HDL levels are generally linked to improved insulin sensitivity. Consistent with this, participants with higher BMI had poorer glycemic response, while those with higher HDL tended to show more favorable outcomes. However, direct measures of insulin resistance were not available in this dataset.</p></sec><sec id="s4-2"><title>No Added Value From ML Methods</title><p>While multiple ML algorithms were evaluated in parallel with traditional regression models, none demonstrated superior predictive performance. Across both continuous and binary outcomes (<xref ref-type="table" rid="table2">Tables 2 and 4</xref>), differences in metrics such as RMSE, <italic>R</italic>&#x00B2;, and AUC were small and not statistically significant, with overlapping CIs for all models. Even after hyperparameter tuning, predictive metrics remained modest, suggesting that ML methods did not uncover hidden patterns or interactions that traditional models missed.</p><p>This limited gain in predictive accuracy likely reflects the nature of routinely collected clinical data, which may lack sufficient biological complexity for ML algorithms to exploit. When input variables do not encompass detailed mechanistic information, even advanced algorithms cannot extract additional predictive signal. Consequently, transparent and easily interpretable models, such as linear or mixed-effects regression, may remain preferable, particularly when predictive performance is comparable. These models allow clinicians to understand feature contributions directly and translate findings into actionable treatment decisions.</p><p>Although complex ML models theoretically enable the capture of nonlinear relationships, their greater computational burden and reduced interpretability may limit their clinical utility unless they provide meaningful improvements in accuracy. The consistency of results across all modeling strategies, ranging from simple linear regression to ensemble and NN approaches, suggests that the available clinical features may not contain enough biological heterogeneity for ML methods to offer an advantage.</p><p>By intentionally comparing models of differing complexity, this study demonstrates that when data lack substantial nonlinearity or high-dimensional interactions, regression-based methods may remain more appropriate and efficient. This finding supports the continued reliance on interpretable models in routine clinical prediction tasks, where model parsimony and interpretability remain more valuable than algorithmic complexity for precision-medicine applications.</p></sec><sec id="s4-3"><title>Features That Inform Drug Response Prediction</title><p>Feature importance and SHAP analyses consistently identified baseline HbA<sub>1c</sub>, age, BMI, and sex as key predictors across regression and ML models. Baseline HbA<sub>1c</sub> was the strongest predictor, reflecting both regression to the mean and true physiological responsiveness [<xref ref-type="bibr" rid="ref34">34</xref>]. Older age and male sex were associated with greater HbA<sub>1c</sub> reduction, whereas higher BMI predicted poorer response, aligning with evidence that adiposity may reduce sulfonylurea effectiveness [<xref ref-type="bibr" rid="ref35">35</xref>]. These findings parallel results from the 5-drug predictive model developed by Dennis et al [<xref ref-type="bibr" rid="ref36">36</xref>], suggesting that these core predictors generalize across therapeutic classes.</p><p>C-peptide, available for a subset of participants, showed a strong positive association with glycemic improvement, consistent with the insulin-secretagogue mechanism of sulfonylureas. This highlights the contribution of &#x03B2;-cell reserve to treatment heterogeneity and underscores the value of including mechanistic biomarkers to enhance model interpretability and predictive accuracy.</p></sec><sec id="s4-4"><title>Limitations</title><p>This study has several limitations. First, routinely collected clinical data omit key determinants of treatment response such as adherence, diet, physical activity, genetics, and social factors. The limited availability of C-peptide prevented fuller assessment of &#x03B2;-cell function, and its strong association with response suggests that the inclusion of mechanistic biomarkers would likely improve predictive accuracy.</p><p>Second, the study population was limited to patients from Tayside and Fife in Scotland, which may reduce the generalizability of the findings to other regions or health care systems with different population characteristics or clinical practices.</p><p>Third, treatment response was assessed using a single HbA<sub>1c</sub> value taken between 6 and 15 months after treatment initiation. Although data closest to 12 months post-initiation were used, variability in the follow-up period (6&#x2010;15 mo) may introduce measurement variability and ought to be considered.</p><p>Additionally, the relatively low <italic>R</italic>&#x00B2; values across all models, even after applying rigorous methods such as a 70/30 train-test split and 10-fold cross-validation, suggest that the available clinical features alone do not explain sufficient variation in treatment response to support strong predictive performance.</p></sec><sec id="s4-5"><title>Future Directions</title><p>Future research should focus on improving prediction models by incorporating richer and more diverse data sources, including genetic, metabolomic, and continuous glucose monitoring data, as well as direct measures of insulin resistance and &#x03B2;-cell function. Integrating these modalities could improve model accuracy and help explain why individuals respond differently to sulfonylurea treatment. In addition, future studies could explore advanced modeling approaches, such as deep learning or hybrid models that balance predictive power with ease of interpretation for clinical use. The increasing availability of real-world, longitudinal clinical data also supports the use of time-dependent models, such as recurrent neural networks or transformer models, to track how treatment response evolves over time. Finally, testing these models in independent and ethnically diverse populations will be important to assess their generalizability and real-world applicability.</p><p>In conclusion, this study shows that the traditional regression models remain robust, clinically interpretable, and sufficient for predicting glycemic response to sulfonylurea therapy using routine data. The comparable performance of ML methods suggests that model transparency and accessibility may currently outweigh the small gains offered by algorithmic complexity in this context.</p></sec></sec></body><back><notes><sec><title>Funding</title><p>This work was supported by funding from Novo Nordisk, which provided a PhD studentship to SG.</p></sec></notes><fn-group><fn fn-type="con"><p>EP, RK, and RG contributed to conceptualization and supervision. SG conducted the data analysis and wrote the original manuscript. SG, EP, RK, and RG contributed to the reviewing and editing. ET reviewed the manuscript.</p></fn><fn fn-type="conflict"><p>RK is an employee of Novo Nordisk and serves as a director in Research and Development. RG is employed by Novo Nordisk and Disease Intelligence Pte Ltd and holds stock in both companies. The remaining authors declare no conflicts of interest.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb2">BART</term><def><p>Bayesian additive regression trees</p></def></def-item><def-item><term id="abb3">C-peptide</term><def><p>connecting peptide</p></def></def-item><def-item><term id="abb4">GoDARTS</term><def><p>Genetics of Diabetes Audit and Research in Tayside Scotland</p></def></def-item><def-item><term id="abb5">HbA<sub>1c</sub></term><def><p>hemoglobin A<sub>1c</sub></p></def></def-item><def-item><term id="abb6">HDL</term><def><p>high-density lipoprotein</p></def></def-item><def-item><term id="abb7">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb8">NHS</term><def><p>National Health Service</p></def></def-item><def-item><term id="abb9">NN</term><def><p>neural network</p></def></def-item><def-item><term id="abb10">RMSE</term><def><p>root mean square error</p></def></def-item><def-item><term id="abb11">SHAP</term><def><p>Shapley Additive Explanations</p></def></def-item><def-item><term id="abb12">VIF</term><def><p>variance inflation factor</p></def></def-item><def-item><term id="abb13">XGBoost</term><def><p>extreme gradient boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="web"><article-title>Diabetes</article-title><source>National Institute for Health and Care Excellence</source><access-date>2026-01-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.nice.org.uk/guidance/conditions-and-diseases/diabetes-and-other-endocrinal--nutritional-and-metabolic-conditions/diabetes">https://www.nice.org.uk/guidance/conditions-and-diseases/diabetes-and-other-endocrinal--nutritional-and-metabolic-conditions/diabetes</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pearson</surname><given-names>ER</given-names> </name><name name-style="western"><surname>Donnelly</surname><given-names>LA</given-names> </name><name name-style="western"><surname>Kimber</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Variation in TCF7L2 influences therapeutic response to sulfonylureas: a GoDARTs study</article-title><source>Diabetes</source><year>2007</year><month>08</month><volume>56</volume><issue>8</issue><fpage>2178</fpage><lpage>2182</lpage><pub-id pub-id-type="doi">10.2337/db07-0440</pub-id><pub-id pub-id-type="medline">17519421</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Uemura</surname><given-names>F</given-names> </name><name name-style="western"><surname>Okada</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Torimoto</surname><given-names>K</given-names> </name><name name-style="western"><surname>Tanaka</surname><given-names>Y</given-names> </name></person-group><article-title>Enlarged glycemic variability in sulfonylurea-treated well-controlled type 2 diabetics identified using continuous glucose monitoring</article-title><source>Sci Rep</source><year>2021</year><month>03</month><day>1</day><volume>11</volume><issue>1</issue><fpage>4875</fpage><pub-id pub-id-type="doi">10.1038/s41598-021-83999-z</pub-id><pub-id pub-id-type="medline">33649395</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chung</surname><given-names>WK</given-names> </name><name name-style="western"><surname>Erion</surname><given-names>K</given-names> </name><name name-style="western"><surname>Florez</surname><given-names>JC</given-names> </name><etal/></person-group><article-title>Precision medicine in diabetes: a consensus report from the American Diabetes Association (ADA) and the European Association for the Study of Diabetes (EASD)</article-title><source>Diabetes Care</source><year>2020</year><month>07</month><volume>43</volume><issue>7</issue><fpage>1617</fpage><lpage>1635</lpage><pub-id pub-id-type="doi">10.2337/dci20-0022</pub-id><pub-id pub-id-type="medline">32561617</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Maddaloni</surname><given-names>E</given-names> </name><name name-style="western"><surname>Bolli</surname><given-names>GB</given-names> </name><name name-style="western"><surname>Frier</surname><given-names>BM</given-names> </name><etal/></person-group><article-title>C-peptide determination in the diagnosis of type of diabetes and its management: a clinical perspective</article-title><source>Diabetes Obes Metab</source><year>2022</year><month>10</month><volume>24</volume><issue>10</issue><fpage>1912</fpage><lpage>1926</lpage><pub-id pub-id-type="doi">10.1111/dom.14785</pub-id><pub-id pub-id-type="medline">35676794</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Garg</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kitchen</surname><given-names>R</given-names> </name><name name-style="western"><surname>Gupta</surname><given-names>R</given-names> </name><name name-style="western"><surname>Pearson</surname><given-names>E</given-names> </name></person-group><article-title>Applications of AI in predicting drug responses for type 2 diabetes</article-title><source>JMIR Diabetes</source><year>2025</year><month>03</month><day>27</day><volume>10</volume><fpage>e66831</fpage><pub-id pub-id-type="doi">10.2196/66831</pub-id><pub-id pub-id-type="medline">40146874</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zou</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ji</surname><given-names>L</given-names> </name></person-group><article-title>Review: Machine learning in precision pharmacotherapy of type 2 diabetes&#x2014;a promising future or a glimpse of hope?</article-title><source>Digit Health</source><year>2023</year><volume>9</volume><fpage>20552076231203879</fpage><pub-id pub-id-type="doi">10.1177/20552076231203879</pub-id><pub-id pub-id-type="medline">37786401</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Multimodal integration in health care: development with applications in disease management</article-title><source>J Med Internet Res</source><year>2025</year><month>08</month><day>21</day><volume>27</volume><fpage>e76557</fpage><pub-id pub-id-type="doi">10.2196/76557</pub-id><pub-id pub-id-type="medline">40840463</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ren</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Xiao</surname><given-names>D</given-names> </name><name name-style="western"><surname>Han</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Genetic and clinical predictive factors of sulfonylurea failure in patients with type 2 diabetes</article-title><source>Diabetes Technol Ther</source><year>2016</year><month>09</month><volume>18</volume><issue>9</issue><fpage>586</fpage><lpage>593</lpage><pub-id pub-id-type="doi">10.1089/dia.2015.0427</pub-id><pub-id pub-id-type="medline">27403931</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Lundberg</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SI</given-names> </name></person-group><article-title>A unified approach to interpreting model predictions</article-title><source>arXiv</source><comment>Preprint posted online on  May 22, 2017</comment><pub-id pub-id-type="doi">10.48550/arXiv.1705.07874</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>H&#x00E9;bert</surname><given-names>HL</given-names> </name><name name-style="western"><surname>Shepherd</surname><given-names>B</given-names> </name><name name-style="western"><surname>Milburn</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Cohort profile: Genetics of Diabetes Audit and Research in Tayside Scotland (GoDARTS)</article-title><source>Int J Epidemiol</source><year>2018</year><month>04</month><day>1</day><volume>47</volume><issue>2</issue><fpage>380</fpage><lpage>381j</lpage><pub-id pub-id-type="doi">10.1093/ije/dyx140</pub-id><pub-id pub-id-type="medline">29025058</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Martono</surname><given-names>DP</given-names> </name><name name-style="western"><surname>Lub</surname><given-names>R</given-names> </name><name name-style="western"><surname>Lambers Heerspink</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Hak</surname><given-names>E</given-names> </name><name name-style="western"><surname>Wilffert</surname><given-names>B</given-names> </name><name name-style="western"><surname>Denig</surname><given-names>P</given-names> </name></person-group><article-title>Predictors of response in initial users of metformin and sulphonylurea derivatives: a systematic review</article-title><source>Diabet Med</source><year>2015</year><month>07</month><volume>32</volume><issue>7</issue><fpage>853</fpage><lpage>864</lpage><pub-id pub-id-type="doi">10.1111/dme.12688</pub-id><pub-id pub-id-type="medline">25582542</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Feng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>N</given-names> </name><name name-style="western"><surname>Tu</surname><given-names>XM</given-names> </name></person-group><article-title>Log transformation: application and interpretation in biomedical research</article-title><source>Stat Med</source><year>2013</year><month>01</month><day>30</day><volume>32</volume><issue>2</issue><fpage>230</fpage><lpage>239</lpage><pub-id pub-id-type="doi">10.1002/sim.5486</pub-id><pub-id pub-id-type="medline">22806695</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cao</surname><given-names>XH</given-names> </name><name name-style="western"><surname>Stojkovic</surname><given-names>I</given-names> </name><name name-style="western"><surname>Obradovic</surname><given-names>Z</given-names> </name></person-group><article-title>A robust data scaling algorithm to improve classification accuracies in biomedical data</article-title><source>BMC Bioinformatics</source><year>2016</year><month>09</month><day>9</day><volume>17</volume><issue>1</issue><fpage>359</fpage><pub-id pub-id-type="doi">10.1186/s12859-016-1236-x</pub-id><pub-id pub-id-type="medline">27612635</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Van Buuren</surname><given-names>S</given-names> </name><name name-style="western"><surname>Groothuis-Oudshoorn</surname><given-names>K</given-names> </name></person-group><article-title>mice: multivariate imputation by chained equations in R</article-title><source>J Stat Softw</source><year>2011</year><month>12</month><volume>45</volume><issue>3</issue><fpage>67</fpage><pub-id pub-id-type="doi">10.18637/jss.v045.i03</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Rubin</surname><given-names>DB</given-names> </name></person-group><source>Multiple Imputation for Nonresponse in Surveys</source><year>1987</year><publisher-name>John Wiley &#x0026; Sons</publisher-name></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>O&#x2019;brien</surname><given-names>RM</given-names> </name></person-group><article-title>A caution regarding rules of thumb for variance inflation factors</article-title><source>Qual Quant</source><year>2007</year><month>09</month><day>11</day><volume>41</volume><issue>5</issue><fpage>673</fpage><lpage>690</lpage><pub-id pub-id-type="doi">10.1007/s11135-006-9018-6</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Hastie</surname><given-names>T</given-names> </name><name name-style="western"><surname>Tibshirani</surname><given-names>R</given-names> </name><name name-style="western"><surname>Friedman</surname><given-names>J</given-names> </name></person-group><source>The Elements of Statistical Learning: Data Mining, Inference, and Prediction</source><year>2009</year><edition>2</edition><publisher-name>Springer Series in Statistics</publisher-name><pub-id pub-id-type="doi">10.1007/978-0-387-84858-7</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Garc&#x00ED;a</surname><given-names>CB</given-names> </name><name name-style="western"><surname>Salmer&#x00F3;n</surname><given-names>R</given-names> </name><name name-style="western"><surname>Garc&#x00ED;a</surname><given-names>C</given-names> </name><name name-style="western"><surname>Garc&#x00ED;a</surname><given-names>J</given-names> </name></person-group><article-title>Residualization: justification, properties and application</article-title><source>J Appl Stat</source><year>2020</year><volume>47</volume><issue>11</issue><fpage>1990</fpage><lpage>2010</lpage><pub-id pub-id-type="doi">10.1080/02664763.2019.1701638</pub-id><pub-id pub-id-type="medline">35707574</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Breiman</surname><given-names>L</given-names> </name></person-group><article-title>Random forests</article-title><source>Mach Learn</source><year>2001</year><month>10</month><volume>45</volume><issue>1</issue><fpage>5</fpage><lpage>32</lpage><pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cortes</surname><given-names>C</given-names> </name><name name-style="western"><surname>Vapnik</surname><given-names>V</given-names> </name></person-group><article-title>Support-vector networks</article-title><source>Mach Learn</source><year>1995</year><month>09</month><volume>20</volume><issue>3</issue><fpage>273</fpage><lpage>297</lpage><pub-id pub-id-type="doi">10.1007/BF00994018</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Guestrin</surname><given-names>C</given-names> </name></person-group><article-title>XGBoost: a scalable tree boosting system</article-title><source>arXiv</source><comment>Preprint posted online on  Mar 9, 2016</comment><pub-id pub-id-type="doi">10.48550/arXiv.1603.02754</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rumelhart</surname><given-names>D</given-names> </name><name name-style="western"><surname>Hinton</surname><given-names>G</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>R</given-names> </name></person-group><article-title>Learning representations by back-propagating errors</article-title><source>Nature New Biol</source><year>2002</year><volume>323</volume><fpage>533</fpage><lpage>536</lpage><pub-id pub-id-type="doi">10.1038/323533a0</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chipman</surname><given-names>HA</given-names> </name><name name-style="western"><surname>George</surname><given-names>EI</given-names> </name><name name-style="western"><surname>McCulloch</surname><given-names>RE</given-names> </name></person-group><article-title>BART: Bayesian additive regression trees</article-title><source>Ann Appl Stat</source><year>2010</year><month>03</month><volume>4</volume><issue>1</issue><fpage>266</fpage><lpage>298</lpage><pub-id pub-id-type="doi">10.1214/09-AOAS285</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kapelner</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bleich</surname><given-names>J</given-names> </name></person-group><article-title>bartMachine: machine learning with Bayesian additive regression trees</article-title><source>J Stat Soft</source><year>2016</year><month>04</month><volume>70</volume><issue>4</issue><fpage>40</fpage><pub-id pub-id-type="doi">10.18637/jss.v070.i04</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cardoso</surname><given-names>P</given-names> </name><name name-style="western"><surname>Young</surname><given-names>KG</given-names> </name><name name-style="western"><surname>Hopkins</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Evaluating prediction of short-term tolerability of five type 2 diabetes drug classes using routine clinical features: UK population-based study</article-title><source>Diabetes Obes Metab</source><year>2025</year><month>08</month><volume>27</volume><issue>8</issue><fpage>4320</fpage><lpage>4329</lpage><pub-id pub-id-type="doi">10.1111/dom.16470</pub-id><pub-id pub-id-type="medline">40375735</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cardoso</surname><given-names>P</given-names> </name><name name-style="western"><surname>Young</surname><given-names>KG</given-names> </name><name name-style="western"><surname>Nair</surname><given-names>ATN</given-names> </name><etal/></person-group><article-title>Phenotype-based targeted treatment of SGLT2 inhibitors and GLP-1 receptor agonists in type 2 diabetes</article-title><source>Diabetologia</source><year>2024</year><month>05</month><volume>67</volume><issue>5</issue><fpage>822</fpage><lpage>836</lpage><pub-id pub-id-type="doi">10.1007/s00125-024-06099-3</pub-id><pub-id pub-id-type="medline">38388753</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="web"><article-title>Drug response prediction</article-title><source>GitHub</source><year>2025</year><access-date>2026-01-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/Pearson-Research-Lab/Drug-Response-Prediction">https://github.com/Pearson-Research-Lab/Drug-Response-Prediction</ext-link></comment></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Willmott</surname><given-names>C</given-names> </name><name name-style="western"><surname>Matsuura</surname><given-names>K</given-names> </name></person-group><article-title>Advantages of the mean absolute error (MAE) over the root mean square error (RMSE) in assessing average model performance</article-title><source>Clim Res</source><year>2005</year><volume>30</volume><fpage>79</fpage><lpage>82</lpage><pub-id pub-id-type="doi">10.3354/cr030079</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Freedman</surname><given-names>D</given-names> </name></person-group><source>Statistical Models: Theory and Practice</source><year>2005</year><publisher-name>Cambridge University Press</publisher-name><pub-id pub-id-type="doi">10.1017/CBO9781139165495</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fawcett</surname><given-names>T</given-names> </name></person-group><article-title>An introduction to ROC analysis</article-title><source>Pattern Recognit Lett</source><year>2006</year><month>06</month><volume>27</volume><issue>8</issue><fpage>861</fpage><lpage>874</lpage><pub-id pub-id-type="doi">10.1016/j.patrec.2005.10.010</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Powers</surname><given-names>DMW</given-names> </name></person-group><article-title>Evaluation: from precision, recall and F-factor to ROC, informedness, markedness &#x0026; correlation</article-title><source>Mach Learn Technol</source><year>2008</year><month>01</month><access-date>2026-01-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.researchgate.net/publication/228529307_Evaluation_From_Precision_Recall_and_F-Factor_to_ROC_Informedness_Markedness_Correlation">https://www.researchgate.net/publication/228529307_Evaluation_From_Precision_Recall_and_F-Factor_to_ROC_Informedness_Markedness_Correlation</ext-link></comment></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kuhn</surname><given-names>M</given-names> </name></person-group><article-title>Building predictive models in R using the caret package</article-title><source>J Stat Softw</source><year>2008</year><month>11</month><volume>28</volume><issue>5</issue><fpage>26</fpage><pub-id pub-id-type="doi">10.18637/jss.v028.i05</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jones</surname><given-names>AG</given-names> </name><name name-style="western"><surname>Lonergan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Henley</surname><given-names>WE</given-names> </name><name name-style="western"><surname>Pearson</surname><given-names>ER</given-names> </name><name name-style="western"><surname>Hattersley</surname><given-names>AT</given-names> </name><name name-style="western"><surname>Shields</surname><given-names>BM</given-names> </name></person-group><article-title>Should studies of diabetes treatment stratification correct for baseline HbA1c?</article-title><source>PLoS ONE</source><year>2016</year><volume>11</volume><issue>4</issue><fpage>e0152428</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0152428</pub-id><pub-id pub-id-type="medline">27050911</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dennis</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Henley</surname><given-names>WE</given-names> </name><name name-style="western"><surname>Weedon</surname><given-names>MN</given-names> </name><etal/></person-group><article-title>Sex and BMI alter the benefits and risks of sulfonylureas and thiazolidinediones in type 2 diabetes: a framework for evaluating stratification using routine clinical and individual trial data</article-title><source>Diabetes Care</source><year>2018</year><month>09</month><volume>41</volume><issue>9</issue><fpage>1844</fpage><lpage>1853</lpage><pub-id pub-id-type="doi">10.2337/dc18-0344</pub-id><pub-id pub-id-type="medline">30072404</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dennis</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Young</surname><given-names>KG</given-names> </name><name name-style="western"><surname>Cardoso</surname><given-names>P</given-names> </name><etal/></person-group><article-title>A five-drug class model using routinely available clinical features to optimise prescribing in type 2 diabetes: a prediction model development and validation study</article-title><source>Lancet</source><year>2025</year><month>03</month><day>1</day><volume>405</volume><issue>10480</issue><fpage>701</fpage><lpage>714</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(24)02617-5</pub-id><pub-id pub-id-type="medline">40020703</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Missing data imputation.</p><media xlink:href="diabetes_v11i1e82635_app1.docx" xlink:title="DOCX File, 23 KB"/></supplementary-material></app-group></back></article>