<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JD</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Diabetes</journal-id>
      <journal-title>JMIR Diabetes</journal-title>
      <issn pub-type="epub">2371-4379</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i1e53338</article-id>
      <article-id pub-id-type="pmid">39110490</article-id>
      <article-id pub-id-type="doi">10.2196/53338</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Machine Learning Model for Risk Stratification of Postdiagnosis Diabetic Ketoacidosis Hospitalization in Pediatric Type 1 Diabetes: Retrospective Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Cahill</surname>
            <given-names>Naomi</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Dey</surname>
            <given-names>Amit</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Degen</surname>
            <given-names>Isabella</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhang</surname>
            <given-names>Yijue</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Subramanian</surname>
            <given-names>Devika</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8168-1607</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Sonabend</surname>
            <given-names>Rona</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0004-6011-7742</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Singh</surname>
            <given-names>Ila</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <address>
            <institution>Department of Pathology and Immunology</institution>
            <institution>Baylor College of Medicine</institution>
            <addr-line>One Baylor Plaza</addr-line>
            <addr-line>Houston, TX, 77030</addr-line>
            <country>United States</country>
            <phone>1 832 824 7449</phone>
            <email>irsingh@texaschildrens.org</email>
          </address>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4786-3511</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Computer Science</institution>
        <institution>Rice University</institution>
        <addr-line>Houston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Pediatrics</institution>
        <institution>Baylor College of Medicine</institution>
        <addr-line>Houston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Division of Endocrinology</institution>
        <institution>Department of Pediatrics</institution>
        <institution>Texas Children’s Hospital</institution>
        <addr-line>Houston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Pathology and Immunology</institution>
        <institution>Baylor College of Medicine</institution>
        <addr-line>Houston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Divisions of Laboratory Medicine and Pathology Informatics</institution>
        <institution>Department of Pathology</institution>
        <institution>Texas Children’s Hospital</institution>
        <addr-line>Houston, TX</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Ila Singh <email>irsingh@texaschildrens.org</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>7</day>
        <month>8</month>
        <year>2024</year>
      </pub-date>
      <volume>9</volume>
      <elocation-id>e53338</elocation-id>
      <history>
        <date date-type="received">
          <day>4</day>
          <month>10</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>2</day>
          <month>1</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>11</day>
          <month>4</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>29</day>
          <month>5</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Devika Subramanian, Rona Sonabend, Ila Singh. Originally published in JMIR Diabetes (https://diabetes.jmir.org), 07.08.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Diabetes, is properly cited. The complete bibliographic information, a link to the original publication on https://diabetes.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://diabetes.jmir.org/2024/1/e53338" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Diabetic ketoacidosis (DKA) is the leading cause of morbidity and mortality in pediatric type 1 diabetes (T1D), occurring in approximately 20% of patients, with an economic cost of $5.1 billion/year in the United States. Despite multiple risk factors for postdiagnosis DKA, there is still a need for explainable, clinic-ready models that accurately predict DKA hospitalization in established patients with pediatric T1D.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to develop an interpretable machine learning model to predict the risk of postdiagnosis DKA hospitalization in children with T1D using routinely collected time-series of electronic health record (EHR) data.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We conducted a retrospective case-control study using EHR data from 1787 patients from among 3794 patients with T1D treated at a large tertiary care US pediatric health system from January 2010 to June 2018. We trained a state-of-the-art; explainable, gradient-boosted ensemble (XGBoost) of decision trees with 44 regularly collected EHR features to predict postdiagnosis DKA. We measured the model’s predictive performance using the area under the receiver operating characteristic curve–weighted <italic>F</italic><sub>1</sub>-score, weighted precision, and recall, in a 5-fold cross-validation setting. We analyzed Shapley values to interpret the learned model and gain insight into its predictions.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our model distinguished the cohort that develops DKA postdiagnosis from the one that does not (P&lt;.001). It predicted postdiagnosis DKA risk with an area under the receiver operating characteristic curve of 0.80 (SD 0.04), a weighted <italic>F</italic><sub>1</sub>-score of 0.78 (SD 0.04), and a weighted precision and recall of 0.83 (SD 0.03) and 0.76 (SD 0.05) respectively, using a relatively short history of data from routine clinic follow-ups post diagnosis. On analyzing Shapley values of the model output, we identified key risk factors predicting postdiagnosis DKA both at the cohort and individual levels. We observed sharp changes in postdiagnosis DKA risk with respect to 2 key features (diabetes age and glycated hemoglobin at 12 months), yielding time intervals and glycated hemoglobin cutoffs for potential intervention. By clustering model-generated Shapley values, we automatically stratified the cohort into 3 groups with 5%, 20%, and 48% risk of postdiagnosis DKA.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We have built an explainable, predictive, machine learning model with potential for integration into clinical workflow. The model risk-stratifies patients with pediatric T1D and identifies patients with the highest postdiagnosis DKA risk using limited follow-up data starting from the time of diagnosis. The model identifies key time points and risk factors to direct clinical interventions at both the individual and cohort levels. Further research with data from multiple hospital systems can help us assess how well our model generalizes to other populations. The clinical importance of our work is that the model can predict patients most at risk for postdiagnosis DKA and identify preventive interventions based on mitigation of individualized risk factors.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>pediatric type 1 diabetes</kwd>
        <kwd>postdiagnosis diabetic ketoacidosis</kwd>
        <kwd>risk prediction and stratification</kwd>
        <kwd>XGBoost</kwd>
        <kwd>Shapley values</kwd>
        <kwd>ketoacidosis</kwd>
        <kwd>risks</kwd>
        <kwd>predict</kwd>
        <kwd>prediction</kwd>
        <kwd>predictive</kwd>
        <kwd>gradient-boosted ensemble model</kwd>
        <kwd>diabetes</kwd>
        <kwd>pediatrics</kwd>
        <kwd>children</kwd>
        <kwd>machine learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Diabetic ketoacidosis (DKA) is the leading cause of morbidity and mortality among patients with pediatric type 1 diabetes (T1D), accounting for nearly 50% of all deaths in this population [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. DKA occurs in 20% of patients with T1D, with an average cost of US $26,566 per DKA admission and a total economic cost of US $5.1 billion/year in the United States [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. Hospitalizations for DKA in the United States have increased by 6.3% each year from 2009 to 2014 despite many attempts at prevention [<xref ref-type="bibr" rid="ref8">8</xref>]. The incidence of DKA hospitalizations postdiagnosis has been estimated to be about 8 to 16 per 100 person-years in the pediatric population, with variations in both patient populations and in hospital or care systems [<xref ref-type="bibr" rid="ref9">9</xref>]. DKA has a significant impact on growth and development in children, potentially leading to neurocognitive impairment, cerebral edema, coma, or even death [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref10">10</xref>].</p>
        <p>Most prior studies pertaining to DKA hospitalization risk in pediatric patients are associational in nature, focusing on assessing DKA prevalence, predicting the risk of DKA at onset, and relating DKA at onset to its impact on glycemic control. These studies [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref18">18</xref>], conducted with a limited number of electronic health record (EHR)–derived features, using classical statistical methods, have identified the most common factors associated with DKA in patients with pediatric T1D. They include (1) insulin omission, especially in the context of chronic hyperglycemia (high glycated hemoglobin [HbA<sub>1c</sub>]) [<xref ref-type="bibr" rid="ref5">5</xref>], (2) females of age greater than 10 years, (3) racial minority youths (Hispanic and African American) [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>], (4) nonprivate health insurance (a proxy for socioeconomic disadvantage) [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>], (5) underlying mental health comorbidities, and (6) prior-DKA [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref25">25</xref>].</p>
        <p>Despite knowledge of DKA risk factors, there are few predictive tools ready for clinical integration that can accurately stratify DKA risk for established patients. This is partly because the relationship between known risk factors and postdiagnosis DKA is complex [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref25">25</xref>] and highly nonlinear, whereas tools for elucidating them have been generally limited to simple statistical models, such as logistic regression. Over the last 2 decades, nonlinear predictive techniques ranging from deep neural networks [<xref ref-type="bibr" rid="ref26">26</xref>] to ensemble methods such as bagging and boosting [<xref ref-type="bibr" rid="ref27">27</xref>], have been devised in the field of supervised machine learning. These methods derive their power from the ability to infer complex prediction functions directly from raw data. They have allowed for great progress in some diagnostic areas: diabetic retinopathy [<xref ref-type="bibr" rid="ref28">28</xref>], machine translation of clinical notes [<xref ref-type="bibr" rid="ref29">29</xref>], object recognition in radiologic or pathologic images [<xref ref-type="bibr" rid="ref30">30</xref>], as well as in DKA prediction in both patients with pediatric and adult T1D [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>], but pose challenges in terms of interpretability.</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>We develop an explainable, machine-learning model to predict pediatric patients with T1D who are at risk of DKA hospitalization postdiagnosis using a time-series of routinely collected, EHR data. We evaluate the predictive performance of our gradient-boosted decision tree model (XGBoost) on one of the largest cohorts of pediatric patients with T1D. Further, we use Shapely value analysis of our model outputs to (1) derive key predictive factors for postdiagnosis DKA, both at the cohort and at the individual levels, (2) reveal the progression of postdiagnosis DKA risk over time, and (3) automatically perform cohort-level risk stratification by agglomerative clustering of Shapley values.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>This study accessed deidentified EHR data from 6288 pediatric patients with diabetes, 3794 of them with a confirmed T1D diagnosis, between January 1, 2010, and June 30, 2018, treated at Texas Children’s Hospital (TCH). TCH is one of the largest tertiary-care pediatric health systems in the United States, and likely has some of the largest sets of pediatric patients with diabetes.</p>
        <p>To limit unintended biases and erroneous predictions caused by missing data, we defined stringent inclusion criteria to select the training cohort for model building. We selected patients who were (1) initially diagnosed at, and subsequently followed up within the TCH system with an onset date on or after January 1, 2010, (2) whose age at diagnosis was between 0 and 21 years, (3) who had at least 1 positive antibody titer (glutamic acid decarboxylase 65-kilodalton isoform [GAD65], islet cell autoantigen 512 [ICA512], and insulin AB) at diagnosis, and (4) with a clinical diagnosis of T1D by an endocrinologist. These criteria excluded 1723 patients from the first criterion, 45 from the second, and 239 from the third; with a remainder of 1787 patients included in the final analysis. Of these 1787 patients, 324 experienced at least 1 postdiagnosis DKA hospitalization. The small number of overall and positive cases is a consequence of T1D itself being a rare pediatric disease and postdiagnosis DKA being a rare complication of this disease.</p>
      </sec>
      <sec>
        <title>Feature Generation and Selection</title>
        <sec>
          <title>Feature Construction</title>
          <p>For each patient in the cohort, we extracted more than 100 features available in the EHR, from the time of diagnosis to 3-month clinic follow-ups for up to 2 years after onset. The data included demographic information, clinical data, laboratory values, treatment modality (insulin delivery), hospitalization records, and ambulatory care components. Demographic features included age at diagnosis (onset age), sex, race, ethnicity, and socioeconomic status proxies such as type of insurance, and zip code of residence. Clinical features included vital signs, BMI, and laboratory values including titers at the time of diagnosis. We included both raw diabetes titer values, as well as discretized Boolean (0 or 1) titer values (1 if GAD65 [<xref ref-type="bibr" rid="ref33">33</xref>] titer &gt;5 IU/mL, 1 if ICA512 [<xref ref-type="bibr" rid="ref33">33</xref>] titer &gt;5.4 IU/mL, 1 if insulin AB [<xref ref-type="bibr" rid="ref33">33</xref>] titer &gt;0.4 U/mL). We also included HbA<sub>1c</sub> values at diagnosis and at 3-month clinic follow-ups for up to 24 months. Hospitalization features included length of stay, laboratory-test time-series during the stay, as well as therapeutic interventions. Ambulatory care features included the use of auxiliary services (educators, nutrition services, psychology, and social workers), as well as no-shows and cancellations. We also included diabetes age (years after T1D onset), whether there was DKA at onset, and C-peptide value at the time of diagnosis since they were clinically relevant features.</p>
        </sec>
        <sec>
          <title>Feature Selection</title>
          <p>We omitted features that were missing values for more than 50% of the cohort. We dropped ambulatory care component features and most laboratory test features (except for HbA<sub>1c</sub>) on this basis. We also omitted features highly correlated with HbA<sub>1c</sub> values (such as the BMI time series) because they did not add to the predictive power of the model. In addition, we dropped all features perfectly correlated with the outcome variable—these included all hospitalization-derived features including laboratory tests conducted during DKA hospitalization and therapeutic interventions during hospitalization. This left us with 44 features described in detail later. We did not use additional feature selection methods, relying instead on XGBoost to select relevant features in the construction of the final decision ensemble.</p>
        </sec>
        <sec>
          <title>Missing Value Imputation</title>
          <p>We used a simple piecewise linear interpolation technique to fill in missing values in HbA<sub>1c</sub> records. HbA<sub>1c</sub> imputation was done only between 2 known values—for example, if the 3-month and 9-month HbA<sub>1c</sub> values for a patient were known, then the 6-month value was imputed as the average. We did not perform any other imputation. The XGBoost learning algorithm handles missing values by default, obviating the need for more imputation.</p>
        </sec>
        <sec>
          <title>Final Features</title>
          <p>The 44 features finally used for each patient in our cohort included 15 demographic features: sex (male or female), insurance (private or Medicaid or self-pay), race (White, African American, Asian, and Other), ethnicity (Hispanic, non-Hispanic, and Other), first 3 digits of zip code, 7 diabetes titers (raw values and discretized values for GAD65, ICA512, insulin AB, and the total number of positive antibody titers), 17 HbA<sub>1c</sub> features including 9 values of HbA<sub>1c</sub> (at diagnosis, and at 3-month follow-ups from 3 to 24 months), as well as 8 delta measures (differences between HbA<sub>1c</sub> measurements at successive follow-ups), and 5 other features: diabetes age (years since T1D diagnosis), onset age, DKA at onset (yes or no), C-peptide titer at diagnosis, and discretized C-peptide (&gt;1 U/mL).</p>
        </sec>
      </sec>
      <sec>
        <title>Outcome Definition</title>
        <p>We used hospitalization with DKA after diagnosis of T1D to define the outcome variable. We split the cohort into 2 classes: those who experienced at least 1 DKA episode after diagnosis (324/1787, 18%) and those who did not.</p>
      </sec>
      <sec>
        <title>Model Selection and Training Protocol</title>
        <p>We trained a multivariate gradient boosting decision tree ensemble on the data, using the Python XGBoost open-source library [<xref ref-type="bibr" rid="ref34">34</xref>]. As illustrated in Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, we used a 5-fold stratified cross-validation approach. We divided the data set into 5 equal-sized folds, with the ratio of patients with postdiagnosis DKA and non-DKA being equal in all groups. We used 4 of the folds for training a gradient-boosted ensemble and used the held-out fold for testing the ensemble. We repeated the process 5 times, each time with a different held-out fold, yielding 5 sets of performance measures. We used 4 standard metrics to quantify the performance of the postdiagnosis DKA classifier: area under the receiver operating characteristic curve (AUC), weighted <italic>F</italic><sub>1</sub>-score, weighted precision, and weighted recall. We reported the mean and SD of these 4 scores across the 5 folds, to characterize the predictive performance of the ensemble model.</p>
        <p>Key hyper-parameters for XGBoost (number of trees and tree depth) were selected using the standard hyperparameter tuning process described in section 5.3 of <italic>Deep Learning</italic> by Goodfellow et al [<xref ref-type="bibr" rid="ref35">35</xref>]. We held out 10% of the training data in each cross-validation fold as a validation set—this data does not participate in model construction.</p>
        <p>One of the challenges in model training is handling class imbalance (324 positive examples in a set of 1787 patients, in our case). This is an inherent consequence of postdiagnosis DKA being relatively uncommon. XGBoost handles imbalanced data sets by using the parameter scale_pos_weight, to reflect the degree of imbalance. This parameter weights the components of the cross-entropy loss function used by the training algorithm, assigning a higher weight to the minority class examples, in effect, simulating the process of up-sampling the minority class [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      </sec>
      <sec>
        <title>Explaining Classifier Performance: Bee-Swarm and Main-Effects Plots</title>
        <p>We used the Shapley value [<xref ref-type="bibr" rid="ref37">37</xref>] framework to assign predictive importance to each feature. The Shapley value, or SHAP (Shapley additive explanations) value, of a feature for a patient, is a quantification of the contribution made by that feature to the DKA or no-DKA prediction made for that patient. The unit of measurement for SHAP values is the change in logarithmic odds of postdiagnosis DKA with and without the feature. Positive SHAP values mean a positive impact on prediction, that is, they lead the model to predict postdiagnosis DKA. Negative SHAP values mean a negative impact on prediction, that is, they lead the model to predict no DKA after diagnosis. Unlike regular feature importance plots, SHAP values show the directionality of the impact of the feature value on the outcome. We use plots of averaged SHAP values over the whole cohort for each feature, called a bee-swarm plot, to rank key factors that determine the risk of postdiagnosis DKA at the level of the entire cohort.</p>
        <p>Main-effects plots show variation in the log-odds of postdiagnosis DKA as functions of a single predictor, all else being equal. A sharp change in log-odds in the main-effects plot of a feature reveals important thresholds at which postdiagnosis DKA risk increases or decreases. For example, these plots help answer questions such as: does the risk of postdiagnosis DKA increase linearly with diabetes age, or is there an age interval where the risk rises significantly? For an individual patient, SHAP values allow for the selection of features relevant to the prediction outcome and explain the outcome as an additive combination of SHAP values. We produce main-effects plots for key cohort-level risk factors identified in the bee-swarm plot.</p>
      </sec>
      <sec>
        <title>Cohort Risk Stratification by Clustering Shapley Values</title>
        <p>Cohort risk stratification is a byproduct of the Shapley value analysis. We clustered the Shapley value matrix constructed from the output of the XGBoost model using a hierarchical agglomerative clustering algorithm, based on Ward linkage [<xref ref-type="bibr" rid="ref38">38</xref>]. The algorithm groups patients according to similarities in their Shapley value vectors, producing a dendrogram. Any horizontal cut of the dendrogram induces a clustering of the original data. We select a cut level to maximize the dissimilarity between clusters.</p>
      </sec>
      <sec>
        <title>Personalized Risk Assessment</title>
        <p>In addition to cohort-level predictions, the model is equally useful for generating interpretable predictions for individual patients. The model produces an additive risk score, which is the sum of the Shapley values for each predictive feature for that patient. When the sum is positive, it indicates higher than baseline risk for that patient; if it is negative, then the patient is at lower risk relative to the whole cohort.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>Data were gathered under institutional review board (number H-42624), which was approved by the institutional review board of Baylor College of Medicine. The institutional review board covers secondary analysis utilizing this data without additional consent. Data were deidentified prior to analysis.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Descriptive Analysis of Data</title>
        <p>We summarize the value distributions of key predictors in <xref ref-type="table" rid="table1">Table 1</xref>. Surprisingly, DKA at the onset which has been shown to be associated historically with worsening glycemic control over time [<xref ref-type="bibr" rid="ref13">13</xref>], does not have a strong correlation with postdiagnosis DKA. The median diabetes age at the first DKA after diagnosis is 2.43 (IQR 1.26-4.09) years. It validates the selection of time-series of HbA<sub>1c</sub> measurements from baseline to the first 24 months after diagnosis, as the basis for postdiagnosis DKA prediction.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Value distributions of key demographics and laboratory test values for the entire cohort of 1787 patients with type 1 diabetes treated at Texas Children’s Hospital between January 1, 2010, and June 30, 2018.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="620"/>
            <col width="350"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Feature</td>
                <td>Variables</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Sex (female), n (%)</td>
                <td>891 (49.86)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Race, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>African American</td>
                <td>299 (16.73)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asian</td>
                <td>65 (3.64)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>White</td>
                <td>1364 (76.33)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td>59 (3.30)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Ethnicity, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Non-Hispanic</td>
                <td>1301 (72.80)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hispanic</td>
                <td>442 (24.73)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td>44 (2.46)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Insurance, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Private</td>
                <td>1146 (64.13)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Medicaid</td>
                <td>641 (35.87)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Antibody titer, median (IQR)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Glutamic acid decarboxylase 65-kilodalton isoform</td>
                <td>13.0 (3.85-30.00)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Islet cell autoantigen 512</td>
                <td>6.80 (1.2-20.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Insulin antibody</td>
                <td>0.4 (0.4-3.50)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>HbA<sub>1c</sub><sup>a</sup>, median (IQR)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HbA<sub>1c</sub> baseline at diagnosis (n=1787)</td>
                <td>11.1 (9.5-12.90)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HbA<sub>1c</sub> at 3 months (n=1768)</td>
                <td>7.51 (6.76-8.48)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HbA<sub>1c</sub> at 6 months (n=1712)</td>
                <td>7.34 (6.52-8.37)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HbA<sub>1c</sub> at 9 months (n=1651)</td>
                <td>7.71 (6.87-8.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HbA<sub>1c</sub> at 12 months (n=1553)</td>
                <td>7.85 (7.08-8.84)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HbA<sub>1c</sub> at 15 months (n=1471)</td>
                <td>7.95 (7.20-8.91)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HbA<sub>1c</sub> at 18 months (n=1401)</td>
                <td>8.07 (7.30-9.07)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HbA<sub>1c</sub> at 21 months (n=1320)</td>
                <td>8.13 (7.31-9.10)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HbA<sub>1c</sub> at 24 months (n=1239)</td>
                <td>8.15 (7.33-9.20)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">C-peptide, median (IQR)</td>
                <td>0.43 (0.26-0.725)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Duration of T1D<sup>b</sup> (in years; diabetes age), median (IQR)</td>
                <td>4.10 (1.80-6.47)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Age at T1D diagnosis (in years; onset age), median (IQR)</td>
                <td>10.40 (6.73-13.43)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">DKA<sup>c</sup> at onset, n (%)</td>
                <td>623 (34.86)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Diabetes age at first DKA postdiagnosis (years postdiagnosis), median (IQR)</td>
                <td>2.43 (1.26-4.09)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Patients with at least 1 postdiagnosis DKA, n (%)</td>
                <td>324 (18.13)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>HbA<sub>1c</sub>: glycated hemoglobin.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>T1D: type 1 diabetes.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>DKA: diabetic ketoacidosis.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Model Evaluation by Cross-Validation With AUC, Precision, and Recall</title>
        <p>The box plot in <xref rid="figure1" ref-type="fig">Figure 1</xref>A shows the clear separation in probability between the no DKA and DKA postdiagnosis cohort (P value &lt;.001). The model is able to distinguish between the postdiagnosis DKA cohort and the non-DKA cohort at a statistically significant level. The cross-validated model with all 9 HbA<sub>1c</sub> measurements from baseline to 24 months has an AUC of 0.80 (SD 0.04) and a weighted <italic>F</italic><sub>1</sub>-score of 0.78 (SD 0.04). The weighted precision and recall of the model are 0.83 (SD 0.02) and 0.76 (SD 0.07) respectively. Cross-validation allows robust estimation of the predictive performance of the model on new patients. Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> shows the incremental effect of the addition of HbA<sub>1c</sub> values from 3 to 24 months on these performance measures. Model performance stops improving after the addition of HbA<sub>1c</sub> at 18 months after onset.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>(A) Probability of postdiagnosis DKA at the cohort level, (B,C) risk by individual key features of diabetes age and HbA<sub>1c</sub> at 12 months, and (D) risk stratification into group. The cohort that will develop DKA can be distinguished from the one that will not, with a (A) <italic>P</italic> value &lt;.001. The main-effects plots show critical thresholds where risk sharply rises (gray regions), (B) for diabetes age between 2.2 and 4.3 years, and (C) for HbA<sub>1c</sub> at 12 months between 8 and 10.3. (D) The scatterplot uses a diabetes age cutoff of 2.2 years and HbA<sub>1c</sub> at 12 months of 9.2 to stratify the population into 3 risk groups for postdiagnosis DKA. A total of 30% of the population has 5% or low risk for DKA, shown in light gray; 50% of the population is at 20% or moderate risk (in medium gray), and 20% is at 48% or high risk of postdiagnosis DKA. DKA: diabetic ketoacidosis; HbA<sub>1c</sub>: glycated hemoglobin.</p>
          </caption>
          <graphic xlink:href="diabetes_v9i1e53338_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Key Predictors of Postdiagnosis DKA</title>
        <p><xref rid="figure2" ref-type="fig">Figure 2</xref> shows a bee-swarm plot summarizing the entire distribution of SHAP values for each predictor. The x-axis of the plot shows the impact on model output (log-odds of postdiagnosis DKA risk) of each of the predictors sorted along the y-axis by decreasing importance. The most important feature that predicts postdiagnosis DKA is diabetes age (top row). Every point in the top row denotes a patient’s diabetes age and the impact of the value of diabetes age on their log-odds of postdiagnosis DKA risk. Patients with low diabetes age (newly diagnosed, and colored blue) have negative SHAP values and thus lower postdiagnosis DKA risk, while patients with higher diabetes age (colored red) have positive SHAP values and higher postdiagnosis DKA risk. As diabetes age increases, the log-odds of DKA risk goes from –1.25 to +0.7. While the plot shows the overall trend of increasing diabetes age contributing to increased risk of postdiagnosis DKA it does not elucidate the exact nature of that trend. HbA<sub>1c</sub> value at 12 months is the second most important feature, and the plot shows a trend of increasing postdiagnosis DKA risk with an increase in HbA<sub>1c</sub> values. For the third most important feature, C-peptide at diagnosis, the plot shows that higher values at diagnosis are associated with lower postdiagnosis DKA risk. Higher HbA<sub>1c</sub> levels at 9, 18, and 24 months are all associated with higher postdiagnosis risk. Higher onset age, ranked seventh in the ordering, is associated with lower postdiagnosis DKA risk. Not only has the model identified and ranked key predictors, but it also provides a quantitative measure of the impact of each of these features on the probability of postdiagnosis DKA risk.</p>
        <p><xref rid="figure1" ref-type="fig">Figures 1</xref>B and 1C show the main effects of 2 of the top predictors in the model: diabetes age and HbA<sub>1c</sub> at 12 months. The log-odds of postdiagnosis DKA risk do not vary linearly with diabetes age. Rather, there is a threshold effect, with a rapid increase in log-odds of risk from –0.95 to +0.35 units between diabetes ages of 2.2 and 4.3 years. HbA<sub>1c</sub> levels at 12 months reveal a similar threshold effect: levels below 8 are at relatively low risk of postdiagnosis DKA, with the risk rising steeply from –0.15 to +0.26 units for patients with HbA<sub>1c</sub> levels between 8 and 10.3. Beyond the value of 10.3, the risk contribution of the 12-month-HbA<sub>1c</sub> level plateaus at a log-odds of 0.26. Taken together, as shown in the shaded regions of the plots, the model predicts that at the cohort level, diabetes age between 2.2 and 4.3 years, and HbA<sub>1c</sub> levels at 12 months between 8 and 10.3 offer the best intervention points to influence postdiagnosis DKA risk.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Model features displayed in order of decreasing importance for postdiagnosis DKA risk prediction. Each feature in this bee-swarm plot is shown with its full range of values—from a minimum in blue, to a maximum in red; see the color scale on right for values in between. The x-axis defines the log-odds of postdiagnosis DKA risk (SHAP value). Each colored dot in a horizontal line represents the value of the corresponding feature for a patient in the training cohort. The most important predictors are diabetes age, HbA<sub>1c</sub> at 12 months, and C-peptide titer at diagnosis. DKA: diabetic ketoacidosis; GAD65: glutamic acid decarboxylase 65-kilodalton isoform; HbA<sub>1c</sub>: glycated hemoglobin; SHAP: Shapley additive explanations.</p>
          </caption>
          <graphic xlink:href="diabetes_v9i1e53338_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Cohort Risk Stratification by Clustering Shapley Values</title>
        <p>The agglomerative clustering analysis reveals 3 well-separated groups characterized by postdiagnosis DKA rates of 5%, 20%, and 48% respectively. Note that the clustering algorithm does not have access to the features or the labels (DKA or non-DKA) for each patient, but only the Shapley value of each feature for that patient. By using a decision tree algorithm to predict cluster membership, we identified the primary criteria to be a diabetes age cutoff of 2.2 years and an HbA<sub>1c</sub> at a 12-month cutoff of 9.2. <xref rid="figure1" ref-type="fig">Figure 1</xref>D visually displays these clusters across the dimensions of diabetes age and HbA<sub>1c</sub> at 12 months. Cluster 1, which is the low-risk group (5% probability of postdiagnosis DKA) consists of patients whose diabetes age is less than 2.2 years. Cluster 2, the medium risk group (20% probability of postdiagnosis DKA) is composed of patients with diabetes age of 2.2 years and older and HbA<sub>1c</sub> at 12 months &lt;9.2. Cluster 3, the high-risk group (48% probability of postdiagnosis DKA) consists of patients with diabetes age of 2.2 years and older and HbA<sub>1c</sub> at 12 months&gt;9.2. Patients at low risk constitute 30% of the population, those at medium risk constitute 50% of the population, and the high-risk group constitutes 20% of the population.</p>
      </sec>
      <sec>
        <title>Personalized Risk Assessment</title>
        <p><xref rid="figure3" ref-type="fig">Figure 3</xref> shows the individualized risk predictions for a patient at high risk for postdiagnosis DKA (<xref rid="figure3" ref-type="fig">Figure 3</xref>A) and low risk for postdiagnosis DKA (<xref rid="figure3" ref-type="fig">Figure 3</xref>B). For the patient in <xref rid="figure3" ref-type="fig">Figure 3</xref>A, the model shows the features contributing to high risk: worsening HbA<sub>1c</sub> values from 9 to 21 months post diagnosis (9.8 → 10.1 → 10.6 →10.8), and high diabetes age of 8.39 years. For the patient in <xref rid="figure3" ref-type="fig">Figure 3</xref>B, the model identifies a low diabetes age of 1.44 years as the primary reason for low DKA risk. HbA<sub>1c</sub> levels for this patient start at 6.7 at 9 months postdiagnosis and remain at 6.72 at the 12-month mark.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Risk models for 2 individual patients (A) at high risk and (B) at low risk of postdiagnosis DKA shown as waterfall plots. The baseline risk of –0.672 marked with a black vertical line represents the overall risk of postdiagnosis DKA at the cohort level. Factors in red are associated with higher DKA risk, and those in blue are associated with lower risk. The personalized risk score represents an individual’s unique risk profile. DKA: diabetic ketoacidosis; GAD65: glutamic acid decarboxylase 65-kilodalton isoform; HbA<sub>1c</sub>: glycated hemoglobin.</p>
          </caption>
          <graphic xlink:href="diabetes_v9i1e53338_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Approximately 18% of patients with T1D experience DKA after onset and yet there are few tools available to assist clinicians in assessing postdiagnosis DKA risk, either at the cohort level or at an individual level [<xref ref-type="bibr" rid="ref39">39</xref>]. Our gradient-boosted ensemble of decision trees trained on a diverse cohort of 1787 patients with T1D has demonstrated the ability to predict DKA after onset with high accuracy, revealing insights into the features most predictive of high risk, and offering explainable risk scores at the level of an individual patient.</p>
        <p>With an AUC of 0.80 (SD 0.04), a weighted <italic>F</italic><sub>1</sub>-score of 0.78 (SD 0.04), and weighted precision and recall of 0.83 (SD 0.03) and 0.76 (SD 0.05) respectively, the model delivers performance similar to Food and Drug Administration–approved predictive computational tools for detecting cervical and breast cancer [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. Using Shapley value analysis, the model identified diabetes age and HbA<sub>1c</sub> at 12 months as the top 2 drivers of postdiagnosis DKA (<xref rid="figure1" ref-type="fig">Figure 1</xref>). Even more interesting, is the data-driven discovery of a “critical period” between 2.2 and 4.3 years of disease and an HbA<sub>1c</sub> at 12 months between 8 and 10.3 that poses the greatest risk for postdiagnosis DKA, as revealed by the main-effects Shapley value plots. During this period, a sharp nonlinear rise in DKA risk (<xref rid="figure1" ref-type="fig">Figures 1</xref>B and 1C) suggests that the optimal window for preventive intervention may exist years prior to the adverse event. By clustering Shapley values using a hierarchical agglomerative clustering technique, we can cleanly stratify the population into 3 major risk classes: 30% in the low-risk group (5% risk of postdiagnosis DKA), 50% in the medium-risk group (20% risk of postdiagnosis DKA) and 20% in the high-risk group (48% risk of postdiagnosis DKA). Consistent with the high AUC scores, the model displayed clear separation between patients with T1D with no DKA postdiagnosis, and those with DKA postdiagnosis (P&lt;.001; <xref rid="figure1" ref-type="fig">Figure 1</xref>A), holding promise for accurate identification of at-risk patients, with personalized risk scores highlighting individual patient-level factors that drive postdiagnosis DKA risk (<xref rid="figure3" ref-type="fig">Figure 3</xref>).</p>
        <p>Our model, made interpretable by Shapley value analysis, provides insights into the key determiners of risk for postdiagnosis DKA, and elucidates the nonlinear relationships between key predictors and postdiagnosis DKA risk. Using the Shapley value framework, the model assesses risks at both the cohort and at the individual level, guiding the choice of therapeutic interventions.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>Data-driven approaches to building predictive risk models are becoming important in clinical applications as prescriptive analytics and targeted personalized therapy become more readily available [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. Recent models [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>] for predicting patients at high risk for DKA have used logistic regression analyses to identify the top 3 features indicative of postdiagnosis DKA in pediatric T1D: most recent HbA<sub>1c</sub>, type of health insurance, and prior occurrence of DKA in the past 2 years. These models were qualitatively evaluated in a retrospective setting.</p>
        <p>Our unique contribution is the design of an explainable predictive model for postdiagnosis DKA using one of the largest pediatric T1D cohorts studied in the literature. Our model’s predictive performance surpasses the state of the art on this problem (Williams et al [<xref ref-type="bibr" rid="ref31">31</xref>]) on a similar patient cohort. It does so using variables collected on a patient with pediatric T1D during diagnosis, and routine clinic follow-ups for up to 24 months, and not measurements gathered from DKA hospitalization visits (which are fully correlated with our outcome variable). In addition, through our choice of model and statistical analysis using the Shapley value framework, we identify key risk factors predictive of postdiagnosis DKA at the population level and the individual level. We are able to reveal sharp changes in postdiagnosis DKA risk over time, identifying intervals for possible intervention. Finally, we perform risk stratification by automatically deriving risk clusters from Shapley values.</p>
        <p>The ensemble model developed here has robust quantitative performance measures. It captures the heterogeneity inherent in the T1D population by building a set of weighted models, rather than a single linear model. Further, it can be operationalized as a predictive tool within existing EHR frameworks, allowing for better clinical management of pediatric T1D with enhanced resource allocation where specialized diabetes care is scarce [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>].</p>
        <p>Our model is derived from data spanning a decade in a large and diverse cohort of patients with pediatric T1D at a major tertiary-care children’s hospital. Data readily available in the EHR was included in the data input to the model. The model lets the data drive the selection of key predictors, thus eliminating human bias. The gradient-boosted ensemble method is key to predictive performance since (1) the relationships between predictors and the outcome variable are highly nonlinear (<xref rid="figure1" ref-type="fig">Figures 1</xref>B and 1C), precluding the use of simpler models such as logistic regression, and (2) there is significant variation among patients in the cohort, precluding the use of a one-size-fits-all model [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. To our knowledge, this is the first deployment of such a model to predict DKA occurrence in a pediatric context. However, successful deployment of the model in a decision support context requires careful integration into clinical workflow.</p>
      </sec>
      <sec>
        <title>Limitations and Strengths</title>
        <p>This study is a single-center, retrospective study with data limited to what was currently available in the EHR. We acknowledge that the EHR does not capture every patient characteristic that impacts clinical outcomes. Including data collected outside of the traditional health care environment, that is, remote patient monitoring data, and social determinants of health, can improve the predictive performance of our model.</p>
        <p>We further acknowledge that DKA occurrences postdiagnosis are not always deterministically predictable, particularly in cases involving infection, illness, and instances of inadequate parental supervision.</p>
        <p>In our study, the postdiagnosis DKA outcome in a patient with T1D is determined by hospitalization for DKA; this is a commonly used criterion in prior work on pediatric T1D [<xref ref-type="bibr" rid="ref31">31</xref>]. However, it is possible that patients with mild cases of postdiagnosis DKA who did not require hospitalization, or were treated at a different facility are not accounted for in our outcome definition.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We have built an explainable, predictive, machine learning model with potential for integration into clinical workflow. The model risk-stratifies patients with pediatric T1D and identifies patients at the highest postdiagnosis DKA risk using limited follow-up data starting from the time of diagnosis. The model identifies key time points and risk factors to direct clinical interventions at both the individual and cohort levels. The clinical import of our work is that the model can predict patients most at risk for postdiagnosis DKA and identify preventive interventions based on mitigation of individualized risk factors.</p>
        <p>Future work includes further developing the model with data from multiple hospital systems, testing its generalizability across cohorts from other institutions, and prospectively studying whether it can assist clinicians target interventions to improve outcomes.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary figures and tables.</p>
        <media xlink:href="diabetes_v9i1e53338_app1.docx" xlink:title="DOCX File , 162 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC</term>
          <def>
            <p>area under the receiver- operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">DKA</term>
          <def>
            <p>diabetic ketoacidosis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">GAD65</term>
          <def>
            <p>glutamic acid decarboxylase 65-kilodalton isoform</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">HbA<sub>1c</sub></term>
          <def>
            <p>glycated hemoglobin</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">ICA512</term>
          <def>
            <p>islet cell autoantigen 512</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">SHAP</term>
          <def>
            <p>Shapley additive explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">T1D</term>
          <def>
            <p>type 1 diabetes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">TCH</term>
          <def>
            <p>Texas Children’s Hospital</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors thank Mark Rittenhouse and Ashok Kurian for help with data extraction, the Diabetes Care Process Team for discussions, and Karen Prince for help with figures.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>DS, RS, and IS participated in the conceptual design of the study, analysis, and interpretation of the data. DS and IS drafted the manuscript, and all authors reviewed and edited the manuscript and approved the final version.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vellanki</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Umpierrez</surname>
              <given-names>GE</given-names>
            </name>
          </person-group>
          <article-title>Increasing hospitalizations for DKA: a need for prevention programs</article-title>
          <source>Diabetes Care</source>
          <year>2018</year>
          <volume>41</volume>
          <issue>9</issue>
          <fpage>1839</fpage>
          <lpage>1841</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30135197"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/dci18-0004</pub-id>
          <pub-id pub-id-type="medline">30135197</pub-id>
          <pub-id pub-id-type="pii">41/9/1839</pub-id>
          <pub-id pub-id-type="pmcid">PMC6105328</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shilo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zuckerman-Levin</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Shehadeh</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Nunes</surname>
              <given-names>KP</given-names>
            </name>
          </person-group>
          <article-title>Diabetic ketoacidosis in the pediatric population with type 1 diabetes</article-title>
          <source>Major Topics in Type 1 Diabetes</source>
          <year>2015</year>
          <publisher-loc>NA</publisher-loc>
          <publisher-name>InTechOpen</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Garibaldi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Becker</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Is the risk of diabetic ketoacidosis modifiable?</article-title>
          <source>J Pediatr</source>
          <year>2016</year>
          <volume>171</volume>
          <fpage>10</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jpeds.2016.01.057</pub-id>
          <pub-id pub-id-type="medline">26879811</pub-id>
          <pub-id pub-id-type="pii">S0022-3476(16)00134-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wolfsdorf</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Glaser</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Sperling</surname>
              <given-names>MA</given-names>
            </name>
            <collab>American Diabetes Association</collab>
          </person-group>
          <article-title>Diabetic ketoacidosis in infants, children, and adolescents: a consensus statement from the American Diabetes Association</article-title>
          <source>Diabetes Care</source>
          <year>2006</year>
          <volume>29</volume>
          <issue>5</issue>
          <fpage>1150</fpage>
          <lpage>1159</lpage>
          <pub-id pub-id-type="doi">10.2337/diacare.2951150</pub-id>
          <pub-id pub-id-type="medline">16644656</pub-id>
          <pub-id pub-id-type="pii">29/5/1150</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Firth</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bennett</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Howard</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chisholm</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Ketoacidosis occurring in newly diagnosed and established diabetic children</article-title>
          <source>Acta Paediatr</source>
          <year>1998</year>
          <volume>87</volume>
          <issue>5</issue>
          <fpage>537</fpage>
          <lpage>541</lpage>
          <pub-id pub-id-type="doi">10.1080/08035259850158245</pub-id>
          <pub-id pub-id-type="medline">9641735</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cengiz</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Xing</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Wolfsdorf</surname>
              <given-names>JI</given-names>
            </name>
            <name name-style="western">
              <surname>Haymond</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Rewers</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shanmugham</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tamborlane</surname>
              <given-names>WV</given-names>
            </name>
            <name name-style="western">
              <surname>Willi</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Seiple</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>DuBose</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Beck</surname>
              <given-names>RW</given-names>
            </name>
            <collab>T1D Exchange Clinic Network</collab>
          </person-group>
          <article-title>Severe hypoglycemia and diabetic ketoacidosis among youth with type 1 diabetes in the T1D exchange clinic registry</article-title>
          <source>Pediatr Diabetes</source>
          <year>2013</year>
          <volume>14</volume>
          <issue>6</issue>
          <fpage>447</fpage>
          <lpage>454</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23469984"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/pedi.12030</pub-id>
          <pub-id pub-id-type="medline">23469984</pub-id>
          <pub-id pub-id-type="pmcid">PMC4100244</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mathias</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Menon</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Schubart</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>Health care utilization and burden of diabetic ketoacidosis in the U.S. over the past decade: a nationwide analysis</article-title>
          <source>Diabetes Care</source>
          <year>2018</year>
          <volume>41</volume>
          <issue>8</issue>
          <fpage>1631</fpage>
          <lpage>1638</lpage>
          <pub-id pub-id-type="doi">10.2337/dc17-1379</pub-id>
          <pub-id pub-id-type="medline">29773640</pub-id>
          <pub-id pub-id-type="pii">dc17-1379</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benoit</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Geiss</surname>
              <given-names>LS</given-names>
            </name>
            <name name-style="western">
              <surname>Gregg</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Albright</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Trends in diabetic ketoacidosis hospitalizations and in-hospital mortality—United States, 2000-2014</article-title>
          <source>MMWR Morb Mortal Wkly Rep</source>
          <year>2018</year>
          <volume>67</volume>
          <issue>12</issue>
          <fpage>362</fpage>
          <lpage>365</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.15585/mmwr.mm6712a3"/>
          </comment>
          <pub-id pub-id-type="doi">10.15585/mmwr.mm6712a3</pub-id>
          <pub-id pub-id-type="medline">29596400</pub-id>
          <pub-id pub-id-type="pmcid">PMC5877353</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rewers</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chase</surname>
              <given-names>HP</given-names>
            </name>
            <name name-style="western">
              <surname>Mackenzie</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Walravens</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Roback</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rewers</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hamman</surname>
              <given-names>RF</given-names>
            </name>
            <name name-style="western">
              <surname>Klingensmith</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Predictors of acute complications in children with type 1 diabetes</article-title>
          <source>JAMA</source>
          <year>2002</year>
          <volume>287</volume>
          <issue>19</issue>
          <fpage>2511</fpage>
          <lpage>2518</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.287.19.2511</pub-id>
          <pub-id pub-id-type="medline">12020331</pub-id>
          <pub-id pub-id-type="pii">joc12060</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Umpierrez</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Korytkowski</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Diabetic emergencies–ketoacidosis, hyperglycaemic hyperosmolar state and hypoglycaemia</article-title>
          <source>Nat Rev Endocrinol</source>
          <year>2016</year>
          <volume>12</volume>
          <issue>4</issue>
          <fpage>222</fpage>
          <lpage>232</lpage>
          <pub-id pub-id-type="doi">10.1038/nrendo.2016.15</pub-id>
          <pub-id pub-id-type="medline">26893262</pub-id>
          <pub-id pub-id-type="pii">nrendo.2016.15</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Semenkovich</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Berlin</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Ankney</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Klages</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Keenan</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Rybak</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Banks</surname>
              <given-names>GG</given-names>
            </name>
            <name name-style="western">
              <surname>Alemzadeh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Eddington</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Predictors of diabetic ketoacidosis hospitalizations and hemoglobin A1c among youth with type 1 diabetes</article-title>
          <source>Health Psychol</source>
          <year>2019</year>
          <volume>38</volume>
          <issue>7</issue>
          <fpage>577</fpage>
          <lpage>585</lpage>
          <pub-id pub-id-type="doi">10.1037/hea0000719</pub-id>
          <pub-id pub-id-type="medline">30973748</pub-id>
          <pub-id pub-id-type="pii">2019-19147-001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vicinanza</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Messaaoui</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tenoutasse</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dorchy</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Diabetic ketoacidosis in children newly diagnosed with type 1 diabetes mellitus: role of demographic, clinical, and biochemical features along with genetic and immunological markers as risk factors. a 20-year experience in a tertiary Belgian center</article-title>
          <source>Pediatr Diabetes</source>
          <year>2019</year>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>584</fpage>
          <lpage>593</lpage>
          <pub-id pub-id-type="doi">10.1111/pedi.12864</pub-id>
          <pub-id pub-id-type="medline">31038262</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Duca</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Reboussin</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Pihoker</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Imperatore</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Saydah</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer-Davis</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rewers</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dabelea</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Diabetic ketoacidosis at diagnosis of type 1 diabetes and glycemic control over time: the search for diabetes in youth study</article-title>
          <source>Pediatr Diabetes</source>
          <year>2019</year>
          <volume>20</volume>
          <issue>2</issue>
          <fpage>172</fpage>
          <lpage>179</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30556249"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/pedi.12809</pub-id>
          <pub-id pub-id-type="medline">30556249</pub-id>
          <pub-id pub-id-type="pmcid">PMC6361710</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mazarello Paes</surname>
              <given-names>Veena</given-names>
            </name>
            <name name-style="western">
              <surname>Barrett</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Dunger</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Gevers</surname>
              <given-names>EF</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor-Robinson</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Viner</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Stephenson</surname>
              <given-names>TJ</given-names>
            </name>
          </person-group>
          <article-title>Factors predicting poor glycemic control in the first two years of childhood onset type 1 diabetes in a cohort from East London, UK: analyses using mixed effects fractional polynomial models</article-title>
          <source>Pediatr Diabetes</source>
          <year>2020</year>
          <volume>21</volume>
          <issue>2</issue>
          <fpage>288</fpage>
          <lpage>299</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31782879"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/pedi.12950</pub-id>
          <pub-id pub-id-type="medline">31782879</pub-id>
          <pub-id pub-id-type="pmcid">PMC7028081</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aeppli</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Mahler</surname>
              <given-names>FL</given-names>
            </name>
            <name name-style="western">
              <surname>Konrad</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Future glycemic control of children diagnosed with type 1 diabetes mellitus at toddler and preschool/school age</article-title>
          <source>J Pediatr Endocrinol Metab</source>
          <year>2019</year>
          <month>09</month>
          <day>25</day>
          <volume>32</volume>
          <issue>9</issue>
          <fpage>929</fpage>
          <lpage>933</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.5167/uzh-178435"/>
          </comment>
          <pub-id pub-id-type="doi">10.1515/jpem-2019-0152</pub-id>
          <pub-id pub-id-type="medline">31323008</pub-id>
          <pub-id pub-id-type="pii">/j/jpem.ahead-of-print/jpem-2019-0152/jpem-2019-0152.xml</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Incidence and associates of diabetic ketoacidosis in a community-based cohort: the fremantle diabetes study phase II</article-title>
          <source>BMJ Open Diabetes Res Care</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>e000983</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://drc.bmj.com/lookup/pmidlookup?view=long&amp;pmid=32139599"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjdrc-2019-000983</pub-id>
          <pub-id pub-id-type="medline">32139599</pub-id>
          <pub-id pub-id-type="pii">8/1/e000983</pub-id>
          <pub-id pub-id-type="pmcid">PMC7059509</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rahme</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Simard</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Larocque</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Nakhla</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Increasing prevalence of diabetic ketoacidosis at diabetes diagnosis among children in Quebec: a population-based retrospective cohort study</article-title>
          <source>CMAJ Open</source>
          <year>2019</year>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>E300</fpage>
          <lpage>E305</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://cmajopen.ca/cgi/pmidlookup?view=long&amp;pmid=31088804"/>
          </comment>
          <pub-id pub-id-type="doi">10.9778/cmajo.20190047</pub-id>
          <pub-id pub-id-type="medline">31088804</pub-id>
          <pub-id pub-id-type="pii">7/2/E300</pub-id>
          <pub-id pub-id-type="pmcid">PMC6517121</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ampt</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>van Gemert</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Craig</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Donaghue</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Lain</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Nassar</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Using population data to understand the epidemiology and risk factors for diabetic ketoacidosis in Australian children with type 1 diabetes</article-title>
          <source>Pediatr Diabetes</source>
          <year>2019</year>
          <volume>20</volume>
          <issue>7</issue>
          <fpage>901</fpage>
          <lpage>908</lpage>
          <pub-id pub-id-type="doi">10.1111/pedi.12891</pub-id>
          <pub-id pub-id-type="medline">31291024</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Malik</surname>
              <given-names>FS</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mangione-Smith</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Keren</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mahant</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Srivastava</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Tieder</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Patient characteristics associated with differences in admission frequency for diabetic ketoacidosis in United States children's hospitals</article-title>
          <source>J Pediatr</source>
          <year>2016</year>
          <volume>171</volume>
          <fpage>104</fpage>
          <lpage>110</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jpeds.2015.12.015</pub-id>
          <pub-id pub-id-type="medline">26787380</pub-id>
          <pub-id pub-id-type="pii">S0022-3476(15)01525-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mejia-Otero</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Adhikari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>PC</given-names>
            </name>
          </person-group>
          <article-title>Risk factors for hospitalization in youth with type 1 diabetes: development and validation of a multivariable prediction model</article-title>
          <source>Pediatr Diabetes</source>
          <year>2020</year>
          <volume>21</volume>
          <issue>7</issue>
          <fpage>1268</fpage>
          <lpage>1276</lpage>
          <pub-id pub-id-type="doi">10.1111/pedi.13090</pub-id>
          <pub-id pub-id-type="medline">32737942</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Redondo</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Libman</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kollman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tosur</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gal</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Bacha</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Klingensmith</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Clements</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Racial/ethnic minority youth with recent-onset type 1 diabetes have poor prognostic factors</article-title>
          <source>Diabetes Care</source>
          <year>2018</year>
          <volume>41</volume>
          <issue>5</issue>
          <fpage>1017</fpage>
          <lpage>1024</lpage>
          <pub-id pub-id-type="doi">10.2337/dc17-2335</pub-id>
          <pub-id pub-id-type="medline">29496742</pub-id>
          <pub-id pub-id-type="pii">dc17-2335</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Vakharia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Uysal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hendrix</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Fegan-Bohm</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lyons</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sonabend</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gunn</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Banuelos</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dei-Tutu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A comprehensive system for identifying patients with type 1 diabetes at increased risk for diabetic ketoacidosis at Texas Children's Hospital</article-title>
          <source>Clin Diabetes</source>
          <year>2022</year>
          <volume>40</volume>
          <issue>1</issue>
          <fpage>92</fpage>
          <lpage>96</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35221478"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/cd21-0072</pub-id>
          <pub-id pub-id-type="medline">35221478</pub-id>
          <pub-id pub-id-type="pii">cd210072.40.1</pub-id>
          <pub-id pub-id-type="pmcid">PMC8865789</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Banuelos</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Uysal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vakharia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hendrix</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fegan-Bohm</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lyons</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Sonabend</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gunn</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Dei-Tutu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>An automated risk index for diabetic ketoacidosis in pediatric patients with type 1 diabetes: the RI-DKA</article-title>
          <source>Clin Diabetes</source>
          <year>2022</year>
          <volume>40</volume>
          <issue>2</issue>
          <fpage>204</fpage>
          <lpage>210</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35669298"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/cd21-0070</pub-id>
          <pub-id pub-id-type="medline">35669298</pub-id>
          <pub-id pub-id-type="pii">CD210070</pub-id>
          <pub-id pub-id-type="pmcid">PMC9160557</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smaldone</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Honig</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stone</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Arons</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Weinger</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Characteristics of California children with single versus multiple diabetic ketoacidosis hospitalizations (1998-2000)</article-title>
          <source>Diabetes Care</source>
          <year>2005</year>
          <volume>28</volume>
          <issue>8</issue>
          <fpage>2082</fpage>
          <lpage>2084</lpage>
          <pub-id pub-id-type="doi">10.2337/diacare.28.8.2082-a</pub-id>
          <pub-id pub-id-type="medline">16043767</pub-id>
          <pub-id pub-id-type="pii">28/8/2082-a</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ehrmann</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kulzer</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Roos</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Haak</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Khatib</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hermanns</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Risk factors and prevention strategies for diabetic ketoacidosis in people with established type 1 diabetes</article-title>
          <source>Lancet Diabetes Endocrinol</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>5</issue>
          <fpage>436</fpage>
          <lpage>446</lpage>
          <pub-id pub-id-type="doi">10.1016/S2213-8587(20)30042-5</pub-id>
          <pub-id pub-id-type="medline">32333879</pub-id>
          <pub-id pub-id-type="pii">S2213-8587(20)30042-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>LeCun</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hinton</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Deep learning</article-title>
          <source>Nature</source>
          <year>2015</year>
          <volume>521</volume>
          <issue>7553</issue>
          <fpage>436</fpage>
          <lpage>444</lpage>
          <pub-id pub-id-type="doi">10.1038/nature14539</pub-id>
          <pub-id pub-id-type="medline">26017442</pub-id>
          <pub-id pub-id-type="pii">nature14539</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hastie</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tibshirani</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Additive logistic regression: a statistical view of boosting (with discussion and a rejoinder by the authors)</article-title>
          <source>Ann Stat</source>
          <year>2000</year>
          <volume>28</volume>
          <issue>2</issue>
          <fpage>337</fpage>
          <lpage>407</lpage>
          <pub-id pub-id-type="doi">10.1214/aos/1016218223</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gulshan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Coram</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stumpe</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Narayanaswamy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Venugopalan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Widner</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Madams</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cuadros</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Raman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Mega</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>DR</given-names>
            </name>
          </person-group>
          <article-title>Development and validation of a deep learning algorithm for detection of diabetic retinopathy in retinal fundus photographs</article-title>
          <source>JAMA</source>
          <year>2016</year>
          <volume>316</volume>
          <issue>22</issue>
          <fpage>2402</fpage>
          <lpage>2410</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2016.17216</pub-id>
          <pub-id pub-id-type="medline">27898976</pub-id>
          <pub-id pub-id-type="pii">2588763</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Schuster</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>QV</given-names>
            </name>
            <name name-style="western">
              <surname>Norouzi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Macherey</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Krikun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Macherey</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Google's neural machine translation system: bridging the gap between human and machine translation</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on October 8, 2016</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1609.08144</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Summers</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Deep learning lends a hand to pediatric radiology</article-title>
          <source>Radiology</source>
          <year>2018</year>
          <volume>287</volume>
          <issue>1</issue>
          <fpage>323</fpage>
          <lpage>325</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29558310"/>
          </comment>
          <pub-id pub-id-type="doi">10.1148/radiol.2018172898</pub-id>
          <pub-id pub-id-type="medline">29558310</pub-id>
          <pub-id pub-id-type="pmcid">PMC5881636</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Ferro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mullaney</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Skrabonja</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Patton</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Lockee</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tallon</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Vandervelden</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Schweisberger</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McDonough</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lind</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>D'Avolio</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Clements</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>An "all-data-on-hand" deep learning model to predict hospitalization for diabetic ketoacidosis in youth with type 1 diabetes: development and validation study</article-title>
          <source>JMIR Diabetes</source>
          <year>2023</year>
          <volume>8</volume>
          <fpage>e47592</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://diabetes.jmir.org/2023//e47592/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/47592</pub-id>
          <pub-id pub-id-type="medline">37224506</pub-id>
          <pub-id pub-id-type="pii">v8i1e47592</pub-id>
          <pub-id pub-id-type="pmcid">PMC10394604</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>FL</given-names>
            </name>
            <name name-style="western">
              <surname>Molony</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Doder</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zalmover</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Juhaeri</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Performance assessment of different machine learning approaches in predicting diabetic ketoacidosis in adults with type 1 diabetes using electronic health records data</article-title>
          <source>Pharmacoepidemiol Drug Saf</source>
          <year>2021</year>
          <volume>30</volume>
          <issue>5</issue>
          <fpage>610</fpage>
          <lpage>618</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33480091"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/pds.5199</pub-id>
          <pub-id pub-id-type="medline">33480091</pub-id>
          <pub-id pub-id-type="pmcid">PMC8049019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Verkauskiene</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Danyte</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dobrovolskiene</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Stankute</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Simoniene</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Razanskaite-Virbickiene</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Seibokaite</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Urbonaite</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jurgeviciene</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Vitkauskiene</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schwitzgebel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Marciulionyte</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The course of diabetes in children, adolescents and young adults: does the autoimmunity status matter?</article-title>
          <source>BMC Endocr Disord</source>
          <year>2016</year>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>61</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcendocrdisord.biomedcentral.com/articles/10.1186/s12902-016-0145-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12902-016-0145-3</pub-id>
          <pub-id pub-id-type="medline">27842589</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12902-016-0145-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC5109672</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>XGBoost: a scalable tree boosting system</article-title>
          <year>2016</year>
          <conf-name>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>August 13-17, 2016</conf-date>
          <conf-loc>San Francisco, CA, United States</conf-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>785</fpage>
          <lpage>794</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goodfellow</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Courville</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>Deep Learning</source>
          <year>2016</year>
          <publisher-loc>Cambridge, MA</publisher-loc>
          <publisher-name>MIT Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>The influence of class imbalance on cost-sensitive learning: an empirical study</article-title>
          <year>2006</year>
          <conf-name>Sixth International Conference on Data Mining (ICDM'06)</conf-name>
          <conf-date>December 18-22, 2006</conf-date>
          <conf-loc>Hong Kong, China</conf-loc>
          <publisher-loc>Hong Kong, China</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>970</fpage>
          <lpage>974</lpage>
          <pub-id pub-id-type="doi">10.1109/ICDM.2006.158</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SI</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to interpreting model predictions</article-title>
          <year>2017</year>
          <conf-name>Proceedings of the 31st International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>2017</conf-date>
          <conf-loc>Red Hook, NY, United States</conf-loc>
          <fpage>4768</fpage>
          <lpage>4777</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Murtagh</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Contreras</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Algorithms for hierarchical clustering: an overview</article-title>
          <source>Wiley Interdiscip Rev: Data Min Knowl Discov</source>
          <year>2011</year>
          <month>12</month>
          <day>07</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>86</fpage>
          <lpage>97</lpage>
          <pub-id pub-id-type="doi">10.1002/widm.53</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kodama</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fujihara</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shiozaki</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Horikawa</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yamada</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sato</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yaguchi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yamamoto</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kitazawa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Iwanaga</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Matsubayashi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sone</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Ability of current machine learning algorithms to predict and detect hypoglycemia in patients with diabetes mellitus: meta-analysis</article-title>
          <source>JMIR Diabetes</source>
          <year>2021</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>e22458</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://diabetes.jmir.org/2021/1/e22458/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22458</pub-id>
          <pub-id pub-id-type="medline">33512324</pub-id>
          <pub-id pub-id-type="pii">v6i1e22458</pub-id>
          <pub-id pub-id-type="pmcid">PMC7880810</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Houssami</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lång</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bernardi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tagliafico</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zackrisson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Skaane</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Digital breast tomosynthesis (3d-mammography) screening: a pictorial review of screen-detected cancers and false recalls attributed to tomosynthesis in prospective screening trials</article-title>
          <source>Breast</source>
          <year>2016</year>
          <volume>26</volume>
          <fpage>119</fpage>
          <lpage>134</lpage>
          <pub-id pub-id-type="doi">10.1016/j.breast.2016.01.007</pub-id>
          <pub-id pub-id-type="medline">27017251</pub-id>
          <pub-id pub-id-type="pii">S0960-9776(16)00012-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wentzensen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lahrmann</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Kinney</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tokugawa</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Poitras</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Locke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bartels</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Krauthoff</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zuna</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Grewal</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Goldhoff</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Kingery</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Castle</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Schiffman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lorey</surname>
              <given-names>TS</given-names>
            </name>
            <name name-style="western">
              <surname>Grabe</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Accuracy and efficiency of deep-learning-based automation of dual stain cytology in cervical cancer screening</article-title>
          <source>J Natl Cancer Inst</source>
          <year>2021</year>
          <volume>113</volume>
          <issue>1</issue>
          <fpage>72</fpage>
          <lpage>79</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32584382"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jnci/djaa066</pub-id>
          <pub-id pub-id-type="medline">32584382</pub-id>
          <pub-id pub-id-type="pii">5862008</pub-id>
          <pub-id pub-id-type="pmcid">PMC7781458</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>An</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Au</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ang</surname>
              <given-names>TFA</given-names>
            </name>
          </person-group>
          <article-title>Deep ensemble learning for Alzheimer's disease classification</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <volume>105</volume>
          <fpage>103411</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(20)30039-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103411</pub-id>
          <pub-id pub-id-type="medline">32234546</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(20)30039-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC9760486</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Holt</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>YJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Onufrak</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Croft</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>Population-based geographic access to endocrinologists in the United States, 2012</article-title>
          <source>BMC Health Serv Res</source>
          <year>2015</year>
          <volume>15</volume>
          <fpage>541</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmchealthservres.biomedcentral.com/articles/10.1186/s12913-015-1185-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12913-015-1185-5</pub-id>
          <pub-id pub-id-type="medline">26644021</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12913-015-1185-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC4672571</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Aye</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Boney</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Eugster</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Misra</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Singer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Stafford</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Witchel</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Zeitler</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Sustaining the pediatric endocrinology workforce: recommendations from the pediatric endocrine society workforce task force</article-title>
          <source>J Pediatr</source>
          <year>2021</year>
          <volume>233</volume>
          <fpage>4</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jpeds.2020.10.063</pub-id>
          <pub-id pub-id-type="medline">33137317</pub-id>
          <pub-id pub-id-type="pii">S0022-3476(20)31362-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dietterich</surname>
              <given-names>TG</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Kittler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Roli</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Ensemble methods in machine learning</article-title>
          <source>Multiple Classifier Systems, Lecture Notes in Computer Science, Volume 1857</source>
          <year>2000</year>
          <publisher-loc>Berlin, Germany</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>1</fpage>
          <lpage>15</lpage>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
