<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JD</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Diabetes</journal-id>
      <journal-title>JMIR Diabetes</journal-title>
      <issn pub-type="epub">2371-4379</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i1e49113</article-id>
      <article-id pub-id-type="pmid">37999944</article-id>
      <article-id pub-id-type="doi">10.2196/49113</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Machine Learning Web App to Predict Diabetic Blood Glucose Based on a Basic Noninvasive Health Checkup, Sociodemographic Characteristics, and Dietary Information: Case Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Li</surname>
            <given-names>Sheyu</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Jiwani</surname>
            <given-names>Nasmin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Matabuena</surname>
            <given-names>Marcos</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Sampa</surname>
            <given-names>Masuda Begum</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1707-0227</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Biswas</surname>
            <given-names>Topu</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0000-3562-6546</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Rahman</surname>
            <given-names>Md Siddikur</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8925-6544</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Aziz</surname>
            <given-names>Nor Hidayati Binti Abdul</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7995-4912</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Hossain</surname>
            <given-names>Md Nazmul</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0574-5223</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Aziz</surname>
            <given-names>Nor Azlina Ab</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Center for Engineering Computational Intelligence</institution>
            <institution>Faculty of Engineering and Technology</institution>
            <institution>Multimedia University</institution>
            <addr-line>Jalan Ayer Keroh Lama, Bukit Beruang</addr-line>
            <addr-line>Melaka, 75450</addr-line>
            <country>Malaysia</country>
            <phone>60 132999042</phone>
            <email>azlina.aziz@mmu.edu.my</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2119-6191</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Center for Engineering Computational Intelligence</institution>
        <institution>Faculty of Engineering and Technology</institution>
        <institution>Multimedia University</institution>
        <addr-line>Melaka</addr-line>
        <country>Malaysia</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Computer Science and Engineering</institution>
        <institution>Faculty of Science, Engineering and Technology</institution>
        <institution>University of Science and Technology Chittagong</institution>
        <addr-line>Chattogram</addr-line>
        <country>Bangladesh</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Statistics</institution>
        <institution>Faculty of Science</institution>
        <institution>Begum Rokeya University</institution>
        <addr-line>Rangpur</addr-line>
        <country>Bangladesh</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Marketing</institution>
        <institution>Faculty of Business Studies</institution>
        <institution>University of Dhaka</institution>
        <addr-line>Dhaka</addr-line>
        <country>Bangladesh</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Nor Azlina Ab Aziz <email>azlina.aziz@mmu.edu.my</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>24</day>
        <month>11</month>
        <year>2023</year>
      </pub-date>
      <volume>8</volume>
      <elocation-id>e49113</elocation-id>
      <history>
        <date date-type="received">
          <day>18</day>
          <month>5</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>16</day>
          <month>7</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>28</day>
          <month>9</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>11</day>
          <month>10</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Masuda Begum Sampa, Topu Biswas, Md Siddikur Rahman, Nor Hidayati Binti Abdul Aziz, Md Nazmul Hossain, Nor Azlina Ab Aziz. Originally published in JMIR Diabetes (https://diabetes.jmir.org), 24.11.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Diabetes, is properly cited. The complete bibliographic information, a link to the original publication on https://diabetes.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://diabetes.jmir.org/2023/1/e49113" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Over the past few decades, diabetes has become a serious public health concern worldwide, particularly in Bangladesh. The advancement of artificial intelligence can be reaped in the prediction of blood glucose levels for better health management. However, the practical validity of machine learning (ML) techniques for predicting health parameters using data from low- and middle-income countries, such as Bangladesh, is very low. Specifically, Bangladesh lacks research using ML techniques to predict blood glucose levels based on basic noninvasive clinical measurements and dietary and sociodemographic information.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>To formulate strategies for public health planning and the control of diabetes, this study aimed to develop a personalized ML model that predicts the blood glucose level of urban corporate workers in Bangladesh.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Based on the basic noninvasive health checkup test results, dietary information, and sociodemographic characteristics of 271 employees of the Bangladeshi Grameen Bank complex, 5 well-known ML models, namely, linear regression, boosted decision tree regression, neural network, decision forest regression, and Bayesian linear regression, were used to predict blood glucose levels. Continuous blood glucose data were used in this study to train the model, which then used the trained data to predict new blood glucose values.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Boosted decision tree regression demonstrated the greatest predictive performance of all evaluated models (root mean squared error=2.30). This means that, on average, our model’s predicted blood glucose level deviated from the actual blood glucose level by around 2.30 mg/dL. The mean blood glucose value of the population studied was 128.02 mg/dL (SD 56.92), indicating a borderline result for the majority of the samples (normal value: 140 mg/dL). This suggests that the individuals should be monitoring their blood glucose levels regularly.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This ML-enabled web application for blood glucose prediction helps individuals to self-monitor their health condition. The application was developed with communities in remote areas of low- and middle-income countries, such as Bangladesh, in mind. These areas typically lack health facilities and have an insufficient number of qualified doctors and nurses. The web-based application is a simple, practical, and effective solution that can be adopted by the community. Use of the web application can save money on medical expenses, time, and health management expenses. The created system also aids in achieving the Sustainable Development Goals, particularly in ensuring that everyone in the community enjoys good health and well-being and lowering total morbidity and mortality.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>blood glucose prediction</kwd>
        <kwd>boosted decision tree regression model</kwd>
        <kwd>machine learning</kwd>
        <kwd>noncommunicable diseases</kwd>
        <kwd>noninvasive</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Diabetes mellitus (DM), which is characterized by elevated blood glucose levels (BGLs), is a disease that is proliferating swiftly worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. The International Diabetes Federation predicted that by the end of 2045, 800 million people would have this disease [<xref ref-type="bibr" rid="ref2">2</xref>]. Diabetes is a noncommunicable disease (NCD) that is often regarded as the primary cause of numerous illnesses [<xref ref-type="bibr" rid="ref3">3</xref>]. Uncontrolled diabetes harms almost all body organs. Over time, the excessive glucose in the blood stream causes serious and even mortality-related complications, such as heart conditions, kidney issues, eye issues, diabetic neuropathy, and diabetic retinopathy [<xref ref-type="bibr" rid="ref4">4</xref>]. Diseases such as asthma, edema, and oral diseases are substantially correlated with diabetes incidence [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
      <p>High blood glucose affects a person’s health and is a risk factor for developing NCDs [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. It is important to detect and monitor diabetes and prevent or control the major complications of the disease. Thus, early prediction of BGLs can reduce the amount of money spent on public health annually and help people become more aware of how to protect themselves from diabetes. Such prediction is crucial to the efficient management of diabetes. The goal of managing type 1 diabetes is to achieve optimal and long-lasting BGL control. This goal can be supported by the automated prediction of BGL using machine learning (ML) techniques, which are thought to be a promising approach. ML is a technique for improving performance by automatically learning from experience and making more accurate predictions [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Numerous factors influence BGLs. Future BGLs are influenced by prior glucose observations as well as insulin dosage, carbohydrate intake, and other lifestyle factors. Obesity and biomarkers (eg, body fluids including urine, blood, and saliva) are a few of the many factors that have a significant role in the onset and course of DM [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      <p>In Bangladesh, urban residents exhibit a greater tendency to develop NCDs, including diabetes, than rural residents. This is due to several factors, including their occupational lifestyle (eg, heavy workloads and prolonged sitting to complete their tasks). Thus, people working in the private corporate sector are more likely to develop NCDs [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      <p>One of the main goals of health policy is to lower the costs associated with controlling NCDs [<xref ref-type="bibr" rid="ref11">11</xref>]. Hence, studies on how to regularly assess BGLs in a cost-effective way are needed [<xref ref-type="bibr" rid="ref12">12</xref>]. ML-based prediction models can help to achieve this goal. However, studies supporting the practical validity of ML techniques for predicting health parameters using data from low- and middle-income countries, such as Bangladesh, are very few [<xref ref-type="bibr" rid="ref13">13</xref>]. Specifically, Bangladesh lacks research using ML techniques to predict BGLs based on basic noninvasive clinical measurements and dietary and sociodemographic information. To formulate strategies for public health planning and the control of diabetes, this study aimed to develop a personalized ML model that predicts the BGLs of urban corporate workers in Bangladesh. We used 5 regression prediction models, including boosted decision tree regression, decision forest regression, Bayesian linear regression, neural network, and linear regression. The models were trained and tested using a data set collected by the team using basic noninvasive clinical measurement devices together with dietary and sociodemographic information. Among the models, boosted decision tree regression exhibited the best performance in predicting the BGLs of the collected data, achieving the lowest root mean square error (RMSE) of 2.3 and mean absolute error (MAE) of 1.3. The model was then incorporated into a web app called the BloodGlucosePrediction Calculator [<xref ref-type="bibr" rid="ref14">14</xref>], that allows individuals with basic noninvasive health measurements, dietary information, and sociodemographic information to predict their BGL value. Visual Studio was used to develop the web app. The app was developed based on the ML predictive model application programming interface and POST URL. The automated web-based BGL prediction system in this study is capable of aiding communities, especially those in highly remote areas, to diagnose BGLs quickly and easily. </p>
      <p>Many studies on the prediction of BGLs have been conducted, each using a different set of data, patients, and features [<xref ref-type="bibr" rid="ref15">15</xref>]. For example, a study used recurrent artificial neural networks (ANNs) and Elman recurrent ANNs to predict BGLs based on previous blood glucose values. They used a virtual data set called “Case 002” compiled from the free AIDA simulator. The study used RMSE to measure performance and obtained average RMSE values of 6.43 mg/dL, 7.45 mg/dL, 8.13 mg/dL, and 9.03 mg/dL for prediction horizons of 15 minutes, 30 minutes, 45 minutes, and 60 minutes, respectively. The researchers suggested additional case studies [<xref ref-type="bibr" rid="ref16">16</xref>].</p>
      <p>In another study [<xref ref-type="bibr" rid="ref17">17</xref>], prediction models using nonlinear autoregressive neural networks and long short-term memory (LSTM) networks were introduced for predicting future glucose levels. These models were trained on a large set of continuous glucose monitoring data. The LSTM model, in particular, demonstrated superior predictive performance, achieving a lower RMSE value of 19.47 compared to other models. In a study using the OhioT1DM data set, which contains data from 6 patients with type 1 diabetes who participated in an institutional review board–approved study for 8 weeks between March 2016 and April 2017, the researchers applied LSTM and neural attention models for blood glucose prediction [<xref ref-type="bibr" rid="ref18">18</xref>]. Their study found that the LSTM algorithm showed the best performance among the tested models.</p>
      <p>The ML model mentioned in the research by Orabi et al [<xref ref-type="bibr" rid="ref5">5</xref>] was trained on a data set of information from patients with type 2 diabetes. The data set, containing 23 characteristics, was collected by the Egyptian National Research Center specifically from patients with diabetes. The developed system showed 84% prediction accuracy. Meanwhile, Wu et al [<xref ref-type="bibr" rid="ref19">19</xref>] predicted type 2 DM using the Pima Indian Diabetes data set. They achieved an accuracy of 95.42% using the improved K-means algorithm and the logistic regression algorithm. They suggested further work to develop an application based on the proposed model. Kaur and Kumari [<xref ref-type="bibr" rid="ref8">8</xref>] also used the Pima Indian Diabetes data set to develop ML models that classify the patients into diabetic and nondiabetic categories [<xref ref-type="bibr" rid="ref8">8</xref>]. They applied and compared 5 different predictive models. The highest accuracy was reported for the linear kernel support vector machine, which achieved an accuracy of 0.89. The other 4 algorithms, including radial basis kernel support vector machine, k-nearest neighbor, ANN, and multifactor dimensionality reduction, achieved accuracies of 0.84, 0.88, 0.86, and 0.83, respectively.</p>
      <p>According to a review of diabetes prediction papers [<xref ref-type="bibr" rid="ref9">9</xref>], various data set characteristics, such as dimensionality, the number of instances relative to the number of features, or the data set type (genetic or clinical), can significantly impact the algorithm’s performance. As a result, an algorithm that performs best on one data set may have lower prediction accuracy than other algorithms on different data sets.</p>
      <p>Numerous studies have focused on predicting BGLs by using various feature sets and applying mathematical and ML models. However, no model has achieved 100% accuracy. Moreover, most of the previous ML-based studies in health care were conducted using data from high-income countries [<xref ref-type="bibr" rid="ref20">20</xref>]. The application of supervised ML approaches to medical data to predict diseases, the survivability of diseases, and different types of health checkup test results by using sample data from Bangladesh is lacking. A search through several academic databases, including PubMed, IEEE Xplore, and Google Scholar, found that no existing studies specifically focused on ML blood glucose prediction in Bangladesh using dietary and sociodemographic data. Therefore, more research is needed in this area. Consequently, this paper focuses on predicting continuous BGLs based on data from noninvasive basic health checkup tests, dietary information, and sociodemographic characteristics collected from patients from Bangladesh.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Collection</title>
        <p>The data were collected from the employees at the Grameen Bank complex in Dhaka, Bangladesh, which includes 18 distinct organizations with more than 500 employees, including Grameen Bank, Grameen Communications, other nongovernmental organizations, and private companies. The study collected data from 271 workers to predict their BGLs. Typically, a larger sample size is expected for ML approaches. However, previous studies included relatively few participants (eg, 118 [<xref ref-type="bibr" rid="ref21">21</xref>] and 300 [<xref ref-type="bibr" rid="ref22">22</xref>]). It must be mentioned that a small sample size is sometimes associated with higher classification accuracy [<xref ref-type="bibr" rid="ref23">23</xref>]. A simple random sampling procedure drew the sample. In this study, we informed people first about our portable health clinic (PHC) system. After the initial introduction of the PHC system, the survey was conducted among those who came to the service point and received the PHC service at least once.</p>
        <p>We calculated the required sample size using the following sample size formula, S = Z<sup>2</sup> × P × (1−P)M2, where S is the sample size for infinite population, Z is the <italic>z</italic> score, P is the population proportion (assumed as 50% or 0.5), and M is the margin of error.</p>
        <p>Using the above formula for Z=1.960, P=0.5, and M=0.05, we calculated the required sample size to be 384. However, due to missing values, we included 275 observations in our study.</p>
        <p>This study collected the test items used as input factors using the human-assisted PHC system. However, measurements such as arrhythmia, blood cholesterol, blood hemoglobin, blood grouping, urinary sugar, and urinary protein were excluded due to many missing cases. The blood glucose measurement was considered as an output factor. The PHC system has been previously described in detail [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
        <p>Clinical measurements were obtained through direct diagnosis using PHC devices operated during data collection by a well-trained nurse or health care professional. The clinical measurements assessed by a PHC were as follows: blood pressure; pulse rate; body temperature; oxygenation of blood; arrhythmia; body mass index (BMI); waist, hip, and waist to hip ratio; blood glucose; blood cholesterol; blood hemoglobin; blood uric acid; blood grouping; urinary sugar; and urinary protein. Data on dietary information and sociodemographic characteristics were collected during face-to-face interviews using a standard questionnaire.</p>
      </sec>
      <sec>
        <title>Regression Predictive Modeling</title>
        <sec>
          <title>Machine Learning Models</title>
          <p>Since the study’s targeted output variable was a continuous variable, a person’s BGL value was predicted using a regression prediction model. A regression predictive model’s performance is reported as an error in those predictions because it predicts a quantity. The most popular ML models, including boosted decision tree regression, decision forest regression, Bayesian linear regression, linear regression, and neural network, were evaluated. This study chose these models for comparison because they are widely used to predict medical data.</p>
        </sec>
        <sec>
          <title>Linear Regression</title>
          <p>The linear regression model is a very simple ML method in which each data point consists of a pair of vectors, namely, the input vector and the output vector. Even on larger data sets, it is the most straightforward, traditional, and widely-applied correlational method [<xref ref-type="bibr" rid="ref13">13</xref>]. The form of the linear regression model is <italic>U<sub>pred</sub></italic> = <italic>βx<sub>in</sub></italic>, where <italic>β</italic> represents the vector of coefficients, which are calculated by applying the least-squares method; <italic>U<sub>pred</sub></italic> is the predicted value; and <italic>x<sub>in</sub></italic> is the value of the independent variable [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        </sec>
        <sec>
          <title>Boosted Decision Tree Regression</title>
          <p>Boosting is a popular ML ensemble method [<xref ref-type="bibr" rid="ref25">25</xref>], where boosting in a decision tree ensemble tends to improve accuracy with some small risk of less coverage. It is an ML method for regression issues. It builds each regression tree in a stepwise fashion using a predefined loss function to measure the error in each step and correct for it in the next. Thus, the prediction model is an ensemble of weaker prediction models. In regression problems, boosting builds a series of trees in a stepwise fashion, and then selects the optimal tree using an arbitrary differentiable loss function [<xref ref-type="bibr" rid="ref26">26</xref>]. Like random forest, it combines many smaller, weaker models into a final summed prediction. However, the idea of boosting is to add new models to the ensemble in a sequence for a number of sequences. In each iteration, a new weak model is trained for the whole ensemble learned up to that new model. These iteratively produced new models are built to be maximally correlated with the negative gradient of the loss function that is also associated with the ensemble as a whole. In this approach, a performance function is placed on the gradient boosting machine to find the point at which adding more iterations becomes negligible in benefit (ie, adding more simple models, in this case decision trees, no longer reduces the error by a significant margin). At this point, the ensemble sums all of the predictions into a final overall prediction [<xref ref-type="bibr" rid="ref27">27</xref>]. The boosted trees model is an additive model that makes predictions by combining decisions from a sequence of base models. More formally, the class of models can be written as <italic>G</italic>(<italic>x</italic>) = <italic>f</italic><sub>0</sub>(<italic>x</italic>) + <italic>f</italic><sub>1</sub>(<italic>x</italic>) + <italic>f</italic><sub>2</sub>(<italic>x</italic>) + … + <italic>f</italic><sub>n</sub>(<italic>x</italic>), where the final classifier, <italic>G</italic>, is the sum of simple base classifiers <italic>f<sub>i</sub></italic>. For the boosted tree model, each base classifier is a simple <ext-link ext-link-type="uri" xlink:href="https://apple.github.io/turicreate/docs/userguide/supervised-learning/decision_tree_regression.html" xlink:type="simple">decision tree</ext-link>. This broad technique of using multiple models to obtain better predictive performance is called <ext-link ext-link-type="uri" xlink:href="http://en.wikipedia.org/wiki/Ensemble_learning" xlink:type="simple">model ensembling</ext-link>.</p>
        </sec>
        <sec>
          <title>Neural Network</title>
          <p>The neural network is a network of connected neurons. The neurons cannot operate without other neurons with whom they are connected. Usually, they are grouped in layers, process data in each layer, and pass it forward to the next layer. The last layer of neurons makes the decisions [<xref ref-type="bibr" rid="ref28">28</xref>].</p>
        </sec>
        <sec>
          <title>Decision Forest Regression</title>
          <p>This regression model consists of an ensemble of decision trees. A collection of trees constitutes a forest. Each tree in a regression decision forest outputs a Gaussian distribution as a prediction. Aggregation is performed over the ensemble of trees to find a Gaussian distribution closest to the combined distribution for all trees in the model [<xref ref-type="bibr" rid="ref29">29</xref>]. This technique generates several decision trees during training, which can split randomly from a seed point. This results in a “forest” of randomly generated decision trees whose outcomes are ensembled by the random forest algorithm to predict more accurately than a single tree does alone. One problem with a single decision tree is overfitting, which makes the prediction seem very good on the training data but unreliable in future predictions [<xref ref-type="bibr" rid="ref27">27</xref>]. By using decision forest regression, a model can be trained with a relatively small number of samples and produce good results.</p>
        </sec>
        <sec>
          <title>Bayesian Linear Regression</title>
          <p>Recently, Bayesian learning has been widely adopted and proven more powerful than other ML techniques. Bayesian linear regression allows a fairly natural mechanism to survive insufficient or poorly distributed data. It allows putting a prior on the coefficients and noise so that the priors can take over in the absence of data. The result of Bayesian linear regression is a distribution of possible model parameters based on the data and the prior. This allows the uncertainty about the model to be quantified with fewer data points, and the posterior distribution will be more spread out.</p>
        </sec>
      </sec>
      <sec>
        <title>Experimental Setup</title>
        <p>Azure Machine Learning Studio (Microsoft Corp) was used for the implementation of trained models. Azure Machine Learning Studio provides a user-friendly, visual approach to building ML pipelines. Azure Machine Learning Studio offers a graphical interface that allows users to design and build ML pipelines using a drag-and-drop approach. It also provides a wide range of prebuilt modules for data preprocessing, feature engineering, model training, and evaluation. These modules can be combined to create complex pipelines without writing code. We trained 5 relevant ML models using our data. The detailed technical aspects of the modeling process are shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
        <p><xref rid="figure1" ref-type="fig">Figure 1</xref> shows the ML algorithms used in this study. First, the data file was uploaded into the experiment. Then, the data were edited, and variables for use in the predictive algorithms were selected. Next, the data set was split, and the ML algorithms were trained with the given data set to develop the model. After training, the score model was obtained and the trained model was evaluated to measure its accuracy (ie, performance).</p>
        <p>To evaluate the performance of the models, RMSE values from each model were used. The RMSE of a model is the average difference between the model’s prediction and the actual outcome [<xref ref-type="bibr" rid="ref27">27</xref>]. It indicates how close the predicted value is to the actual value. There is no cutoff or benchmark for RMSE values. The smaller the value, the better the prediction. The MAE was also used. It is the sum of the absolute differences between predictions and actual values. Additionally, the coefficient of determination (<italic>R</italic><sup>2</sup>) was measured. <italic>R</italic><sup>2</sup> represents how close the predicted value is to the actual value, and a higher value of <italic>R</italic><sup>2</sup> is desirable.</p>
        <p>Each model was trained on a 70% training sample to ensure uniform training. We split data according using a 0.7:0.3 training set to test set ratio. We did not use the cross-validation method because K-fold cross-validation produces strongly biased performance estimates with small sample sizes [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <p>The input-process-output model for predicting blood glucose based on sociodemographic characteristics, dietary information, and some basic health checkup test results is shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>. The 3 types of inputs were fed into the process using the 5 ML regression algorithms. The output was the predicted BGL.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flowchart of Azure machine learning algorithms.</p>
          </caption>
          <graphic xlink:href="diabetes_v8i1e49113_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>The input-process-output model used to predict blood glucose levels after processing 17 input variables using ML algorithms. BMI: body mass index; BP: blood pressure; ML: machine learning.</p>
          </caption>
          <graphic xlink:href="diabetes_v8i1e49113_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>The authors obtained ethics approval from the National Research Ethics Committee of the Bangladesh Medical Research Council (18325022019).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Description of the Study Population</title>
        <p>The descriptive statistics of the study participants and the summary statistics of the selected categorical predictors used in ML are shown in <xref ref-type="table" rid="table1">Table 1</xref> and <xref ref-type="table" rid="table2">Table 2</xref>, respectively.</p>
        <p>The mean age of the respondents was 49.61 (SD 7.39) years, and most participants were aged 50 years. On average, the respondents had a BMI of 25.37 (SD 3.20). The World Health Organization defines BMIs ranging from 25 to 29.9 as overweight; therefore, most of the respondents were overweight. The respondents’ average BGL was on the borderline at 128.02 (SD 56.92) mg/dL (whereas the normal value is 140 mg/dL). This shows that it is important for the respondents to check their blood glucose regularly.</p>
        <p>The majority (n=225, 83%) of the respondents were men and most had completed at least a college or university degree. Among the 271 respondents, 9.6% (n=26) reported that they drink sugar-containing drinks (eg, Coke, Fanta, soda, or fruit juice) 3 or more times a week, and 18.1% (n=49) reported that they eat fast foods (eg, pizza, hamburgers, and deep-fried foods) 3 or more time a week.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary statistics of the selected continuous predictors used in machine learning (n=271).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="320"/>
            <col width="320"/>
            <col width="360"/>
            <thead>
              <tr valign="top">
                <td>Variables</td>
                <td>Range</td>
                <td>Mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Age (years)</td>
                <td>34-77</td>
                <td>49.61 (7.39)</td>
              </tr>
              <tr valign="top">
                <td>Height (cm)</td>
                <td>140.00-184.00</td>
                <td>163.05 (7.45)</td>
              </tr>
              <tr valign="top">
                <td>Weight (kg)</td>
                <td>44.20-114.40</td>
                <td>67.52 (10.06)</td>
              </tr>
              <tr valign="top">
                <td>BMI<sup>a</sup> (kg/m<sup>2</sup>)</td>
                <td>18.39-40.53</td>
                <td>25.37 (3.20)</td>
              </tr>
              <tr valign="top">
                <td>Waist (cm)</td>
                <td>63.60-118.00</td>
                <td>90.24 (7.80)</td>
              </tr>
              <tr valign="top">
                <td>Hip (cm)</td>
                <td>80.00-127.00</td>
                <td>94.54 (6.29)</td>
              </tr>
              <tr valign="top">
                <td>Waist:hip ratio</td>
                <td>0.64-1.11</td>
                <td>0.96 (0.06)</td>
              </tr>
              <tr valign="top">
                <td>Body temperature (°F)</td>
                <td>92.12-99.64</td>
                <td>96.07 (1.15)</td>
              </tr>
              <tr valign="top">
                <td>SpO2<sup>b</sup></td>
                <td>93-99</td>
                <td>97.67 (1.17)</td>
              </tr>
              <tr valign="top">
                <td>Systolic BP<sup>c</sup> (mmHg)</td>
                <td>92-180</td>
                <td>126.68 (14.88)</td>
              </tr>
              <tr valign="top">
                <td>Diastolic BP (mmHg)</td>
                <td>59-108</td>
                <td>81.71 (8.43)</td>
              </tr>
              <tr valign="top">
                <td>Pulse rate (bpm)</td>
                <td>51-123</td>
                <td>80.27 (11.66)</td>
              </tr>
              <tr valign="top">
                <td>Blood uric acid</td>
                <td>3.10-11.00</td>
                <td>6.63 (1.54)</td>
              </tr>
              <tr valign="top">
                <td>Blood glucose (mg/dL)</td>
                <td>66.60-392.40</td>
                <td>128.02 (56.92)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>BMI: body mass index.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Blood oxygenation.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>BP: blood pressure.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Summary statistics of the selected categorical predictors used in machine learning.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="460"/>
            <col width="510"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Category</td>
                <td>Participants (n=271), n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Gender</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>225 (83)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>46 (17)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Education</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No education (no school entered)</td>
                <td>10 (3.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Primary school completed</td>
                <td>30 (11.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Secondary school completed</td>
                <td>11 (4.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>High school completed</td>
                <td>23 (8.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Vocation school completed</td>
                <td>1 (0.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>College or university completed</td>
                <td>63 (23.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Higher education (master or doctor) completed</td>
                <td>133 (49.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Drinks sugar-containing drinks<sup>a</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>26 (9.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td>245 (90.4)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Eats fast foods<sup>b</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>49 (18.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td>222 (81.9)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Drinks sugar-containing drinks (eg, Coke, Fanta, soda, fruit juice, orsother Sweet or sugar-containing drinks) 3 or more times a week.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>Eats fast foods, such as pizza, hamburgers, or deep-fried foods (eg, singara, samosa, moglai parata) 3 or more times a week.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Prediction Performance Assessment</title>
        <p>To examine the prediction performance of the regression predictive technique using ML, the main evaluation criterion used was the RMSE. The RMSE measures the average magnitude of the error by taking the square root of the average of the squared differences between the prediction and actual observations. The RMSE value gives us an idea of how much, on average, the predicted values deviate from the actual values; it is a measure of the fit of the model to the data points. <xref ref-type="table" rid="table3">Table 3</xref> presents the performance of the regression models. The boosted decision tree regression model performed the best among the tested models. Its RMSE was the lowest at a value of 2.30, indicating that, on average, the boosted decision tree regression model’s predicted blood glucose deviated from the actual blood glucose by around 2.30 mg/dL. Its RMSE and MAE were significantly lower than those of the other models, while it’s <italic>R</italic><sup>2</sup> was the largest (0.99).</p>
        <p>The score model of the best predictive model—the boosted decision tree regression—is shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>. The “Scored Labels” column (last column) in <xref rid="figure3" ref-type="fig">Figure 3</xref> indicates the predicted value of BGLs. It can be seen that the deviation between the scored labels and the actual BGL reported in the “Bglucose” column was small.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Comparison of modeling techniques.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="340"/>
            <col width="250"/>
            <col width="210"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Model name</td>
                <td>Root mean squared error</td>
                <td>Mean absolute error</td>
                <td>
                  <italic>R</italic>
                  <sup>2</sup>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Neural network</td>
                <td>45.54</td>
                <td>36.24</td>
                <td>0.18</td>
              </tr>
              <tr valign="top">
                <td>Decision forest regression</td>
                <td>22.99</td>
                <td>17.46</td>
                <td>0.79</td>
              </tr>
              <tr valign="top">
                <td>Linear regression</td>
                <td>44.66</td>
                <td>35.59</td>
                <td>0.21</td>
              </tr>
              <tr valign="top">
                <td>Boosted decision tree regression</td>
                <td>2.30</td>
                <td>1.30</td>
                <td>0.99</td>
              </tr>
              <tr valign="top">
                <td>Bayesian linear regression</td>
                <td>44.49</td>
                <td>34.50</td>
                <td>0.22</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Partial view of the score model (prediction of blood glucose level) obtained by the boosted decision tree regression model. BloodPressuresys: systolic blood pressure; BloodPressuredia: diastolic blood pressure; Bglucose: blood glucose level; Ffood: fast food; Sdrinks: sugary drinks.</p>
          </caption>
          <graphic xlink:href="diabetes_v8i1e49113_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>ML algorithms can identify the patterns in a data set that may not be directly apparent. Thus, ML can provide helpful information and support to medical staff by identifying patterns that may not be obvious [<xref ref-type="bibr" rid="ref30">30</xref>]. Comparison of the results found in this study to those in previous related works is crucial. Most previous studies have reported performance measurements as a function of classification accuracy, which may not be directly comparable to this study, which adopts a regression approach to build a predictive model for the continuous variable (ie, BGL).</p>
        <p>A previous study compared the performance of 3 ML models, namely logistic regression, ANN, and decision tree models, for predicting diabetes or prediabetes using 12 common risk factors (including only 1 clinical factor: BMI) in Guangzhou, China [<xref ref-type="bibr" rid="ref31">31</xref>], and found accuracies of 77.87%, 73.23%, and 76.13% for the decision tree model, ANN, and logistic regression model, respectively.</p>
        <p>The gradient boosting ML algorithm has been successfully used in clinical studies to predict cardiovascular diseases [<xref ref-type="bibr" rid="ref12">12</xref>]. The gradient boosting decision tree method by Friedman [<xref ref-type="bibr" rid="ref32">32</xref>] predicted BMI with an accuracy of 0.91 [<xref ref-type="bibr" rid="ref33">33</xref>]. In the current study, decision tree regression was the best predictive model, followed by decision forest regression. Both of these are ensemble learning methods.</p>
        <p>In this study, 5 ML prediction algorithms were evaluated to predict blood glucose values. The health records of 271 employees aged 34 to 77 years were collected and used in this study. The data included well-known relevant factors of high blood glucose, such as age and BMI, as well as other factors with unknown associations with BGL. Specifically, 17 noninvasive health measurements, dietary information, and sociodemographic information were used for the prediction. This study used portable, cheap, and affordable devices for clinical data collection. The low-input dimensions provided the advantage of keeping the necessary time to train the models relatively small. Blood glucose was set as an output factor. Among the studied prediction algorithms, boosted decision tree regression was found to be the most effective with the best RMSE (2.3); this RMSE value was better than any reported in the literature. The developed model is a powerful tool for predicting blood glucose with limited medical resources and has been deployed on a website [<xref ref-type="bibr" rid="ref14">14</xref>]. <xref rid="figure4" ref-type="fig">Figure 4</xref> shows the web app. With this app, the patients of caregivers do not need to carry the blood glucose measuring instruments or be concerned with ensuring enough supply of test strips and lancet needles, as the predictor is able to predict BGL using external factors.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Screenshot view of the website to predict blood glucose value obtained by integrating the best performing boosted decision tree regression model into the application. BloodPressuresys: systolic blood pressure; BloodPressuredia: diastolic blood pressure; Bglucose: blood glucose level; Ffood: fast food; Sdrinks: sugary drinks.</p>
          </caption>
          <graphic xlink:href="diabetes_v8i1e49113_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study provides a measure for reducing NCDs and can be a good component in the national or global plan. We developed a blood glucose prediction model based on personal characteristics, dietary information, and some basic clinical measurements related to NCDs. Such a blood glucose prediction model is useful for reducing health management costs and improving awareness among high-risk individuals. Predicted glucose values can be used for early hypoglycemic or hyperglycemic alarms. These predictions can also help prevent complications associated with high BGLs. As a result, the developed model can help achieve the Sustainable Development Goals, ensuring universal and equal health coverage, and thus reducing overall morbidity and mortality.</p>
        <p>However, there are several limitations to this study. First, the number of samples we studied was small; it must be expanded to train the prediction model in the future. Second, this study was limited to a particular area, specifically among employees working in a corporate office. We collected the training data from this specific area. We trained our model by using these data only. The data from other institutes do not confirm our prediction model. Our findings may not be applicable to a broader population or different geographical locations. This is because the characteristics, behaviors, and dynamics of the population might differ significantly from one area to another. As a result, it becomes challenging to generalize the results beyond the confines of the chosen area and employee group. The specific area and employee group might possess unique cultural, economic, or contextual factors influencing their behaviors and responses. These factors might not hold true for other settings or groups, leading to skewed conclusions if applied outside the study’s scope. The data from other institutes do not confirm our prediction model. However, the framework achieves high performance on Grameen Bank complex data. Thus, we believe this data-based strategy is also fit for predicting blood glucose in other communities. In future studies, additional features (eg, work stress, everyday physical activity, eating red meat) should be considered to improve the prediction accuracy. Nonetheless, this study served as a successful case.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ANN</term>
          <def>
            <p>artificial neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BGL</term>
          <def>
            <p>blood glucose level</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BMI</term>
          <def>
            <p>body mass index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">DM</term>
          <def>
            <p>diabetes mellitus</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">LSTM</term>
          <def>
            <p>long short-term memory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">MAE</term>
          <def>
            <p>mean absolute error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">NCD</term>
          <def>
            <p>noncommunicable disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">PHC</term>
          <def>
            <p>portable health clinic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">RMSE</term>
          <def>
            <p>root mean square error</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was supported by multiple organizations. JSPS KAKENHI (grant 18K11529) and the Future Earth Research Fund (grant 18-161009264) jointly financed the core research. The Institute of Decision Science for a Sustainable Society, Kyushu University, Japan, provided travel expenses for data collection. Grameen Communications, Bangladesh, and Multimedia University, Malaysia (grant MMUI/230019)<bold>,</bold> provided technical assistance.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>MBS conceptualized the study<bold>,</bold> performed the formal analysis and investigation, designed the methodology, and wrote the manuscript. MBS, TB, MSR, NHBAA, MNH, and NAAA reviewed and edited the manuscript. All authors have read and agreed to the published version of the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>Diabetes</article-title>
          <source>World Health Organization</source>
          <access-date>2023-11-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/health-topics/diabetes#tab=tab_1">https://www.who.int/health-topics/diabetes#tab=tab_1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>IDF Diabetes Atlas 2022 reports</article-title>
          <source>IDF Diabetes Atlas</source>
          <access-date>2023-11-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://diabetesatlas.org/2022-reports/">https://diabetesatlas.org/2022-reports/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>Diabetes is considered as mother of all diseases</article-title>
          <source>YogaTute Health</source>
          <access-date>2023-11-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://yogatute.com/2016/10/diabetes-considered-mother-of_all_diseases.html">https://yogatute.com/2016/10/diabetes-considered-mother-of_all_diseases.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zarkogianni</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mitsis</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Litsa</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Arredondo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ficο</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fioravanti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nikita</surname>
              <given-names>KS</given-names>
            </name>
          </person-group>
          <article-title>Comparative assessment of glucose prediction models for patients with type 1 diabetes mellitus applying sensors for glucose and physical activity monitoring</article-title>
          <source>Med Biol Eng Comput</source>
          <year>2015</year>
          <month>12</month>
          <volume>53</volume>
          <issue>12</issue>
          <fpage>1333</fpage>
          <lpage>1343</lpage>
          <pub-id pub-id-type="doi">10.1007/s11517-015-1320-9</pub-id>
          <pub-id pub-id-type="medline">26049412</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11517-015-1320-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Orabi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kamal</surname>
              <given-names>YM</given-names>
            </name>
            <name name-style="western">
              <surname>Rabah</surname>
              <given-names>TM</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Perner</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Early predictive system for diabetes mellitus disease</article-title>
          <source>Advances in Data Mining. Applications and Theoretical Aspects</source>
          <year>2016</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>427</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yun</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Development of nephrolithiasis in asymptomatic hyperuricemia: a cohort study</article-title>
          <source>Am J Kidney Dis</source>
          <year>2017</year>
          <month>08</month>
          <volume>70</volume>
          <issue>2</issue>
          <fpage>173</fpage>
          <lpage>181</lpage>
          <pub-id pub-id-type="doi">10.1053/j.ajkd.2017.01.053</pub-id>
          <pub-id pub-id-type="medline">28410765</pub-id>
          <pub-id pub-id-type="pii">S0272-6386(17)30548-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Choe</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Exploration of machine learning for hyperuricemia prediction models based on basic health checkup tests</article-title>
          <source>J Clin Med</source>
          <year>2019</year>
          <month>02</month>
          <day>02</day>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>172</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jcm8020172"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jcm8020172</pub-id>
          <pub-id pub-id-type="medline">30717373</pub-id>
          <pub-id pub-id-type="pii">jcm8020172</pub-id>
          <pub-id pub-id-type="pmcid">PMC6406925</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaur</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kumari</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Predictive modelling and analytics for diabetes using a machine learning approach</article-title>
          <source>Appl Comput Inform</source>
          <year>2020</year>
          <month>07</month>
          <day>28</day>
          <volume>18</volume>
          <issue>1/2</issue>
          <fpage>90</fpage>
          <lpage>100</lpage>
          <pub-id pub-id-type="doi">10.1016/j.aci.2018.12.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kavakiotis</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Tsave</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Salifoglou</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Maglaveras</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Vlahavas</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chouvarda</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Machine learning and data mining methods in diabetes research</article-title>
          <source>Comput Struct Biotechnol J</source>
          <year>2017</year>
          <volume>15</volume>
          <fpage>104</fpage>
          <lpage>116</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2001-0370(16)30073-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.csbj.2016.12.005</pub-id>
          <pub-id pub-id-type="medline">28138367</pub-id>
          <pub-id pub-id-type="pii">S2001-0370(16)30073-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC5257026</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sampa</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Hossain</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hoque</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yokota</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Nishikitani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fukuda</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Influence of factors on the adoption and use of ICT-based eHealth technology by urban corporate people</article-title>
          <source>J Serv Sci Manag</source>
          <year>2020</year>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>19</lpage>
          <pub-id pub-id-type="doi">10.4236/jssm.2020.131001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hunter</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Reddy</surname>
              <given-names>KS</given-names>
            </name>
          </person-group>
          <article-title>Noncommunicable diseases</article-title>
          <source>N Engl J Med</source>
          <year>2013</year>
          <fpage>1336</fpage>
          <lpage>1343</lpage>
          <pub-id pub-id-type="doi">10.1016/b978-0-7020-5101-2.00062-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Canes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Steinberg</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lyashevska</surname>
              <given-names>O</given-names>
            </name>
            <collab>AME Big-Data Clinical Trial Collaborative Group</collab>
          </person-group>
          <article-title>Predictive analytics with gradient boosting in clinical medicine</article-title>
          <source>Ann Transl Med</source>
          <year>2019</year>
          <month>04</month>
          <volume>7</volume>
          <issue>7</issue>
          <fpage>152</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31157273"/>
          </comment>
          <pub-id pub-id-type="doi">10.21037/atm.2019.03.29</pub-id>
          <pub-id pub-id-type="medline">31157273</pub-id>
          <pub-id pub-id-type="pii">atm-07-07-152</pub-id>
          <pub-id pub-id-type="pmcid">PMC6511546</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sampa</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Hossain</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Hoque</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yokota</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Nishikitani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Blood uric acid prediction with machine learning: model development and performance comparison</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <month>10</month>
          <day>08</day>
          <volume>8</volume>
          <issue>10</issue>
          <fpage>e18331</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2020/10/e18331/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18331</pub-id>
          <pub-id pub-id-type="medline">33030442</pub-id>
          <pub-id pub-id-type="pii">v8i10e18331</pub-id>
          <pub-id pub-id-type="pmcid">PMC7582147</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <source>BloodGlucosePrediction Calculator</source>
          <access-date>2023-11-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bloodglucoseprediction.azurewebsites.net/webform1">https://bloodglucoseprediction.azurewebsites.net/webform1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Asad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Qamar</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Zeb</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Blood glucose level prediction with minimal inputs using feedforward neural network for diabetic type 1 patients</article-title>
          <source>Proceedings of the 2019 11th International Conference on Machine Learning and Computing</source>
          <year>2019</year>
          <conf-name>ICMLC '19</conf-name>
          <conf-date>February 22-24, 2019</conf-date>
          <conf-loc>Zhuhai</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3318299.3318354</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ben Ali</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hamdi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fnaiech</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Di Costanzo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Fnaiech</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ginoux</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Continuous blood glucose level prediction of type 1 diabetes based on artificial neural network</article-title>
          <source>Biocybern Biomed Eng</source>
          <year>2018</year>
          <volume>38</volume>
          <issue>4</issue>
          <fpage>828</fpage>
          <lpage>840</lpage>
          <pub-id pub-id-type="doi">10.1016/j.bbe.2018.06.005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aliberti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pupillo</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Terna</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Macii</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Di Cataldo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Patti</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Acquaviva</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A multi-patient data-driven approach to blood glucose prediction</article-title>
          <source>IEEE Access</source>
          <year>2019</year>
          <volume>7</volume>
          <fpage>69311</fpage>
          <lpage>69325</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2019.2919184</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mirshekarian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bunescu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Marling</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>LSTMs and neural attention models for blood glucose prediction: comparative experiments on real and synthetic data</article-title>
          <year>2019</year>
          <conf-name>41st Annual International Conference of the IEEE Engineering in Medicine and Biology Society</conf-name>
          <conf-date>July 23-27, 2019</conf-date>
          <conf-loc>Berlin</conf-loc>
          <pub-id pub-id-type="doi">10.1109/embc.2019.8856940</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Type 2 diabetes mellitus prediction model based on data mining</article-title>
          <source>Inform Med Unlocked</source>
          <year>2018</year>
          <volume>10</volume>
          <fpage>100</fpage>
          <lpage>107</lpage>
          <pub-id pub-id-type="doi">10.1016/j.imu.2017.12.006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Visualizing the knowledge structure and evolution of big data research in healthcare informatics</article-title>
          <source>Int J Med Inform</source>
          <year>2017</year>
          <month>02</month>
          <volume>98</volume>
          <fpage>22</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2016.11.006</pub-id>
          <pub-id pub-id-type="medline">28034409</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(16)30255-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zelic</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kononenko</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lavrac</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Vuga</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Induction of decision trees and Bayesian classification applied to diagnosis of sport injuries</article-title>
          <source>J Med Syst</source>
          <year>1997</year>
          <month>12</month>
          <volume>21</volume>
          <issue>6</issue>
          <fpage>429</fpage>
          <lpage>444</lpage>
          <pub-id pub-id-type="doi">10.1023/a:1022880431298</pub-id>
          <pub-id pub-id-type="medline">9555629</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>You</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A machine learning-based framework to identify type 2 diabetes through electronic health records</article-title>
          <source>Int J Med Inform</source>
          <year>2017</year>
          <month>01</month>
          <volume>97</volume>
          <fpage>120</fpage>
          <lpage>127</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27919371"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2016.09.014</pub-id>
          <pub-id pub-id-type="medline">27919371</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(16)30215-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC5144921</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vabalas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gowen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Poliakoff</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Casson</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>Machine learning algorithm validation with a limited sample size</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>11</issue>
          <fpage>e0224365</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0224365"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0224365</pub-id>
          <pub-id pub-id-type="medline">31697686</pub-id>
          <pub-id pub-id-type="pii">PONE-D-19-13163</pub-id>
          <pub-id pub-id-type="pmcid">PMC6837442</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sampa</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Hoque</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Hossain</surname>
              <given-names>MN</given-names>
            </name>
          </person-group>
          <article-title>Impacts of anthropometric, biochemical, socio-demographic, and dietary habits factors on the health status of urban corporate people in a developing country</article-title>
          <source>Healthcare (Basel)</source>
          <year>2020</year>
          <month>06</month>
          <day>27</day>
          <volume>8</volume>
          <issue>3</issue>
          <fpage>188</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=healthcare8030188"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/healthcare8030188</pub-id>
          <pub-id pub-id-type="medline">32605101</pub-id>
          <pub-id pub-id-type="pii">healthcare8030188</pub-id>
          <pub-id pub-id-type="pmcid">PMC7551820</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>WF</given-names>
            </name>
          </person-group>
          <article-title>Prediction modeling using EHR data: challenges, strategies, and a comparison of machine learning approaches</article-title>
          <source>Med Care</source>
          <year>2010</year>
          <month>06</month>
          <volume>48</volume>
          <issue>6 Suppl</issue>
          <fpage>S106</fpage>
          <lpage>S113</lpage>
          <pub-id pub-id-type="doi">10.1097/MLR.0b013e3181de9e17</pub-id>
          <pub-id pub-id-type="medline">20473190</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Manna</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Biswas</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kundu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rakshit</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Barman</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A statistical approach to predict flight delay using gradient boosted decision tree</article-title>
          <year>2017</year>
          <conf-name>International Conference on Computational Intelligence in Data Science (ICCIDS)</conf-name>
          <conf-date>June 2-7, 2017</conf-date>
          <conf-loc>Chennai</conf-loc>
          <pub-id pub-id-type="doi">10.1109/iccids.2017.8272656</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Abdollahi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Fuqua</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>de Carlo</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Bartholomai</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Balgemann</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>van Berkel</surname>
              <given-names>VH</given-names>
            </name>
            <name name-style="western">
              <surname>Frieboes</surname>
              <given-names>HB</given-names>
            </name>
          </person-group>
          <article-title>Prediction of lung cancer patient survival via supervised machine learning classification techniques</article-title>
          <source>Int J Med Inform</source>
          <year>2017</year>
          <month>12</month>
          <volume>108</volume>
          <fpage>1</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29132615"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2017.09.013</pub-id>
          <pub-id pub-id-type="medline">29132615</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(17)30236-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC5726571</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Remaining useful life estimation in prognostics using deep convolution neural networks</article-title>
          <source>Reliab Eng Syst Saf</source>
          <year>2018</year>
          <month>04</month>
          <volume>172</volume>
          <fpage>1</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ress.2017.11.021</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Criminisi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shotton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Konukoglu</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <source>Decision Forests: A Unified Framework for Classification, Regression, Density Estimation, Manifold Learning and Semi-Supervised Learning</source>
          <year>2012</year>
          <publisher-loc>Norwell</publisher-loc>
          <publisher-name>Now Foundations and Trends</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Delen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kadam</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Predicting breast cancer survivability: a comparison of three data mining methods</article-title>
          <source>Artif Intell Med</source>
          <year>2005</year>
          <month>06</month>
          <volume>34</volume>
          <issue>2</issue>
          <fpage>113</fpage>
          <lpage>127</lpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2004.07.002</pub-id>
          <pub-id pub-id-type="medline">15894176</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(04)00101-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Comparison of three data mining models for predicting diabetes or prediabetes by risk factors</article-title>
          <source>Kaohsiung J Med Sci</source>
          <year>2013</year>
          <month>02</month>
          <volume>29</volume>
          <issue>2</issue>
          <fpage>93</fpage>
          <lpage>99</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1607-551X(12)00217-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.kjms.2012.08.016</pub-id>
          <pub-id pub-id-type="medline">23347811</pub-id>
          <pub-id pub-id-type="pii">S1607-551X(12)00217-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <article-title>Greedy function approximation: a gradient boosting machine</article-title>
          <source>Ann Stat</source>
          <year>2001</year>
          <volume>29</volume>
          <issue>5</issue>
          <fpage>1189</fpage>
          <lpage>1232</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://projecteuclid.org/journals/annals-of-statistics/volume-29/issue-5/Greedy-function-approximation-A-gradient-boosting-machine/10.1214/aos/1013203451.full"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nohara</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wakata</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nakashima</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nakamura</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Machine learning based prediction of non-communicable diseases to improving intervention program in Bangladesh</article-title>
          <source>Eur J Biomed Inform</source>
          <year>2018</year>
          <volume>14</volume>
          <issue>4</issue>
          <fpage>20</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.24105/ejbi.2018.14.4.5</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
