<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JD</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Diabetes</journal-id>
      <journal-title>JMIR Diabetes</journal-title>
      <issn pub-type="epub">2371-4379</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i2e34681</article-id>
      <article-id pub-id-type="pmid">35576579</article-id>
      <article-id pub-id-type="doi">10.2196/34681</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Review</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Identifying Patients With Hypoglycemia Using Natural Language Processing: Systematic Literature Review</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mizokami-Stout</surname>
            <given-names>Kara</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Griauzde</surname>
            <given-names>Dina</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Elbattah</surname>
            <given-names>Mahmoud</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ren</surname>
            <given-names>Ziyou</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Suominen</surname>
            <given-names>Hanna</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Rastmanesh</surname>
            <given-names>Reza</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Zheng</surname>
            <given-names>Yaguang</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Rory Meyers College of Nursing</institution>
            <institution>New York University</institution>
            <addr-line>433 1st Avenue</addr-line>
            <addr-line>New York, NY, 10010</addr-line>
            <country>United States</country>
            <phone>1 212 998 5170</phone>
            <email>yaguang.zheng@nyu.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8400-1398</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Dickson</surname>
            <given-names>Victoria Vaughan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6673-1960</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Blecker</surname>
            <given-names>Saul</given-names>
          </name>
          <degrees>MHS, MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4460-1046</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Ng</surname>
            <given-names>Jason M</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6733-0176</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Rice</surname>
            <given-names>Brynne Campbell</given-names>
          </name>
          <degrees>MA, MSLIS, MS</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4396-9378</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Melkus</surname>
            <given-names>Gail D’Eramo</given-names>
          </name>
          <degrees>EdD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5859-4118</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Shenkar</surname>
            <given-names>Liat</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4717-7239</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Mortejo</surname>
            <given-names>Marie Claire R</given-names>
          </name>
          <degrees>BSN</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2439-9135</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Johnson</surname>
            <given-names>Stephen B</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7663-4355</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Rory Meyers College of Nursing</institution>
        <institution>New York University</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Population Health</institution>
        <institution>Grossman School of Medicine</institution>
        <institution>New York University</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Division of Endocrinology and Metabolism</institution>
        <institution>Department of Medicine</institution>
        <institution>University of Pittsburgh</institution>
        <addr-line>Pittsburgh, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Division of Libraries</institution>
        <institution>New York University</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Lehigh Valley Health Network</institution>
        <institution>Lehigh Valley Reilly Children’s Hospital</institution>
        <addr-line>Allentown, PA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Yaguang Zheng <email>yaguang.zheng@nyu.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Apr-Jun</season>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>16</day>
        <month>5</month>
        <year>2022</year>
      </pub-date>
      <volume>7</volume>
      <issue>2</issue>
      <elocation-id>e34681</elocation-id>
      <history>
        <date date-type="received">
          <day>3</day>
          <month>11</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>19</day>
          <month>1</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>3</day>
          <month>4</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>8</day>
          <month>4</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Yaguang Zheng, Victoria Vaughan Dickson, Saul Blecker, Jason M Ng, Brynne Campbell Rice, Gail D’Eramo Melkus, Liat Shenkar, Marie Claire R Mortejo, Stephen B Johnson. Originally published in JMIR Diabetes (https://diabetes.jmir.org), 16.05.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Diabetes, is properly cited. The complete bibliographic information, a link to the original publication on https://diabetes.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://diabetes.jmir.org/2022/2/e34681" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Accurately identifying patients with hypoglycemia is key to preventing adverse events and mortality. Natural language processing (NLP), a form of artificial intelligence, uses computational algorithms to extract information from text data. NLP is a scalable, efficient, and quick method to extract hypoglycemia-related information when using electronic health record data sources from a large population.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The objective of this systematic review was to synthesize the literature on the application of NLP to extract hypoglycemia from electronic health record clinical notes.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Literature searches were conducted electronically in PubMed, Web of Science Core Collection, CINAHL (EBSCO), PsycINFO (Ovid), IEEE Xplore, Google Scholar, and ACL Anthology. Keywords included <italic>hypoglycemia</italic>, <italic>low blood glucose</italic>, <italic>NLP</italic>, and <italic>machine learning</italic>. Inclusion criteria included studies that applied NLP to identify hypoglycemia, reported the outcomes related to hypoglycemia, and were published in English as full papers.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>This review (n=8 studies) revealed heterogeneity of the reported results related to hypoglycemia. Of the 8 included studies, 4 (50%) reported that the prevalence rate of any level of hypoglycemia was 3.4% to 46.2%. The use of NLP to analyze clinical notes improved the capture of undocumented or missed hypoglycemic events using International Classification of Diseases, Ninth Revision (ICD-9), and International Classification of Diseases, Tenth Revision (ICD-10), and laboratory testing. The combination of NLP and ICD-9 or ICD-10 codes significantly increased the identification of hypoglycemic events compared with individual methods; for example, the prevalence rates of hypoglycemia were 12.4% for International Classification of Diseases codes, 25.1% for an NLP algorithm, and 32.2% for combined algorithms. All the reviewed studies applied rule-based NLP algorithms to identify hypoglycemia.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The findings provided evidence that the application of NLP to analyze clinical notes improved the capture of hypoglycemic events, particularly when combined with the ICD-9 or ICD-10 codes and laboratory testing.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>hypoglycemia</kwd>
        <kwd>natural language processing</kwd>
        <kwd>electronic health records</kwd>
        <kwd>diabetes</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Approximately 34 million (13%) US adults have diabetes [<xref ref-type="bibr" rid="ref1">1</xref>]. Worldwide, 387 million persons have diabetes, a number that is expected to rise to 592 million by 2035 [<xref ref-type="bibr" rid="ref2">2</xref>]. In 2017, direct and indirect costs attributed to diabetes in the United States were estimated to be US $327 billion [<xref ref-type="bibr" rid="ref3">3</xref>]. Optimal glycemic control (glycated hemoglobin [HbA<sub>1c</sub>] &#60;7%) can be achieved with comprehensive antidiabetic treatment; however, the risk of hypoglycemia increases. In patients with type 2 diabetes (T2D), after experiencing hypoglycemia, the 3-year incidence of cardiovascular events was 35.1%, and mortality 28.3% to 31.9% [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>].</p>
        <p>The incidence of hypoglycemia has been reported to vary widely for patients with diabetes. An earlier systematic review and meta-analysis of 46 studies found that 45% of the patients with T2D had mild or moderate hypoglycemia and 6% had severe hypoglycemia; the prevalence was even higher among those treated with insulin, with 50% having mild or moderate hypoglycemia events and 21% having severe events [<xref ref-type="bibr" rid="ref6">6</xref>]. A subsequent review study showed that the rates of severe hypoglycemia in T2D were between 0.7 and 12 per 100 person-years in randomized controlled trials and between 0.2 (without treatment with insulin or sulfonylureas) and 2 (with treatment with insulin or sulfonylureas) per 100 person-years [<xref ref-type="bibr" rid="ref7">7</xref>]. The most recent systematic review and meta-analysis of 72 studies indicated that the incidence rate of hypoglycemia was 14.5 to 42,890 episodes per 1000 person-years in type 1 diabetes (T1D) and 0.072 to 16,360 episodes per 1000 person-years in T2D [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
        <p>The reported rates of hypoglycemia vary largely because of the marked heterogeneity in the way that hypoglycemia is defined, measured, and reported. Accurately identifying patients with hypoglycemia is key to preventing adverse events and mortality. There are several methods to identify hypoglycemia events and severity in large populations, including patient questionnaires and International Classification of Diseases, Ninth Revision (ICD-9), or International Classification of Diseases, Tenth Revision (ICD-10), and electronic health records (EHRs). Studies have found that using questionnaires [<xref ref-type="bibr" rid="ref9">9</xref>] or International Classification of Diseases (ICD) codes [<xref ref-type="bibr" rid="ref10">10</xref>] is often insensitive, leads to underestimation of hypoglycemia events, and is nonspecific in detecting hypoglycemia events.</p>
        <p>EHRs have been widely adopted by health care systems, resulting in large amounts of data, including unstructured text in clinical notes [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. The amount of unstructured text is vast and continues to grow at a breakneck pace. Clinical notes enable health care providers to not only identify patients at risk of hypoglycemia but also to obtain details on hypoglycemia; for example, symptomatic or asymptomatic hypoglycemia [<xref ref-type="bibr" rid="ref13">13</xref>]. Once the patients at risk of hypoglycemia are identified, their treatment can be personalized, which helps to prevent future hypoglycemia and the resulting serious adverse effects. Traditional methods such as manual chart review can extract information related to hypoglycemia from EHR clinical notes [<xref ref-type="bibr" rid="ref14">14</xref>]; however, such methods are time-consuming, labor intensive, and not scalable, which makes them impractical for use in large populations [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
        <p>By contrast, novel data science approaches, including using natural language processing (NLP), have been applied to overcome the aforementioned difficulties [<xref ref-type="bibr" rid="ref16">16</xref>]. NLP, a form of artificial intelligence, uses computational algorithms to process human language content for a variety of purposes [<xref ref-type="bibr" rid="ref17">17</xref>]. The application of NLP algorithms is a scalable, efficient, and quick method to extract unstructured data from a large population [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Applications of NLP in the health domain can be categorized into 2 groups: rule-based methods and machine learning methods [<xref ref-type="bibr" rid="ref20">20</xref>]. Rule-based NLP techniques are based on a predefined clinical vocabulary, which identifies a set of core concepts for target extraction (eg, hypoglycemia), and may also use pattern matching (such as regular expressions) and filters [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Rule-based systems are time-consuming to set up, but they are easy to understand and modify and often require fewer amounts of data than machine learning approaches [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Machine learning systems leverage the same feature sets as those used in rule-based systems but do the work to discover the rules needed for a solution; however, this comes at a price: the resulting systems often function as a <italic>black box</italic>, which is difficult for humans to understand and trust [<xref ref-type="bibr" rid="ref20">20</xref>]. In addition, machine learning systems typically require very large sample sizes for development [<xref ref-type="bibr" rid="ref23">23</xref>]. Deep learning approaches (neural networks) are a form of machine learning used in recent years [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>], which can achieve performances comparable with, or better than, those of domain experts in identifying clinical information [<xref ref-type="bibr" rid="ref16">16</xref>]. However, deep learning–based models require large amounts of training data to achieve high accuracy, hindering the adoption of deep learning–based models in scenarios with limited amounts of training data [<xref ref-type="bibr" rid="ref27">27</xref>]. As a result, state-of-the-art deep learning methods of NLP (eg, transformer models and transfer learning) were developed to address these issues, and they have been proven to be extremely effective in the NLP domain [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>].</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>Currently, little is known about what types of NLP algorithms were applied to identify hypoglycemia and how differences in hypoglycemia incidence identified from unstructured data using NLP compare with hypoglycemia incidence identified from structured data (eg, ICD codes) across studies. It was reported in 1 study that a higher number of hypoglycemia events could be identified in clinical notes by using NLP than by using ICD codes (65% vs 20%, respectively) [<xref ref-type="bibr" rid="ref29">29</xref>]. Thus, in this systematic review, we aimed to synthesize the literature on the application of NLP to extract hypoglycemia from EHR clinical notes and compare the differences between hypoglycemia incidence identified from unstructured data using NLP and hypoglycemia incidence identified from structured data (eg, ICD codes) across studies.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Search Strategies</title>
        <p>Literature searches for a comprehensive review were conducted in 7 electronic databases: PubMed, Web of Science Core Collection, CINAHL (EBSCO), PsycINFO (Ovid), IEEE Xplore, Google Scholar, and ACL Anthology. The search strategies were developed in consultation with a health sciences librarian (BCR). The searches were conducted before February 22, 2022. Database-specific subject headings (eg, Medical Subject Headings) and relevant keywords were identified to describe hypoglycemia and these terms were searched in combination with terms related to NLP. As few articles related to hypoglycemia and NLP were located, the searches were widened to include broader terms such as <italic>blood sugar</italic> or <italic>blood glucose</italic>, and <italic>machine learning</italic> or <italic>artificial intelligence</italic>. No date, language, or publication filters were applied within the databases. Appropriate Boolean operators were used to structure the search queries and both unqualified free-text searching and field tags were used; the detailed search queries for each database are presented in <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>.</p>
        <boxed-text id="box1" position="float">
          <title>Search strategies for hypoglycemia and natural language processing.</title>
          <p>
            <bold>PubMed</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>((<italic>Hypoglycemia</italic> [MeSH]) OR <italic>Blood Glucose</italic> [MeSH] OR <italic>hypoglycemi*</italic> [TW] OR <italic>blood sugar*</italic> [TW] OR <italic>blood glucose</italic> [TW]) AND ((((Natural Language Processing [MeSH]) OR <italic>Machine Learning</italic> [MeSH]) OR <italic>Artificial Intelligence</italic> [MeSH]) OR <italic>Data Mining</italic> [MeSH:noexp] OR <italic>NLP</italic> [TW] OR <italic>natural language processing</italic> [TW] OR <italic>machine learning</italic> [TW] OR <italic>artificial intelligence</italic> [TW] OR <italic>text mine</italic> [TW] OR <italic>text analys*</italic> [TW] OR <italic>text processing</italic> [TW] OR <italic>text classif*</italic> [TW] OR <italic>information extraction</italic> [TW] OR ((electronic health record* [TW]) AND (<italic>diagnos*</italic> [TW])))</p>
            </list-item>
          </list>
          <p>
            <bold>Web of Science</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>TS=(<italic>hypoglycemi*</italic> OR (<italic>blood NEAR/3 sugar</italic>) OR (<italic>blood NEAR/3 glucose</italic>)) AND TS=((<italic>“Natural Language Processing”</italic> OR <italic>NLP</italic> OR <italic>“Machine Learning”</italic> OR <italic>“Artificial Intelligence”</italic> OR (<italic>“text mining”</italic> OR <italic>“text mine”</italic> OR <italic>“text analys*”</italic> OR <italic>“text* analyst”</italic> OR <italic>“text* processing”</italic> OR <italic>“text classif*”</italic> OR <italic>“information extraction”)</italic> OR ((<italic>electronic health record*</italic> OR <italic>electronic medical record*</italic> OR <italic>electronic patient record*</italic>) AND <italic>diagnos*</italic>)))</p>
            </list-item>
            <list-item>
              <p>Document type: article</p>
            </list-item>
            <list-item>
              <p>Language: English</p>
            </list-item>
          </list>
          <p>
            <bold>CINAHL</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>((MH “<italic>Hypoglycemia</italic>”) OR (MH “<italic>Blood Glucose”</italic>) OR (<italic>hypoglycemi*</italic> OR <italic>“blood glucose”</italic> OR <italic>“blood sugar”</italic>)) AND (( (MH “<italic>Natural Language Processing</italic>”) OR <italic>“natural language processing”</italic> OR (MH “<italic>Artificial Intelligence</italic>+”) OR (MH “<italic>Data Mining”</italic>) OR (MH “<italic>Machine Learning</italic>+”) OR “<italic>text mining”</italic> OR “<italic>text analysis”</italic> OR “<italic>text processing”</italic> OR <italic>text classif*</italic> OR “<italic>information extraction”</italic> ) OR ( ((“<italic>electronic health record”</italic> OR “<italic>electronic medical record”</italic> OR “<italic>electronic patient record”</italic> OR “<italic>electronic health records”</italic> OR “<italic>electronic medical records</italic>” OR “<italic>electronic patient records”</italic> OR <italic>EHR</italic> OR <italic>EMR</italic>) N3 <italic>diagnos</italic>*) ))</p>
            </list-item>
          </list>
          <list list-type="bullet">
            <list-item>
              <p>Language: English</p>
            </list-item>
          </list>
          <p>
            <bold>PsycINFO (Ovid)</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>(<italic>hypoglycemi*.mp.</italic> or <italic>exp Hypoglycemia/ or blood sugar.mp.</italic> or <italic>exp Blood Sugar/ or blood glucose.mp.)</italic> AND <italic>(natural language processing.mp.</italic> or <italic>exp Natural Language Processing/</italic> or <italic>machine learning.mp.</italic> or <italic>exp Machine Learning/</italic> or <italic>artificial intelligence.mp.</italic> or <italic>exp Artificial Intelligence/</italic> or <italic>text mining.mp.</italic> or <italic>text processing.mp.</italic> or <italic>text classif*.mp.</italic> or <italic>information extraction.mp.</italic> or <italic>((exp Electronic Health Records/</italic> or <italic>electronic health record.mp.</italic> or <italic>electronic medical record.mp.</italic> or <italic>electronic patient record.mp.)</italic> and <italic>(exp Diagnosis/</italic> or <italic>diagnos*.mp.)))</italic></p>
            </list-item>
          </list>
          <p>
            <bold>ACL Anthology</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p><italic>hypoglycemia</italic> OR <italic>blood glucose</italic> OR <italic>blood sugar</italic> OR <italic>hypoglycemic</italic></p>
            </list-item>
          </list>
          <p>
            <bold>Google Scholar</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p><italic>natural language processing</italic> AND <italic>hypoglycemia</italic> AND <italic>electronic health records</italic></p>
            </list-item>
          </list>
          <p>
            <bold>IEEE Xplore</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>(<italic>All Metadata:blood sugar</italic> OR <italic>All Metadata:blood glucose</italic> OR <italic>All Metadata:hypoglycemia</italic> OR <italic>All Metadata:hypoglycemic)</italic> AND (<italic>All Metadata:natural language processing</italic> OR <italic>All Metadata:NLP</italic> OR <italic>All Metadata:“machine learning”</italic> OR <italic>All Metadata:“artificial intelligence”</italic> OR <italic>All Metadata:“text mining”</italic> OR <italic>All Metadata:“text analysis”</italic> OR <italic>All Metadata:“text analyses”</italic> OR <italic>All Metadata:“text analytics”</italic> OR <italic>All Metadata:“text processing”</italic>)</p>
            </list-item>
            <list-item>
              <p>Filters applied: journals</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Inclusion and Exclusion Criteria</title>
        <p>The inclusion criteria were as follows: studies that (1) were restricted to participants aged ≥18 years; (2) reported a sample with a diagnosis of diabetes; (3) applied NLP to identify hypoglycemia; (4) reported the number or percentage of participants who had experienced at least one hypoglycemic episode, the incidence of hypoglycemic episodes experienced, or data to allow the calculation of one of these measures; (5) used EHR data; (6) were published as full papers in peer-reviewed journals; (7) were published in English. No restrictions were applied regarding the definition or measurement of hypoglycemia. No restrictions were applied to country or origin of the studies. Studies were excluded if (1) they did not report outcomes related to hypoglycemia, (2) they were pharmacological trials or the intervention focused on treatment or care, (3) the participants were all pregnant or children, and (4) they reported only conference papers or proceedings.</p>
      </sec>
      <sec>
        <title>Data Extraction</title>
        <p>We first developed and tested a data extraction form, with adaptations made accordingly. The titles, abstracts, and full-text articles were screened by 2 independent reviewers (MCRM, LS, Emily M Pan, or Yi Lan Zhang). Once conflicts were identified, agreement was reached after discussion with the third reviewer (YZ). The results related to the identification of eligible studies were summarized according to the PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) guidelines (<xref rid="figure1" ref-type="fig">Figure 1</xref>). The searches yielded 2070 citations, and after removing duplicates, 1705 (82.37%) titles and abstracts were screened for eligibility. After full-text retrieval of 334 potentially relevant papers, 326 (97.6%) were subsequently excluded, leaving 8 (2.4%) papers that applied NLP to identify hypoglycemia and reported the rates of hypoglycemia that were eligible for inclusion in the analyses. The reference sections of the relevant articles were searched manually, but no further relevant articles were found. Studies were summarized based on the following categories: authors and country, sample size and characteristics, medical conditions, antihyperglycemic medication, study design, data source, definition of hypoglycemia, method used to identify hypoglycemia, NLP algorithm (eg, rule-based or machine learning), NLP algorithm validation, and outcomes (<xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) flowchart. In the case of Google Scholar, the first 100 results based on relevancy ranking is suggested to identify additional articles, and in the case of ACL Anthology, all the citations found were added to the irrelevant set (excluded based on title and abstract) [<xref ref-type="bibr" rid="ref30">30</xref>]. NLP: natural language processing.</p>
          </caption>
          <graphic xlink:href="diabetes_v7i2e34681_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary of studies on natural language processing (NLP) and hypoglycemia.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="250"/>
            <col width="250"/>
            <col width="200"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td>Author, year, country</td>
                <td>Sample characteristics</td>
                <td>Medical conditions</td>
                <td>Antihyperglycemic medication</td>
                <td>Study design</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Nunes et al, 2016 [<xref ref-type="bibr" rid="ref31">31</xref>], United States</td>
                <td>N=844,683; age (years; n [%]): &#60;30: 10,138 (1.20), 30 to 39: 38,491 (4.56), 40 to 49: 105,476 (12.49), 50 to 59: 196,494 (23.26), 60 to 69: 232,885 (27.57), &#62;69: 261,199 (30.92); female (n [%]): 433,322 (51.30); White (n [%]): 655,474 (77.60); T2D<sup>a</sup> (n [%]): 844,683 (100); baseline measures, mean (SD): BMI (kg/m<sup>2</sup>): 31.8 (10.2), HbA<sub>1c</sub><sup>b</sup> (%): 7.0 (1.9), blood glucose level (mg/dL): 139.0 (82)</td>
                <td>Atrial fibrillation (n [%]): 60,773 (7.19); hypertension (n [%]): 555,482 (65.76); hyperlipidemia (n [%]): 510,944 (60.49); cerebrovascular disease (n [%]): 54,336 (6.43); chronic kidney disease: retinopathy (n [%]): 10,356 (1.23), neuropathy (n [%]): 44,352 (5.25), nephropathy (n [%]): 26,498 (3.14); ischemic heart disease (n [%]): 154,049 (18.24); congestive heart failure (n [%]): 59,438 (7.04)</td>
                <td>Not specified</td>
                <td>Retrospective cohort study</td>
              </tr>
              <tr valign="top">
                <td>Nunes et al 2017 [<xref ref-type="bibr" rid="ref29">29</xref>], United States</td>
                <td>N=143,635; age (years; n [%]): &#60;30: 1333 (0.93), 30 to 39: 5420 (3.77), 40 to 49: 15,645 (10.89), 50 to 59: 32,796 (22.83), 60 to 69: 39,852 (27.75), &#62;69: 48,491 (33.76); female (n [%]): 69,879 (48.65); White (n [%]): 116,701 (81.25); T2D (n [%]): 143,635 (100); baseline measures (median [IQR]): BMI (kg/m<sup>2</sup>): 32.3 (28.1-37.6), HbA<sub>1c</sub> (%): 7.1 (6.5-8.1), blood glucose level (mg/dL): 146.0 (116.0-191.0)</td>
                <td>N=143,635; cerebrovascular disease (n [%]): 11,903 (8.29); retinopathy (n [%]): 3091 (2.15); neuropathy (n [%]): 12,961 (9.02); nephropathy (n [%]): 8338 (5.80); ischemic heart disease (n [%]): 33,570 (23.37)</td>
                <td>N=143,635; sulfonylureas (n [%]): 143,635 (100)</td>
                <td>Retrospective cohort study</td>
              </tr>
              <tr valign="top">
                <td>Loughlin et al, 2018 [<xref ref-type="bibr" rid="ref32">32</xref>], United States</td>
                <td>N=6024; EQW<sup>c</sup> cohort (n [%]): 2008 (33.33%); age (years): —<sup>d</sup>; female (n [%]): 1004 (50); White (n [%]): 1630 (81.17); T2D (n [%]): 2008 (100); baseline measures: —; BI<sup>e</sup> cohort (n [%]): 4016 (66.67%); age (years): —; female (n [%]): 2036 (50.70); White (n [%]): 3277 (81.60); T2D (n [%]): 4016 (100); baseline measures: —</td>
                <td>—</td>
                <td>N=6024; insulin (n [%]): 6024 (100)</td>
                <td>Retrospective cohort study</td>
              </tr>
              <tr valign="top">
                <td>Pettus et al, 2019 [<xref ref-type="bibr" rid="ref33">33</xref>], United States</td>
                <td>N=831,456; BI switchers (n=3920 to 19,256); age (years): range 58.2-60.1; female (%): range 49.8-52.0; White (%): —; T2D: (831,456, 100%); baseline measures: BMI (kg/m<sup>2</sup>): range 33.8-35.0; HbA<sub>1c</sub> (%): range 8.91-9.02; blood glucose level (mg/dL): —; smoking (%): —. Insulin naïve (n=2279 to 47,085); age (years): range 58.8-60.4; female (%): range 48.6-52.1; White (%): —; T2D (n [%]): (100); baseline measures: BMI (kg/m<sup>2</sup>): range 34.0-34.6; HbA<sub>1c</sub> (%): range 9.39-9.64; blood glucose level (mg/dL): —; smoking (%): —</td>
                <td>BI switchers: hypertension: 63.4-73.4, hyperlipidemia: 68.1-77.8, microvascular complication: 44.7-55.7, macrovascular complication: 44.2-63.5. Insulin naïve: hypertension: 56.8-74.2; hyperlipidemia: 61.5-77.8, microvascular complication: 25.3-34.6, macrovascular complication: 32.7-63.5</td>
                <td>BI switchers: sulfonylureas: 24.5-28.3; any OAD<sup>f</sup>: 63.6- 75.2. Insulin naïve: sulfonylureas: 47.6-56.6;</td>
                <td>Retrospective cohort study</td>
              </tr>
              <tr valign="top">
                <td>Li et al, 2019 [<xref ref-type="bibr" rid="ref34">34</xref>], United States</td>
                <td>N=38,780; age (years), mean: 57.0; female (n [%]): 21,716 (56); White (%): 18,226 (47); T2D (%): —; baseline measures: BMI (kg/m<sup>2</sup>), mean (SD): 35.7 (9.8); HbA<sub>1c</sub> (n [%]): ≤6.5%: 5321 (13.72), &#62;6.5% to &#60;7%: 1840 (4.74), ≥7% to &#60;8%: 3155 (8.14), ≥8% to &#60;9%: 1773 (4.57), ≥9%: 3977 (10.26), missing: 22,714 (58.57)</td>
                <td>N=38,780; coronary artery disease (n [%]): 2021 (5.21); chronic heart failure (n [%]): 1582 (4.08); diabetic neuropathy (n [%]): 1414 (3.65)</td>
                <td>N=38,780; long-acting insulin (LAI<sup>g</sup>): 615 (1.59); sulfonylureas: 8727 (22.50)</td>
                <td>Retrospective cohort study</td>
              </tr>
              <tr valign="top">
                <td>Misra-Hebert et al, 2020 [<xref ref-type="bibr" rid="ref35">35</xref>], United States</td>
                <td>N=204,517; the values provided herein are from a subsample: (n=46,302); age (years): 61.48; female (%):22,633 (48.90); White (%):34,004 (73.40); T2D (n [%]):46,302 (100); baseline measures: BMI (kg/m<sup>2</sup>): 32.2; HbA<sub>1c</sub> (%): 6.6; blood glucose level (mg/dL): —</td>
                <td>n=46,302; cardiovascular disease (n [%]): 13,372 (28.9); congestive heart failure (n [%]): 2195 (4.7); chronic kidney disease (n [%]): 2460 (5.3)</td>
                <td>n=46,302; insulin (n [%]): 8050 (17.4); glucagon-like peptide-1 receptor agonist (n [%]): 1781 (3.8); dipeptidyl peptidase 4: 4437 (9.6); sodium-glucose cotransporter-2 inhibitor (n [%]): 791 (1.7); metformin: 28,851 (62.3); sulfonylureas (n [%]): 10,098 (21.8); alpha-glucosidase inhibitor (n [%]): 107 (0.2)</td>
                <td>Retrospective cohort study</td>
              </tr>
              <tr valign="top">
                <td>Uzoigw et al 2020 [<xref ref-type="bibr" rid="ref36">36</xref>], United States</td>
                <td>N=359,087; T2D (n [%]): 317,399 (88.39); age (years), median (IQR): 68.0 (18); female (n [%]): 154,512 (48.68); White (%):121,468 (38.27); baseline measures: BMI (kg/m<sup>2</sup>): —; HbA<sub>1c</sub> (%): —; blood glucose level (mg/dL): —; smoking (n [%]):106,760 (33.63). T1D<sup>h</sup>: (n [%]): 41,688 (11.61); age (years): median (IQR) 55.0 (30); female (n [%]): 21,034 (50.46); White (n [%]): 16,072 (38.55); baseline measures: BMI (kg/m<sup>2</sup>): —; HbA<sub>1c</sub> (%): —; blood glucose level (mg/dL): —; smoking (n [%]): 9174 (22)</td>
                <td>T2D: N=317,399; hypertension (n [%]): 257,093 (81); hyperlipidemia (n [%]): 193,616 (61); cardiovascular disease (n [%]): 158,699 (50). T1D: N=41,688; high blood sugar level or diabetic ketoacidosis (n [%]): 14,067 (33.74); cancer (n [%]): 6752 (16.20); stroke (n [%]): 7377 (17.70); substance use or abuse (n [%]): 4917 (11.79)</td>
                <td>T2D: N=317,399; insulin (n [%]): 174,569 (55); sulfonylureas (n [%]): 55,710 (17.55); metformin (n [%]): 114,263(36). T1D: N=41,688; insulin (n [%]): 37,279 (89.42); sulfonylureas (n [%]): 1846 (4.43); metformin (n [%]): 5059 (12.14)</td>
                <td>Retrospective cohort study</td>
              </tr>
              <tr valign="top">
                <td>Ganz et al 2014 [<xref ref-type="bibr" rid="ref37">37</xref>], United States</td>
                <td>N=7235; HbA<sub>1c</sub> (%): —; blood glucose level (mg/dL): —; smoking (%): —; T2D (n [%]): 7235 (100); age (years), mean (SD): 60.82 (11.65); female (n [%]): 3668 (50.70); White (n [%]): 4576 (63.25); baseline measures: BMI (kg/m<sup>2</sup>): —; HbA<sub>1c</sub> (%): —; blood glucose level (mg/dL): —; smoking (%): —</td>
                <td>T2D (n [%]): 7235 (100)</td>
                <td>Insulin: glargine (%): 77.24; neutral protamine Hagedorn insulin (%): 5.86; detemir (%): 16.90. Sulfonylureas (%): 38.06; metformin (%): 36.66; other OADs (%): 25.82</td>
                <td>Retrospective cohort study</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>T2D: type 2 diabetes.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>HbA<sub>1c</sub>: glycated hemoglobin.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>EQW: exenatide once weekly.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>Not available.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>BI: basal insulin.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>OAD: oral antidiabetic drug.</p>
            </fn>
            <fn id="table1fn7">
              <p><sup>g</sup>LAI: long-acting insulin.</p>
            </fn>
            <fn id="table1fn8">
              <p><sup>h</sup>T1D: type 1 diabetes.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Summary of studies on natural language processing (NLP) and hypoglycemia.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="90"/>
            <col width="160"/>
            <col width="160"/>
            <col width="130"/>
            <col width="140"/>
            <col width="140"/>
            <col width="180"/>
            <thead>
              <tr valign="top">
                <td>Author, year, country</td>
                <td>Data source</td>
                <td>Definition of hypoglycemia</td>
                <td>Method used to identify hypoglycemia</td>
                <td>NLP algorithm: rule-based or machine learning</td>
                <td>NLP algorithm validation</td>
                <td>Outcomes</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Nunes et al, 2016 [<xref ref-type="bibr" rid="ref31">31</xref>], United States</td>
                <td>Optum Humedica EHR<sup>a</sup> database, which incorporates EHRs from 35 large medical provider organizations (including &#62;195 hospitals), &#62;25,000 physicians, and &#62;25 million patients, making up the largest EHR database within the United States (January 2009 to March 2014)</td>
                <td>Serious: ICD-9<sup>b</sup> identified events were characterized as serious or nonserious if the diagnosis was identified within a problem list; NLP-identified categories included serious (eg, serious, acute, severe, and profound); mild to moderate: NLP-identified categories included mild to moderate (eg, mild, moderate, slight, and minor)</td>
                <td>ICD-9 algorithm (structured diagnostic codes only); NLP algorithm (NLP of clinical notes); combined algorithm (either ICD-9 diagnostic codes or NLP of clinical notes)</td>
                <td>Rule-based</td>
                <td>The final algorithm was validated by manual review: precision (PPV<sup>c</sup>)=0.77, recall (sensitivity)=0.67</td>
                <td>Period prevalence (%): any conditions: ICD-9: 12.37, NLP: 25.11, combined: 32.19; serious: ICD-9: 11.93, NLP: 10.71, combined: 18.72; mild to moderate: ICD-9: 0.00, NLP: 0.76, combined: 0.78. Incidence rate (per 100 person-years): any conditions: ICD-9: 2.25, NLP: 4.78, combined: 6.28. Serious: ICD-9: 2.12, NLP: 1.72, combined: 3.19; mild to moderate: ICD-9: 0.00, NLP: 0.09, combined: 0.08. Event rate (per 100 person-years): any conditions: ICD-9: 6.92, NLP: 10.03, combined: 16.12; serious: ICD-9: 6.63, NLP: 3.06, combined: 8.90; mild to moderate: ICD-9: 0.00, NLP: 0.20, combined: 0.19</td>
              </tr>
              <tr valign="top">
                <td>Nunes et al, 2017 [<xref ref-type="bibr" rid="ref29">29</xref>], United States</td>
                <td>Optum EHR database (January 2009 to December 2014)</td>
                <td>Serious: ICD<sup>d</sup> and CPT<sup>e</sup> evidence of medical intervention or abstracted descriptors suggestive of serious event; nonserious, mild to moderate: No ICD or CPT evidence of medical intervention but with abstracted descriptors suggestive of mild to moderate event; nonserious, unspecified: no ICD or CPT evidence of medical intervention and no descriptors of event seriousness</td>
                <td>ICD codes and NLP</td>
                <td>Rule-based</td>
                <td>The final algorithm was validated by manual review: precision (PPV)=0.77, recall (sensitivity)=0.67</td>
                <td>Incidence rate (per 100 person-years; 95% CI): any conditions: overall: 11.76 (11.49-12.04), sulfonylureas use: 12.77 (12.40-13.15), sulfonylureas nonuse: 10.39 (10.00-10.79). Serious: overall: 5.06 (4.88-5.24), sulfonylureas use: 5.77 (5.52-6.03), sulfonylureas nonuse: 4.09 (3.84-4.34). Nonserious, mild to moderate: overall: 0.14 (0.11-0.17), sulfonylureas use: 0.17 (0.13-0.22), sulfonylureas nonuse: 0.09 (0.06-0.13). Nonserious, unspecified: overall: 6.57 (6.37-6.78), sulfonylureas use: 6.83 (6.56-7.11), sulfonylureas nonuse: 6.21 (5.91-6.52)</td>
              </tr>
              <tr valign="top">
                <td>Loughlin et al, 2018 [<xref ref-type="bibr" rid="ref32">32</xref>], United States</td>
                <td>Optum EHR database (January 2012 to January 2015)</td>
                <td>Documented blood glucose level &#60;3.9 mmol/L or emergency physician–charted diagnosis of hypoglycemia</td>
                <td>Hypoglycemia and gastrointestinal symptoms (vomiting, nausea, diarrhea, or constipation) were identified by using both ICD-9 Clinical Modification diagnostic codes within structured fields and NLP clinical notes; hypoglycemia was identified using an algorithm developed by Optum, incorporated diagnostic codes, and NLP of clinical notes</td>
                <td>Rule-based</td>
                <td>The final algorithm was validated by manual review: precision (PPV)=0.77, recall (sensitivity)=0.67</td>
                <td>Incidence rate (per 1000 person-years; 95% CI): EQW<sup>f</sup> cohort: 52.5 (44.4-61.6), BI<sup>g</sup> cohort: 65.7 (59.1-72.7). Any gastrointestinal symptoms: EQW cohort: 225.5 (206.8-245.5), BI cohort: 191.0 (179.1-203.6). Participants with at least one event (n/N [%]): EQW cohort: 149/2008 (7.42), BI cohort: 368/4016 (9.16). Any gastrointestinal symptoms (n/N [%]): EQW cohort: 534/2008 (26.60), BI cohort: 946/4016 (23.56)</td>
              </tr>
              <tr valign="top">
                <td>Pettus et al, 2019 [<xref ref-type="bibr" rid="ref33">33</xref>], United States</td>
                <td>Optum Humedica EHR database (January 1, 2007, to March 31, 2017)</td>
                <td>Hypoglycemia: ICD-9 and ICD-10<sup>h</sup> codes for hypoglycemia; plasma glucose level measures ≤70 mg/dL; IM<sup>i</sup> glucagon administration; NLP: mention of hypoglycemia; severe hypoglycemia: ICD-9 and ICD-10 codes for hypoglycemia that is severe by default or ICD-9 and ICD-10 codes for hypoglycemia and hypoglycemia is reason for care on discharge or admission or hypoglycemia index date on same day as emergency department visit or inpatient diagnosis on admission (all related to hypoglycemic coma); plasma glucose level measures &#60;54 mg/dL; IM glucagon administration; NLP: mention of hypoglycemia with either a descriptor of hypoglycemia severity, including severity terms (eg, severe) and attributes (eg, emergency), or emergency department visit or inpatient admission on same day as medical record was written</td>
                <td>ICD-9 and ICD-10 codes; plasma glucose measures ≤70 mg/dL; IM glucagon administration; NLP</td>
                <td>Rule-based</td>
                <td>The final algorithm was validated by manual review: precision (PPV)=0.77, recall (sensitivity)=0.67</td>
                <td>Any hypoglycemia (%): BI switchers: 42.2-46.2. Insulin naïve: 22.8-28.8. Severe hypoglycemia: BI switchers: 8.2-17.4, insulin naïve: 2.7-8.6</td>
              </tr>
              <tr valign="top">
                <td>Li et al, 2019 [<xref ref-type="bibr" rid="ref34">34</xref>], United States</td>
                <td>Regenstrief Medical Record System, which is an urban safety-net medical institution in Indianapolis, Indiana, United States. In 2012, Eskenazi Health had 1081 physicians on staff and serviced 950,592 outpatient visits, including 234,637 community health center visits (January 1, 2004, to December 31, 2013)</td>
                <td>Plasma or point-of-care glucose value of at least 5 mg/dL and &#60;70 mg/dL, documented in the medical record; ICD-9 code: 251.1 or 251.2; ICD code 250.8 without any of the following codes: 259.8, 272.7, 681.xx, 682.x, 686.9, 707.1x, 707.2x, 707.8, 707.9, 709.3, 730.0x, 730.1x, 730.2x, 731.8; text note indicating hypoglycemia, including a blood glucose value</td>
                <td>Laboratory tests; diagnostic codes; NLP</td>
                <td>Rule-based</td>
                <td>—</td>
                <td>A 1-year window for prior episodes of hypoglycemia: overall prevalence (n/N [%]): 8182/38,780 (21); non-LAI<sup>j</sup> and sulfonylureas within 90 days (%): 42.92; sulfonylureas without insulin (%): 23.82; no insulin, no sulfonylureas (%): 17.85%; blood glucose value between 5 mg/dL and 70 mg/dL (n/N [%]): 7070/38,780 (18.23); blood glucose value&#60;54 mg/dL (n/N [%]): 4784/38,780 (12.34); NLP (n/N [%]): 3751/38,780 (9.67), with 539/38,780 (1.39), identified only by NLP</td>
              </tr>
              <tr valign="top">
                <td>Misra-Hebert et al, 2020 [<xref ref-type="bibr" rid="ref35">35</xref>], United States</td>
                <td>Cleveland Clinic Health System patient records (2005 to 2017)</td>
                <td>Hypoglycemia: blood glucose level &#60;70 mg/dL; severe hypoglycemia: patients with T2D<sup>k</sup> require hospitalization or emergency department visit; nonsevere hypoglycemia: does not require assistance for recovery</td>
                <td>NLP; ICD-9 codes: 251.0, 251.1, 251.2; ICD-10 codes: E08.641, E11.641, E11.649, E13.64, E13.641, E13.649, E16.0, E16.1, E15, E16.2</td>
                <td>Rule-based</td>
                <td>Compared with clinician chart review manually, PPV=93%</td>
                <td>Prevalence: among 204,517 patients with no codes for nonsevere hypoglycemia, evidence of nonsevere hypoglycemia was found in 7035 (3.4%) using NLP. Number of nonsevere hypoglycemia events: ICD codes (n/N [%]): 10,205/204,517 (4.99), NLP: 14,763/204,517 (7.22), with overlap of only 5 events. Incidence proportion of patients from 2005 to 2017 ICD codes (%): severe hypoglycemia: 0.3 to 1.7, nonsevere hypoglycemia: 0.4 to 1.3; NLP+ICD (%): nonsevere hypoglycemia: 0.8 to 2.6</td>
              </tr>
              <tr valign="top">
                <td>Uzoigw et al, 2020 [<xref ref-type="bibr" rid="ref36">36</xref>], United States</td>
                <td>Amplity Insights database, unstructured health records, generated from provider notes as transcribed from verbal to written form (January 1, 2016, to April 30, 2018)</td>
                <td>Nonsymptom-based: mention of hypoglycemia, low blood glucose level or blood glucose value≤70 mg/dL; symptom-based: keywords identified by endocrinologists, used by patients to describe hypoglycemia</td>
                <td>ICD codes; NLP</td>
                <td>Rule-based</td>
                <td>—</td>
                <td>Prevalence during 2 years (%): T2D: ICD: 52 (&#60;0.1); combined symptom and nonsymptom-based: 11.4; nonsymptom-based: 7.59; symptom-based: irritable or anxious: 14.50; cognitive issues: 12.14; elevated or irregular heart rate: 10.21. T1D<sup>l</sup>: ICD codes: 30 (0.1); combined symptom and nonsymptom-based: 20.4; nonsymptom-based: 18.12; symptom-based: irritable or anxious: 16.00; cognitive issues: 8.17; elevated or irregular heart rate: 8.17</td>
              </tr>
              <tr valign="top">
                <td>Ganz et al, 2014 [<xref ref-type="bibr" rid="ref37">37</xref>], United States</td>
                <td>Humedica real-time longitudinal clinical data patient-level EHR database (January 2008 to December 2011)</td>
                <td>Severe hypoglycemia: blood glucose level≤40 mg/dL</td>
                <td>ICD-9 codes 251.0x, 251.1x, 251.2x, or 250.3x on different days; NLP</td>
                <td>Rule-based</td>
                <td>The final algorithm was validated by manual review: precision (PPV)=0.77, recall (sensitivity)=0.67</td>
                <td>Posttitration follow-up period (1.8 years): incidence rate (per 100 patient-years; 95% CI)=4.63 (4.59-4.67); total severe hypoglycemia rate (per 100 patient-years)=9.69 (9.64-9.75). Incidence rate for patients with history of severe hypoglycemia events (95% CI)=5.91 (5.76-6.06). Total severe hypoglycemia rate for patients with history of severe hypoglycemia events (95% CI)=9.00 (8.87-9.12)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>EHR: electronic health record.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>ICD-9: International Classification of Diseases, Ninth Revision.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>PPV: positive predictive value.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>ICD: International Classification of Diseases.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>CPT: Current Procedures Terminology.</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>EQW: exenatide once weekly.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>BI: basal insulin.</p>
            </fn>
            <fn id="table2fn8">
              <p><sup>h</sup>ICD-10: International Classification of Diseases, Tenth Revision.</p>
            </fn>
            <fn id="table2fn9">
              <p><sup>i</sup>IM: intramuscular.</p>
            </fn>
            <fn id="table2fn10">
              <p><sup>j</sup>LAI: long-acting insulin.</p>
            </fn>
            <fn id="table2fn11">
              <p><sup>k</sup>T2D: type 2 diabetes.</p>
            </fn>
            <fn id="table2fn12">
              <p><sup>l</sup>T1D: type 1 diabetes.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Description of Included Studies</title>
        <p>All included studies (n=8) were conducted in the United States [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]. The sample sizes were large, ranging from 6024 to 844,683. Of the 8 studies, 6 (75%) included only T2D [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref37">37</xref>], 1 (13%) included both T1D and T2D [<xref ref-type="bibr" rid="ref36">36</xref>], and 1 (13%) did not specify the type of diabetes [<xref ref-type="bibr" rid="ref34">34</xref>]. The participants varied in age from 57 to 68 years, and 48.7% to 56% were women. Among the studies (7/8, 88%) that reported on ethnicity, the percentage of non-White participants ranged from 18.8% to 62%. Mean BMI ranged from 31.8 (SD 10.2) to 35.7 (SD 9.8) kg/m<sup>2</sup>, and mean HbA<sub>1c</sub> ranged from 6.6% to 9.64%. Varied comorbidities were reported; for example, hypertension, hyperlipidemia, ischemic heart disease, and heart failure. Of the 8 studies, 4 (50%) provided diabetes-related complications, including retinopathy, neuropathy, and nephropathy [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]; 6 (75%) reported that 1.6% to 100% of the participants injected insulin [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]; and 6 (75%) reported 4.4% to 100% sulfonylureas use [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref37">37</xref>].</p>
        <p>All the included studies (n=8) were retrospective cohort study designs, with the observational durations of the cohort ranging from 2 to 12 years. Population samples were obtained from varied EHR databases such as Optum Humedica [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref37">37</xref>], Regenstrief [<xref ref-type="bibr" rid="ref34">34</xref>], Cleveland Clinic Health System patient records [<xref ref-type="bibr" rid="ref35">35</xref>], and Amplity Insights [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      </sec>
      <sec>
        <title>Methods of Identifying Hypoglycemia</title>
        <p>All included studies used a combination of ICD codes and NLP to identify hypoglycemia; other methods were applied, including laboratory tests for plasma glucose measures ≤70 or &#60;54 mg/dL [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>] and glucagon administration [<xref ref-type="bibr" rid="ref33">33</xref>]. ICD-9 and ICD-10 codes used to identify hypoglycemia were described in detail by Misra-Hebert et al [<xref ref-type="bibr" rid="ref35">35</xref>]. Of the 8 studies, 3 (38%) reported both serious (level 3) and mild or moderate hypoglycemia (levels 1 and 2) [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref35">35</xref>], 1 (13%) reported both overall unspecified and severe hypoglycemia [<xref ref-type="bibr" rid="ref33">33</xref>], and 3 (38%) reported data on unspecified hypoglycemia [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>], whereas 2 (25%) studies also reported symptom-based and nonsymptom-based hypoglycemia [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      </sec>
      <sec>
        <title>NLP Algorithms Applied to Identify Hypoglycemia</title>
        <p>All included studies applied rule-based algorithms (<xref ref-type="table" rid="table3">Table 3</xref>). The study by Misra-Hebert et al [<xref ref-type="bibr" rid="ref35">35</xref>] described in detail the NLP steps, including splitting clinical notes into sentences and phrases, filtering sentences and phrases to those containing references to a hypoglycemia-related Unified Medical Language System [<xref ref-type="bibr" rid="ref38">38</xref>] concept, identifying temporal phrases (identifying when the event occurred), and clarifying polarity (assertion or negation) into no, nonsevere, or severe event using both rule-based algorithms. Li et al [<xref ref-type="bibr" rid="ref34">34</xref>] identified hypoglycemia using a formally defined pattern (<italic>regular expression</italic>) [<xref ref-type="bibr" rid="ref39">39</xref>] such as a <italic>blood sugar word,</italic> followed within 5 words by what could be a low blood sugar value represented by a number ranging from 10 to 69. Uzoigwe et al [<xref ref-type="bibr" rid="ref36">36</xref>] identified keywords or concepts of interest related to both symptom-based and nonsymptom-based hypoglycemic events. The remaining studies (5/8, 63%) applied the same NLP algorithms to identify [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref37">37</xref>] (1) terms or concepts (eg, hypoglycemia), including alternative or incorrect spellings and abbreviations; (2) descriptive attributes of the hypoglycemia mention (eg, seriousness, duration, and frequency); (3) sentiment of the mention (eg, denial, affirmation, and discussion); and (4) other contextual information (eg, note section headers and neighboring text).</p>
        <p>Manual review of clinical notes was used as the gold standard to validate the NLP algorithms in 63% (5/8) of the studies. Of the 8 studies, 2 (25%) did not report validation of the algorithm, whereas in the 6 (75%) reporting studies, the precision (positive predictive value) for the hypoglycemia algorithm was 0.77% to 93% [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Of these 6 studies, 5 (83%) reported that the recall (sensitivity) was 0.67 [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref37">37</xref>].</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Natural language processing (NLP) algorithms applied in the reviewed studies.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="180"/>
            <col width="150"/>
            <col width="670"/>
            <thead>
              <tr valign="top">
                <td>Study</td>
                <td>NLP algorithm type</td>
                <td>Details of NLP algorithms</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Ganz et al, 2014 [<xref ref-type="bibr" rid="ref37">37</xref>]; Nunes et al, 2016 [<xref ref-type="bibr" rid="ref31">31</xref>]; Nunes et al, 2017 [<xref ref-type="bibr" rid="ref29">29</xref>]; Loughlin et al, 2018 [<xref ref-type="bibr" rid="ref32">32</xref>]; Pettus et al, 2019 [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td>Rule-based</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Identify terms consistent with hypoglycemia (including alternative or incorrect spellings and abbreviations)</p>
                    </list-item>
                    <list-item>
                      <p>Identify descriptive attributes of the hypoglycemia mention (eg, seriousness, duration, and frequency)</p>
                    </list-item>
                    <list-item>
                      <p>Identify sentiment of the mention (eg, denial and affirmation, including “has,” “diagnosed,” and “present”)</p>
                    </list-item>
                    <list-item>
                      <p>Identify contextual information (eg, note section headers and neighboring text). Sections such as “history of present illness,” “assessment,” “hospital course,” “reason,” “review of symptoms,” and “chief complaint” generally reflected occurrence of hypoglycemia</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Li et al, 2019 [<xref ref-type="bibr" rid="ref34">34</xref>]</td>
                <td>Rule-based</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>A formally defined pattern (regular expression), which identified clinical reports mentioning a “blood sugar word” followed within 5 words by what could be a low blood sugar value represented by a number ranging from 10 to 69</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Misra-Hebert et al, 2020 [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>Rule-based</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Split clinical notes into sentences and phrases</p>
                    </list-item>
                    <list-item>
                      <p>Filter sentences and phrases to those containing a hypoglycemia-related Unified Medical Language System concept</p>
                    </list-item>
                    <list-item>
                      <p>Identify temporal phrases (when the event occurred)</p>
                    </list-item>
                    <list-item>
                      <p>Classify polarity (assertion or negation) into no, nonsevere, and severe event</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Uzoigwe et al, 2020 [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>Rule-based</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Identify keywords or concepts of interest: symptom-based and nonsymptom-based hypoglycemic events</p>
                    </list-item>
                  </list>
                  <list list-type="bullet">
                    <list-item>
                      <p>Symptom-based terms: neuroglycopenic and adrenergic symptomology associated with hypoglycemia.</p>
                    </list-item>
                  </list>
                  <list list-type="bullet">
                    <list-item>
                      <p>Adrenergic symptomology: elevated or irregular heart rate, sweating, tremor, trembling, tingling, or shaking, and vision impairment</p>
                    </list-item>
                    <list-item>
                      <p>Neuroglycopenic symptomology: cognitive issues, irritable or anxious, mood or behavior change+NOT substance abuse or alcohol, slurred speech+NOT stroke+NOT substance abuse or alcohol</p>
                    </list-item>
                  </list>
                  <list list-type="bullet">
                    <list-item>
                      <p>Nonsymptom-based definition:</p>
                    </list-item>
                  </list>
                  <list list-type="bullet">
                    <list-item>
                      <p>Mention of “hypoglycemia”</p>
                    </list-item>
                    <list-item>
                      <p>Relevant medical ontology such as “low glucose”</p>
                    </list-item>
                    <list-item>
                      <p>A blood glucose laboratory value ≤70 mg/dL documented</p>
                    </list-item>
                  </list>
                </td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Prevalence or Incidence of Hypoglycemia</title>
        <p>The prevalence or the incidence of hypoglycemia largely varied across studies. All studies used a combination of NLP and other approaches (eg, ICD codes) to identify hypoglycemia. Overall, the prevalence rate of any condition of hypoglycemia was 3.4% to 46.2%, as reported by 50% (4/8) of the studies [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>], and the incidence rate was 6.28% to 65.7%, as reported by 38% (3/8) of the studies [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. The prevalence rate of nonsevere hypoglycemia was 0.1% to 3.4% [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref35">35</xref>] and that of severe hypoglycemia was 5.1% to 18.7% [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Of the 8 studies, 4 (50%) compared the prevalence or incidence of hypoglycemia identified by NLP and ICD codes. In the study by Nunes et al (2016) [<xref ref-type="bibr" rid="ref31">31</xref>], the prevalence rates of any hypoglycemia within the study period were 12.4%, 25.1%, and 32.2% for the ICD-9, NLP algorithm, and combined algorithm, respectively. Similarly, Misra-Hebert et al [<xref ref-type="bibr" rid="ref35">35</xref>] found that NLP identified higher nonserious hypoglycemia events than ICD codes (14,763 vs 10,205 events) during the study period from 2005 to 2017; among 204,517 patients with no ICD codes for nonsevere hypoglycemia, evidence of nonsevere hypoglycemia was found in 7035 (3.44%) using NLP. Li et al [<xref ref-type="bibr" rid="ref34">34</xref>] also showed that hypoglycemia was identified in 21% of the participants, with 9.67% identified only by NLP algorithms. In addition, Uzoigwe et al [<xref ref-type="bibr" rid="ref36">36</xref>] found that the prevalence rates of hypoglycemia were 11.4% and &#60;0.1% using NLP algorithms and ICD codes, respectively, in T2D; the prevalence rates were 20.4% and 0.1%, respectively, in T1D.</p>
        <p>Using the combination of NLP and other approaches (eg, ICD codes) identified the highest prevalence or incidence of hypoglycemia compared with either method alone. Nunes et al [<xref ref-type="bibr" rid="ref31">31</xref>] found that the prevalence rates of hypoglycemia were 12.4% for ICD codes, 25.1% for NLP algorithm, and 32.2% for combined algorithms; the incidence rates per 100 person-years were 2.3%, 4.8%, and 6.3% using ICD codes, NLP, and combined algorithms, respectively. Similarly, Misra-Hebert et al [<xref ref-type="bibr" rid="ref35">35</xref>] identified that the incidence proportions of patients in the period from 2005 to 2017 were 0.4% and 1.3% for nonsevere hypoglycemia when using only ICD codes, whereas when NLP was added, the incidence proportions increased to 0.8% and 2.6%.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This systematic review aimed to synthesize the literature on the application of NLP to extract hypoglycemia from EHR clinical notes. Of the 8 studies, 4 (50%) reported that the prevalence rate of any level of hypoglycemia was 3.4% to 46.2%. Overall, the use of NLP to analyze clinical notes improved the capture of hypoglycemic events that may have been undocumented or missed using laboratory testing or ICD-9 and ICD-10 codes. The combination of NLP and other approaches significantly increased the identification of hypoglycemic events compared with individual methods. All reviewed studies applied rule-based NLP methods to identify hypoglycemia.</p>
        <p>Previous reviews of the prevalence and incidence of hypoglycemia using NLP are limited. Our study found that the prevalence rate of any condition of hypoglycemia was 3.4% to 46.2%, whereas a previous review study reported that the prevalence rate of any condition of hypoglycemia ranged from 1% to 19% for studies using EHR as a data source [<xref ref-type="bibr" rid="ref8">8</xref>]. In addition, 13% (1/8) of the studies in our review reported that symptom-based hypoglycemia—the estimated prevalence rate of hypoglycemia using combined symptom-based and nonsymptom-based definitions—was 20.4% (T1D) and 11.4% (T2D) [<xref ref-type="bibr" rid="ref36">36</xref>], which is more prevalent than previous analyses without applying NLP for data extraction [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>].</p>
        <p>All included studies (n=8) applied rule-based NLP to identify hypoglycemia. The main aim of our paper focused on the application of NLP algorithms to identify hypoglycemia and not on the method for developing algorithms. Published articles have reported developing machine learning or deep learning algorithms to identify hypoglycemia, but they did not report the incidence of hypoglycemia; therefore, we did not include such papers in our review. For example, Chen et al [<xref ref-type="bibr" rid="ref42">42</xref>] incorporated 3 machine learning algorithms to detect hypoglycemia, including logistic regression, linear support vector machines, and random forest. The result showed that single cross-validation logistic regression with cost-sensitive learning achieved the best performance with sensitivity of 0.693 and specificity of 0.974. In addition, Jin et al [<xref ref-type="bibr" rid="ref43">43</xref>] developed and evaluated deep learning–based NLP systems to automatically detect hypoglycemia events from EHR narratives; they found that the convolutional neural network model yielded a promising performance with precision of 0.96 and recall of 0.86 in a 10-fold cross-validation setting. Furthermore, none of our reviewed studies applied the currently dominant method (eg, transformer models and transfer learning) in NLP research to identify hypoglycemia from EHR data. Our review indicated that the applications of NLP to identify hypoglycemia mainly use the rule-based system. Although machine learning– and deep learning–based algorithms have been developed, they have not been applied in clinical research.</p>
        <p>A limitation of this review is the heterogeneity of the reported results. This heterogeneity prevents the estimation of the pooled incidence and prevalence of hypoglycemia in diabetes using NLP algorithms. In addition, excluding conference proceedings reduced the number of papers included. However, medical literature does not take conference proceedings into much consideration when making clinical decisions; therefore, conference proceedings are usually not included in a review paper in medical literature. However, in terms of clinical impacts, findings from the excluded conference proceedings would have more impact regarding the clinical decision of using NLP as a clinical algorithm, which can help patients or physicians to better identify high-risk hypoglycemia. To the best of our knowledge, this is the first systematic review to synthesize the prevalence and incidence of hypoglycemia using NLP in individuals with diabetes. All reviewed studies applied the combination of NLP with ICD codes and laboratory testing and identified higher incidence of hypoglycemia when using EHR data sources. This has significant clinical implications for the prevention and management of hypoglycemia; with the widespread use of EHRs, leveraging clinical notes significantly improves the identification of individuals with hypoglycemia. The preferred strategy is to use structured data (ICD codes), followed by using NLP to synthesize the unstructured data to pinpoint those at highest risk for hypoglycemia.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In conclusion, our findings provided evidence that the application of NLP to analyze clinical notes improved the capture of hypoglycemic events, particularly when combined with ICD-9 and ICD-10 codes and laboratory testing. Identifying such patients with diabetes is important and necessary for characterizing treatment and unmet needs, thus preventing the adverse events and mortality associated with hypoglycemia. The current application of NLP in the identification of hypoglycemia still relies on the traditional rule-based methods; although machine learning– and deep learning–based algorithms have been developed, they have not been applied in clinical research. Future research should explore comparison of the rule-based systems, machine learning approaches, and deep learning–based NLP methods (eg, transformer models and transfer learning) to improve NLP efficiency.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">HbA<sub>1c</sub></term>
          <def>
            <p>glycated hemoglobin</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">ICD</term>
          <def>
            <p>International Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ICD-10</term>
          <def>
            <p>International Classification of Diseases, Tenth Revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ICD-9</term>
          <def>
            <p>International Classification of Diseases, Ninth Revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PRISMA</term>
          <def>
            <p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">T1D</term>
          <def>
            <p>type 1 diabetes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">T2D</term>
          <def>
            <p>type 2 diabetes</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors acknowledge Emily M Pan and Yi Lan Zhang for their assistance with article screening during the manuscript revision.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Centers for Disease Control and Prevention</collab>
          </person-group>
          <article-title>National Diabetes Statistics Report</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <year>2020</year>
          <access-date>2022-04-21</access-date>
          <publisher-loc>Atlanta, GA, USA</publisher-loc>
          <publisher-name>U.S. Dept of Health and Human Services</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/diabetes/data/statistics-report/index.html">https://www.cdc.gov/diabetes/data/statistics-report/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ogurtsova</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>da Rocha Fernandes</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Linnenkamp</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Guariguata</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Cavan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Makaroff</surname>
              <given-names>LE</given-names>
            </name>
          </person-group>
          <article-title>IDF Diabetes Atlas: global estimates for the prevalence of diabetes for 2015 and 2040</article-title>
          <source>Diabetes Res Clin Pract</source>
          <year>2017</year>
          <month>06</month>
          <volume>128</volume>
          <fpage>40</fpage>
          <lpage>50</lpage>
          <pub-id pub-id-type="doi">10.1016/j.diabres.2017.03.024</pub-id>
          <pub-id pub-id-type="medline">28437734</pub-id>
          <pub-id pub-id-type="pii">S0168-8227(17)30375-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>American Diabetes Association</collab>
          </person-group>
          <article-title>Economic costs of diabetes in the U.S. in 2017</article-title>
          <source>Diabetes Care</source>
          <year>2018</year>
          <month>05</month>
          <volume>41</volume>
          <issue>5</issue>
          <fpage>917</fpage>
          <lpage>28</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29567642"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/dci18-0007</pub-id>
          <pub-id pub-id-type="medline">29567642</pub-id>
          <pub-id pub-id-type="pii">dci18-0007</pub-id>
          <pub-id pub-id-type="pmcid">PMC5911784</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Warren</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>McEvoy</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Matsushita</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Sharrett</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Coresh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Selvin</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The association of severe hypoglycemia with incident cardiovascular events and mortality in adults with type 2 diabetes</article-title>
          <source>Diabetes Care</source>
          <year>2018</year>
          <month>01</month>
          <volume>41</volume>
          <issue>1</issue>
          <fpage>104</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29127240"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/dc17-1669</pub-id>
          <pub-id pub-id-type="medline">29127240</pub-id>
          <pub-id pub-id-type="pii">dc17-1669</pub-id>
          <pub-id pub-id-type="pmcid">PMC5741158</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Akirov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Grossman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shochat</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Shimon</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Mortality among hospitalized patients with hypoglycemia: insulin related and noninsulin related</article-title>
          <source>J Clin Endocrinol Metab</source>
          <year>2017</year>
          <month>02</month>
          <day>01</day>
          <volume>102</volume>
          <issue>2</issue>
          <fpage>416</fpage>
          <lpage>24</lpage>
          <pub-id pub-id-type="doi">10.1210/jc.2016-2653</pub-id>
          <pub-id pub-id-type="medline">27854553</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Edridge</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Dunkley</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bodicoat</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Rose</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Davies</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Khunti</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and incidence of hypoglycaemia in 532,542 people with type 2 diabetes on oral therapies and insulin: a systematic review and meta-analysis of population based studies</article-title>
          <source>PLoS One</source>
          <year>2015</year>
          <month>6</month>
          <day>10</day>
          <volume>10</volume>
          <issue>6</issue>
          <fpage>e0126427</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0126427"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0126427</pub-id>
          <pub-id pub-id-type="medline">26061690</pub-id>
          <pub-id pub-id-type="pii">PONE-D-15-00548</pub-id>
          <pub-id pub-id-type="pmcid">PMC4465495</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Silbert</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Salcido-Montenegro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez-Gutierrez</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Katabi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McCoy</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>Hypoglycemia among patients with type 2 diabetes: epidemiology, risk factors, and prevention strategies</article-title>
          <source>Curr Diab Rep</source>
          <year>2018</year>
          <month>06</month>
          <day>21</day>
          <volume>18</volume>
          <issue>8</issue>
          <fpage>53</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29931579"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11892-018-1018-0</pub-id>
          <pub-id pub-id-type="medline">29931579</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11892-018-1018-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6117835</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alwafi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Alsharif</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Langan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Naser</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Mongkhon</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Ilomaki</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Al Metwazi</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Man</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>IC</given-names>
            </name>
          </person-group>
          <article-title>Incidence and prevalence of hypoglycaemia in type 1 and type 2 diabetes individuals: a systematic review and meta-analysis</article-title>
          <source>Diabetes Res Clin Pract</source>
          <year>2020</year>
          <month>12</month>
          <volume>170</volume>
          <fpage>108522</fpage>
          <pub-id pub-id-type="doi">10.1016/j.diabres.2020.108522</pub-id>
          <pub-id pub-id-type="medline">33096187</pub-id>
          <pub-id pub-id-type="pii">S0168-8227(20)30779-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Han</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yun</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>YM</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>YB</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Ko</surname>
              <given-names>SH</given-names>
            </name>
          </person-group>
          <article-title>Development and validation of a risk prediction model for severe hypoglycemia in adult patients with type 2 diabetes: a nationwide population-based cohort study</article-title>
          <source>Clin Epidemiol</source>
          <year>2018</year>
          <month>10</month>
          <day>23</day>
          <volume>10</volume>
          <fpage>1545</fpage>
          <lpage>59</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.2147/CLEP.S169835"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/CLEP.S169835</pub-id>
          <pub-id pub-id-type="medline">30425585</pub-id>
          <pub-id pub-id-type="pii">clep-10-1545</pub-id>
          <pub-id pub-id-type="pmcid">PMC6203120</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Karter</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Moffet</surname>
              <given-names>HH</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Lipska</surname>
              <given-names>KJ</given-names>
            </name>
          </person-group>
          <article-title>Surveillance of hypoglycemia-limitations of emergency department and hospital utilization data</article-title>
          <source>JAMA Intern Med</source>
          <year>2018</year>
          <month>07</month>
          <day>01</day>
          <volume>178</volume>
          <issue>7</issue>
          <fpage>987</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29710182"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2018.1014</pub-id>
          <pub-id pub-id-type="medline">29710182</pub-id>
          <pub-id pub-id-type="pii">2678453</pub-id>
          <pub-id pub-id-type="pmcid">PMC6033620</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Beam</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in healthcare</article-title>
          <source>Nat Biomed Eng</source>
          <year>2018</year>
          <month>10</month>
          <volume>2</volume>
          <issue>10</issue>
          <fpage>719</fpage>
          <lpage>31</lpage>
          <pub-id pub-id-type="doi">10.1038/s41551-018-0305-z</pub-id>
          <pub-id pub-id-type="medline">31015651</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41551-018-0305-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>MIT Critical Data</collab>
          </person-group>
          <source>Secondary Analysis of Electronic Health Records</source>
          <year>2016</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Siddiqui</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Seliger</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Blumenthal</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Doerfler</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fink</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Text preprocessing for improving hypoglycemia detection from clinical notes - a case study of patients with diabetes</article-title>
          <source>Int J Med Inform</source>
          <year>2019</year>
          <month>09</month>
          <volume>129</volume>
          <fpage>374</fpage>
          <lpage>80</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2019.06.020</pub-id>
          <pub-id pub-id-type="medline">31445280</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(18)31446-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Murdoch</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Detsky</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>The inevitable application of big data to health care</article-title>
          <source>JAMA</source>
          <year>2013</year>
          <month>04</month>
          <day>03</day>
          <volume>309</volume>
          <issue>13</issue>
          <fpage>1351</fpage>
          <lpage>2</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2013.393</pub-id>
          <pub-id pub-id-type="medline">23549579</pub-id>
          <pub-id pub-id-type="pii">1674245</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Siminerio</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Krall</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Anton</surname>
              <given-names>BB</given-names>
            </name>
            <name name-style="western">
              <surname>Hodges</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Bednarz</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Applying real-world data to inform continuous glucose monitoring use in clinical practice</article-title>
          <source>J Diabetes Sci Technol</source>
          <year>2021</year>
          <month>07</month>
          <volume>15</volume>
          <issue>4</issue>
          <fpage>968</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33703933"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1932296821997403</pub-id>
          <pub-id pub-id-type="medline">33703933</pub-id>
          <pub-id pub-id-type="pmcid">PMC8258536</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elbattah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Arnaud</surname>
              <given-names>É</given-names>
            </name>
            <name name-style="western">
              <surname>Gignon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dequen</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>The role of text analytics in healthcare: a review of recent developments and applications</article-title>
          <source>Proceedings of the 14th International Joint Conference on Biomedical Engineering Systems and Technologies</source>
          <year>2021</year>
          <conf-name>BIOSTEC '21</conf-name>
          <conf-date>February 11-13, 2021</conf-date>
          <conf-loc>Virtual</conf-loc>
          <fpage>825</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.5220/0010414508250832</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hirschberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>CD</given-names>
            </name>
          </person-group>
          <article-title>Advances in natural language processing</article-title>
          <source>Science</source>
          <year>2015</year>
          <month>07</month>
          <day>17</day>
          <volume>349</volume>
          <issue>6245</issue>
          <fpage>261</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1126/science.aaa8685</pub-id>
          <pub-id pub-id-type="medline">26185244</pub-id>
          <pub-id pub-id-type="pii">349/6245/261</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pivovarov</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Automated methods for the summarization of electronic health records</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2015</year>
          <month>09</month>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>938</fpage>
          <lpage>47</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25882031"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocv032</pub-id>
          <pub-id pub-id-type="medline">25882031</pub-id>
          <pub-id pub-id-type="pii">ocv032</pub-id>
          <pub-id pub-id-type="pmcid">PMC4986665</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Illipparambil</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Netherton</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Sheshadri</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Karu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>PH</given-names>
            </name>
          </person-group>
          <article-title>Racing against the clock: internal medicine residents' time spent on electronic health records</article-title>
          <source>J Grad Med Educ</source>
          <year>2016</year>
          <month>02</month>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>39</fpage>
          <lpage>44</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26913101"/>
          </comment>
          <pub-id pub-id-type="doi">10.4300/JGME-D-15-00240.1</pub-id>
          <pub-id pub-id-type="medline">26913101</pub-id>
          <pub-id pub-id-type="pii">JGME-D-15-00240</pub-id>
          <pub-id pub-id-type="pmcid">PMC4763387</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Olthof</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Shouche</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Fennema</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>IJpma</surname>
              <given-names>FF</given-names>
            </name>
            <name name-style="western">
              <surname>Koolstra</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Stirler</surname>
              <given-names>VM</given-names>
            </name>
            <name name-style="western">
              <surname>van Ooijen</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Cornelissen</surname>
              <given-names>LJ</given-names>
            </name>
          </person-group>
          <article-title>Machine learning based natural language processing of radiology reports in orthopaedic trauma</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2021</year>
          <month>09</month>
          <volume>208</volume>
          <fpage>106304</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0169-2607(21)00378-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2021.106304</pub-id>
          <pub-id pub-id-type="medline">34333208</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(21)00378-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Adekkanattu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Campion Jr</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Flory</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>OV</given-names>
            </name>
            <name name-style="western">
              <surname>DuVall</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Major</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Aphinyanaphongs</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>From sour grapes to low-hanging fruit: a case study demonstrating a practical strategy for natural language processing portability</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2018</year>
          <month>5</month>
          <day>18</day>
          <volume>2017</volume>
          <fpage>104</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29888051"/>
          </comment>
          <pub-id pub-id-type="medline">29888051</pub-id>
          <pub-id pub-id-type="pmcid">PMC5961788</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sholle</surname>
              <given-names>ET</given-names>
            </name>
            <name name-style="western">
              <surname>Pinheiro</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Adekkanattu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Davila</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sinha</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lubansky</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Safford</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Campion</surname>
              <given-names>TR</given-names>
            </name>
          </person-group>
          <article-title>Underserved populations with missing race ethnicity data differ significantly from those with structured race/ethnicity documentation</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>08</month>
          <day>01</day>
          <volume>26</volume>
          <issue>8-9</issue>
          <fpage>722</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31329882"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz040</pub-id>
          <pub-id pub-id-type="medline">31329882</pub-id>
          <pub-id pub-id-type="pii">5480563</pub-id>
          <pub-id pub-id-type="pmcid">PMC6696506</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>WK</given-names>
            </name>
            <name name-style="western">
              <surname>Hassanpour</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Heagerty</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rundell</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Suri</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Huhdanpaa</surname>
              <given-names>HT</given-names>
            </name>
            <name name-style="western">
              <surname>James</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Carrell</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Langlotz</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Organ</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Meier</surname>
              <given-names>EN</given-names>
            </name>
            <name name-style="western">
              <surname>Sherman</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kallmes</surname>
              <given-names>DF</given-names>
            </name>
            <name name-style="western">
              <surname>Luetmer</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Griffith</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Nerenz</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Jarvik</surname>
              <given-names>JG</given-names>
            </name>
          </person-group>
          <article-title>Comparison of natural language processing rules-based and machine-learning systems to identify lumbar spine imaging findings related to low back pain</article-title>
          <source>Acad Radiol</source>
          <year>2018</year>
          <month>11</month>
          <volume>25</volume>
          <issue>11</issue>
          <fpage>1422</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29605561"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.acra.2018.03.008</pub-id>
          <pub-id pub-id-type="medline">29605561</pub-id>
          <pub-id pub-id-type="pii">S1076-6332(18)30121-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6162177</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Clinical trial cohort selection based on multi-level rule-based natural language processing system</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>11</month>
          <day>01</day>
          <volume>26</volume>
          <issue>11</issue>
          <fpage>1218</fpage>
          <lpage>26</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31300825"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz109</pub-id>
          <pub-id pub-id-type="medline">31300825</pub-id>
          <pub-id pub-id-type="pii">5531899</pub-id>
          <pub-id pub-id-type="pmcid">PMC7647235</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sulieman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gilmore</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>French</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cronin</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>GP</given-names>
            </name>
            <name name-style="western">
              <surname>Russell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fabbri</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Classifying patient portal messages using Convolutional Neural Networks</article-title>
          <source>J Biomed Inform</source>
          <year>2017</year>
          <month>10</month>
          <volume>74</volume>
          <fpage>59</fpage>
          <lpage>70</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(17)30197-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2017.08.014</pub-id>
          <pub-id pub-id-type="medline">28864104</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(17)30197-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Datta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Si</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Soni</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Deep learning in clinical natural language processing: a methodical review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>03</month>
          <day>01</day>
          <volume>27</volume>
          <issue>3</issue>
          <fpage>457</fpage>
          <lpage>70</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31794016"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz200</pub-id>
          <pub-id pub-id-type="medline">31794016</pub-id>
          <pub-id pub-id-type="pii">5651084</pub-id>
          <pub-id pub-id-type="pmcid">PMC7025365</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rasmy</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Med-BERT: pretrained contextualized embeddings on large-scale structured electronic health records for disease prediction</article-title>
          <source>NPJ Digit Med</source>
          <year>2021</year>
          <month>05</month>
          <day>20</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>86</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-021-00455-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-021-00455-y</pub-id>
          <pub-id pub-id-type="medline">34017034</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-021-00455-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC8137882</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</source>
          <year>2019</year>
          <conf-name>NAACL '19</conf-name>
          <conf-date>June 2-7, 2019</conf-date>
          <conf-loc>Minneapolis, MN, USA</conf-loc>
          <fpage>4171</fpage>
          <lpage>86</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/N19-1423.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/N19-1423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nunes</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Iglay</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Radican</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Engel</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Doherty</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Dore</surname>
              <given-names>DD</given-names>
            </name>
          </person-group>
          <article-title>Hypoglycaemia seriousness and weight gain as determinants of cardiovascular disease outcomes among sulfonylurea users</article-title>
          <source>Diabetes Obes Metab</source>
          <year>2017</year>
          <month>10</month>
          <volume>19</volume>
          <issue>10</issue>
          <fpage>1425</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1111/dom.13000</pub-id>
          <pub-id pub-id-type="medline">28497592</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bramer</surname>
              <given-names>WM</given-names>
            </name>
          </person-group>
          <article-title>Serving Evidence Syntheses: improving literature retrieval in systematic reviews</article-title>
          <source>Erasmus University Rotterdam</source>
          <year>2019</year>
          <month>10</month>
          <day>29</day>
          <access-date>2022-05-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://repub.eur.nl/pub/120107">https://repub.eur.nl/pub/120107</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nunes</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Radican</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Engel</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Kurtyka</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tunceli</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Iglay</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Doherty</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Dore</surname>
              <given-names>DD</given-names>
            </name>
          </person-group>
          <article-title>Assessing occurrence of hypoglycemia and its severity from electronic health records of patients with type 2 diabetes mellitus</article-title>
          <source>Diabetes Res Clin Pract</source>
          <year>2016</year>
          <month>11</month>
          <volume>121</volume>
          <fpage>192</fpage>
          <lpage>203</lpage>
          <pub-id pub-id-type="doi">10.1016/j.diabres.2016.09.012</pub-id>
          <pub-id pub-id-type="medline">27744128</pub-id>
          <pub-id pub-id-type="pii">S0168-8227(16)30603-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Loughlin</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Qiao</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Nunes</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Ezzy</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Yochum</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Clifford</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Gately</surname>
              <given-names>RV</given-names>
            </name>
            <name name-style="western">
              <surname>Dore</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Seeger</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Effectiveness and tolerability of therapy with once-weekly exenatide versus basal insulin among injectable-naive patients with type 2 diabetes in a real-world setting in the United States</article-title>
          <source>Diabetes Spectr</source>
          <year>2018</year>
          <month>05</month>
          <volume>31</volume>
          <issue>2</issue>
          <fpage>129</fpage>
          <lpage>37</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29773932"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/ds16-0081</pub-id>
          <pub-id pub-id-type="medline">29773932</pub-id>
          <pub-id pub-id-type="pii">129</pub-id>
          <pub-id pub-id-type="pmcid">PMC5951230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pettus</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Roussel</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liz Zhou</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bosnyak</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Westerbacka</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Berria</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jimenez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Eliasson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hramiak</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Meneghini</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Rates of hypoglycemia predicted in patients with type 2 diabetes on insulin Glargine 300 U/ml versus first- and second-generation basal insulin analogs: the real-world LIGHTNING study</article-title>
          <source>Diabetes Ther</source>
          <year>2019</year>
          <month>04</month>
          <volume>10</volume>
          <issue>2</issue>
          <fpage>617</fpage>
          <lpage>33</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30767173"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s13300-019-0568-8</pub-id>
          <pub-id pub-id-type="medline">30767173</pub-id>
          <pub-id pub-id-type="pii">10.1007/s13300-019-0568-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6437256</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Radican</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cummins</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Engel</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Iglay</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Duke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brodovicz</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Naik</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Leventhal</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chatterjee</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Rajpathak</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Predictive modeling of hypoglycemia for clinical decision support in evaluating outpatients with diabetes mellitus</article-title>
          <source>Curr Med Res Opin</source>
          <year>2019</year>
          <month>11</month>
          <volume>35</volume>
          <issue>11</issue>
          <fpage>1885</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1080/03007995.2019.1636016</pub-id>
          <pub-id pub-id-type="medline">31234649</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Misra-Hebert</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Milinovich</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zajichek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Hobbs</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Petraro</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>SX</given-names>
            </name>
            <name name-style="western">
              <surname>Mocarski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ganguly</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bauman</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Pantalone</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Zimmerman</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Kattan</surname>
              <given-names>MW</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing improves detection of nonsevere hypoglycemia in medical records versus coding alone in patients with type 2 diabetes but does not improve prediction of severe hypoglycemia events: an analysis using the electronic medical record in a large health system</article-title>
          <source>Diabetes Care</source>
          <year>2020</year>
          <month>08</month>
          <volume>43</volume>
          <issue>8</issue>
          <fpage>1937</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32414887"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/dc19-1791</pub-id>
          <pub-id pub-id-type="medline">32414887</pub-id>
          <pub-id pub-id-type="pii">dc19-1791</pub-id>
          <pub-id pub-id-type="pmcid">PMC7372042</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Uzoigwe</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hamersky</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Arbit</surname>
              <given-names>DI</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Radin</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Assessing prevalence of hypoglycemia in a medical transcription database</article-title>
          <source>Diabetes Metab Syndr Obes</source>
          <year>2020</year>
          <month>6</month>
          <day>24</day>
          <volume>13</volume>
          <fpage>2209</fpage>
          <lpage>16</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.2147/DMSO.S235298"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/DMSO.S235298</pub-id>
          <pub-id pub-id-type="medline">32612376</pub-id>
          <pub-id pub-id-type="pii">235298</pub-id>
          <pub-id pub-id-type="pmcid">PMC7322136</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ganz</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Wintfeld</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Gatt</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Severe hypoglycemia rates and associated costs among type 2 diabetics starting basal insulin therapy in the United States</article-title>
          <source>Curr Med Res Opin</source>
          <year>2014</year>
          <month>10</month>
          <volume>30</volume>
          <issue>10</issue>
          <fpage>1991</fpage>
          <lpage>2000</lpage>
          <pub-id pub-id-type="doi">10.1185/03007995.2014.936930</pub-id>
          <pub-id pub-id-type="medline">24945720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Humphreys</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Lindberg</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Hole</surname>
              <given-names>WT</given-names>
            </name>
          </person-group>
          <article-title>Assessing and enhancing the value of the UMLS Knowledge Sources</article-title>
          <source>Proc Annu Symp Comput Appl Med Care</source>
          <year>1991</year>
          <fpage>78</fpage>
          <lpage>82</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/1807711"/>
          </comment>
          <pub-id pub-id-type="medline">1807711</pub-id>
          <pub-id pub-id-type="pmcid">PMC2247499</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Dillig</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Durrett</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Sketch-driven regular expression generation from natural language and examples</article-title>
          <source>Trans Assoc Comput Linguist</source>
          <year>2020</year>
          <month>12</month>
          <volume>8</volume>
          <fpage>679</fpage>
          <lpage>94</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2020.tacl-1.44.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.1162/tacl_a_00339</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ganz</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Paprocki</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Weatherall</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The burden of severe hypoglycemia in type 1 diabetes</article-title>
          <source>Curr Med Res Opin</source>
          <year>2018</year>
          <month>01</month>
          <volume>34</volume>
          <issue>1</issue>
          <fpage>171</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1080/03007995.2017.1391079</pub-id>
          <pub-id pub-id-type="medline">29019269</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ganz</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Paprocki</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Weatherall</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The burden of severe hypoglycemia in type 2 diabetes</article-title>
          <source>Curr Med Res Opin</source>
          <year>2018</year>
          <month>01</month>
          <volume>34</volume>
          <issue>1</issue>
          <fpage>179</fpage>
          <lpage>86</lpage>
          <pub-id pub-id-type="doi">10.1080/03007995.2017.1391080</pub-id>
          <pub-id pub-id-type="medline">29017368</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lalor</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Druhl</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Granillo</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Vimalananda</surname>
              <given-names>VG</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Detecting hypoglycemia incidents reported in patients' secure messages: using cost-sensitive learning and oversampling to reduce data imbalance</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>03</month>
          <day>11</day>
          <volume>21</volume>
          <issue>3</issue>
          <fpage>e11990</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/3/e11990/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/11990</pub-id>
          <pub-id pub-id-type="medline">30855231</pub-id>
          <pub-id pub-id-type="pii">v21i3e11990</pub-id>
          <pub-id pub-id-type="pmcid">PMC6431826</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>HYPE: a high performing NLP system for automatically detecting hypoglycemia events from electronic health record notes</article-title>
          <source>arXiv (forthcoming)</source>
          <year>2018</year>
          <month>11</month>
          <day>28</day>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1811.11945"/>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
