<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JD</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Diabetes</journal-id>
      <journal-title>JMIR Diabetes</journal-title>
      <issn pub-type="epub">2371-4379</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v5i1e14431</article-id>
      <article-id pub-id-type="pmid"/>
      <article-id pub-id-type="doi">10.2196/14431</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Using Social Media to Track Geographic Variability in Language About Diabetes: Infodemiology Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Richardson</surname>
            <given-names>Caroline</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hendrikx</surname>
            <given-names>Roy</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Oser</surname>
            <given-names>Tamara</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Da Silva</surname>
            <given-names>Edson</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Griffis</surname>
            <given-names>Heather</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Children's Hospital of Philadelphia</institution>
            <addr-line>2716 South Street</addr-line>
            <addr-line>Philadelphia, PA, 19126</addr-line>
            <country>United States</country>
            <phone>1 2196880543</phone>
            <email>griffish@email.chop.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9284-4707</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Asch</surname>
            <given-names>David A</given-names>
          </name>
          <degrees>MD, MBA</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7970-286X</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Schwartz</surname>
            <given-names>H Andrew</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6383-3339</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Ungar</surname>
            <given-names>Lyle</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2047-1443</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Buttenheim</surname>
            <given-names>Alison M</given-names>
          </name>
          <degrees>MBA, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2432-1637</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Barg</surname>
            <given-names>Frances K</given-names>
          </name>
          <degrees>MEd, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3328-1980</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Mitra</surname>
            <given-names>Nandita</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7714-3910</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Merchant</surname>
            <given-names>Raina M</given-names>
          </name>
          <degrees>MD, MS</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9801-6881</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Children's Hospital of Philadelphia</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>University of Pennsylvania</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Stony Brook University</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Heather Griffis <email>griffish@email.chop.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Jan-Mar</season>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>11</day>
        <month>2</month>
        <year>2020</year>
      </pub-date>
      <volume>5</volume>
      <issue>1</issue>
      <elocation-id>e14431</elocation-id>
      <history>
        <date date-type="received">
          <day>17</day>
          <month>4</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>6</day>
          <month>6</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>23</day>
          <month>10</month>
          <year>2019</year>
        </date>
        <date date-type="accepted">
          <day>11</day>
          <month>11</month>
          <year>2019</year>
        </date>
      </history>
      <copyright-statement>©Heather Griffis, David A Asch, H Andrew Schwartz, Lyle Ungar, Alison M Buttenheim, Frances K Barg, Nandita Mitra, Raina M Merchant. Originally published in JMIR Diabetes (http://diabetes.jmir.org), 11.02.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Diabetes, is properly cited. The complete bibliographic information, a link to the original publication on http://diabetes.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://diabetes.jmir.org/2020/1/e14431/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Social media posts about diabetes could reveal patients’ knowledge, attitudes, and beliefs as well as approaches for better targeting of public health messages and care management.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to characterize the language of Twitter users’ posts regarding diabetes and describe the correlation of themes with the county-level prevalence of diabetes.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>A retrospective study of diabetes-related tweets identified from a random sample of approximately 37 billion tweets from the United States from 2009 to 2015 was conducted. We extracted diabetes-specific tweets and used machine learning to identify statistically significant topics of related terms. Topics were combined into themes and compared with the prevalence of diabetes by US counties and further compared with geography (US Census Divisions). Pearson correlation coefficients are reported for each topic and relationship with prevalence.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A total of 239,989 tweets from 121,494 unique users included the term diabetes. The themes emerging from the topics included unhealthy food and drink, treatment, symptoms/diagnoses, risk factors, research, recipes, news, health care, management, fundraising, diet, communication, and supplements/remedies. The theme of unhealthy foods most positively correlated with geographic areas with high prevalence of diabetes (<italic>r</italic>=0.088), whereas tweets related to research most negatively correlated (<italic>r</italic>=−0.162) with disease prevalence. Themes and topics about diabetes differed in overall frequency across the US geographical divisions, with the East South Central and South Atlantic states having a higher frequency of topics referencing unhealthy food (<italic>r</italic> range=0.073-0.146; <italic>P</italic>&lt;.001).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Diabetes-related tweets originating from counties with high prevalence of diabetes have different themes than tweets originating from counties with low prevalence of diabetes. Interventions could be informed from this variation to promote healthy behaviors.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>social media</kwd>
        <kwd>epidemiology</kwd>
        <kwd>infodemiology</kwd>
        <kwd>diabetes</kwd>
        <kwd>prevalence</kwd>
        <kwd>twitter</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Diabetes affects 30 million people in the United States, and its prevalence varies by geographic region. A better understanding of the regional differences concerning diabetes could allow for better public health messaging. The colloquial person-to-person communication about diabetes might inform that understanding, but word-of-mouth communication has been hard to measure until social media created the possibility of listening in.</p>
        <p>Social media platforms such as Twitter, Facebook, and Instagram have emerged as high-volume, real-time data sources to study and observe communications, including health-related communications, from broad population segments [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref5">5</xref>]. Web-based communities are often far reaching, offering various types of communication including person-to-person communication, information seeking and dissemination, social support, and broadcasting of ideas and opinions. In addition, these communities can have similar location-specific characteristics. The content and characteristics of social media posts are associated with the regional epidemiology of disease [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. For example, Instagram users residing in areas with low access to grocery stores (food deserts) posted about and consumed foods higher in fat and cholesterol compared with users residing in areas with greater access to grocery stores [<xref ref-type="bibr" rid="ref3">3</xref>]. Thus, a better understanding of how people talk about diabetes via social media could provide insights about how to provide better targeted disease management and treatment.</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>In this study, we sought to characterize language about diabetes on Twitter and examine the correlation between this language and the prevalence of diabetes.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Source and Sample</title>
        <p>This was a retrospective study of data extracted from Twitter about diabetes. Using natural language processing methodology, we found diabetes-specific terms, grouped them into clusters, and then quantified associations with the prevalence of diabetes. This study was approved by the Institutional Review Board of the University of Pennsylvania.</p>
        <p>Tweets are brief status updates (no more than 140 characters during the duration of this study) containing information about emotions, thoughts, behaviors, and other personally salient information. Twitter users are broadly represented across age, geography, and social distributions [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. African Americans, Latinos, and those in urban areas are overrepresented on Twitter relative to the general population [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>For this study, we examined a random 10.00% (3,700,000/37,000,000) sample of all tweets between July 2009 and February 2015 (37 billion total tweets). We then extracted all tweets in English language with the keyword <italic>diabetes</italic> that originated in the United States, with GPS coordinates or other identifying information sufficient for linking to a US county (such as direct reference to a named county within a state, such as Philadelphia County, Pennsylvania). Approximately 21% of Twitter users provide their location information [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
      </sec>
      <sec>
        <title>Twitter Topic Generation</title>
        <p>We first limited our analysis to diabetes-specific language by finding those words and phrases that had a significant association with posts mentioning diabetes. Specifically, we used a random sample of 25,000 tweets including the word <italic>diabetes</italic> and 25,000 tweets without the word <italic>diabetes</italic>, and out of the 5000 most frequently used words, we kept those that were used significantly more frequently in the diabetes-related messages according to a logistic regression (Benjamini-Hochberg corrected <italic>P</italic>&lt;.05 [<xref ref-type="bibr" rid="ref13">13</xref>]). This removed nondiabetes-related words such as <italic>the</italic> or <italic>like</italic>. We then grouped diabetes-specific vocabulary in topics (clusters of semantically related words) using Latent Dirichlet Allocation (LDA). LDA is an automated machine learning process by which frequently co-occurring words are organized into topics [<xref ref-type="bibr" rid="ref14">14</xref>]. Topic usage is quantified on a scale, referred to as <italic>topic probability</italic>, from 0 to 1 (from not used at all to exclusively used), which corresponds to the percentage of words from the given topic.</p>
        <p>Two research assistants then independently reviewed 100 topics and categorized them into common themes based on the language within the topics. Any deviations between the research assistants were discussed among the research team members to reach consensus.</p>
      </sec>
      <sec>
        <title>Relation of Diabetes Topics and Prevalence</title>
        <p>To determine how topics on diabetes relate to diabetes prevalence, topic probabilities were individually correlated with age-adjusted county diabetes rates from the Centers for Disease Control and Prevention at the county level for 2012 [<xref ref-type="bibr" rid="ref15">15</xref>]. In addition, topics were regressed against the 9 US Census Divisions using logistic regression controlling for language of the division.</p>
        <p><italic>P</italic> values were corrected for multiple testing using the Benjamini-Hochberg procedure. Pearson correlation coefficients are reported for topics, with <italic>P</italic>&lt;.01 indicating significance.</p>
        <p>All statistical analyses were performed with the Differential Language Analysis Toolkit version 1.1 [<xref ref-type="bibr" rid="ref16">16</xref>] and Python 2.7.10 (Python Software Foundation).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>From approximately 37 billion tweets, 1.8 billion included sufficient location information to map to US counties. Of those, 1.6 billion were in English, of which 239,989 tweets (0.15%) included the term <italic>diabetes</italic>, representing 121,494 unique users.</p>
      <p>Topics categorized into themes are displayed in <xref ref-type="table" rid="table1">Table 1</xref>. Each row of words represents 1 topic within the theme. Examples of topics that correlated with diabetes-related tweets included unhealthy food and drink-themed topics [(<italic>cupcakes</italic>, <italic>whipped</italic>, <italic>Haribo</italic>, and <italic>sundae</italic>) and (<italic>chocolate</italic>, <italic>Cinnabons</italic>, <italic>meats</italic>, and <italic>soda</italic>)] as well as a risk factors theme (<italic>body mass index</italic>, <italic>waist</italic>, <italic>drugs</italic>, <italic>alcoholic</italic>, and <italic>obese)</italic> and a fundraising theme (<italic>walk</italic>, <italic>charities</italic>, <italic>supporting</italic>, <italic>donation</italic>, and <italic>November).</italic></p>
      <p>Twitter users from regions with high prevalence of diabetes were more likely to tweet about unhealthy foods (<italic>candy bar</italic>, <italic>cookies</italic>, and <italic>Twinkies</italic>; <italic>r</italic>=0.088; <italic>P</italic>=.002), whereas twitter users from areas with low prevalence of diabetes were more likely to tweet about research (<italic>clinical</italic>, <italic>published</italic>, and <italic>enrolling</italic>; <italic>r</italic>=0.162; <italic>P</italic>&lt;.001)<italic>.</italic></p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Topics of diabetes-related terms with relevant words within topics, categorized into themes.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="258"/>
          <col width="742"/>
          <thead>
            <tr valign="top">
              <td>Theme</td>
              <td>Words within topics</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Unhealthy food/drink</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Cupcakes, whipped, Haribo, and sundae</p>
                  </list-item>
                  <list-item>
                    <p>Fattening, processed, and meats</p>
                  </list-item>
                  <list-item>
                    <p>Cinnabons, crispy, and sugar high</p>
                  </list-item>
                  <list-item>
                    <p>Kool-aid and lemonade</p>
                  </list-item>
                  <list-item>
                    <p>Candy, cookies, and bars</p>
                  </list-item>
                  <list-item>
                    <p>Sugar-sweetened, Kentucky Fried Chicken, soda, and Pepsi</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Treatment</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Exercise, diet, healthy, prevention, and managing</p>
                  </list-item>
                  <list-item>
                    <p>Medicine, treatment, symptoms, alternative, natural, and remedies</p>
                  </list-item>
                  <list-item>
                    <p>Pancreas, system, physical, and activity</p>
                  </list-item>
                  <list-item>
                    <p>Insulin, injections, and sensitivity</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Symptoms/diagnoses</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Overwhelmed, tiredness, and urination</p>
                  </list-item>
                  <list-item>
                    <p>Disease, excess, heart, and hereditary</p>
                  </list-item>
                  <list-item>
                    <p>Auto-immune, degenerative, Alzheimer, Crohns, and hyperlipidemia</p>
                  </list-item>
                  <list-item>
                    <p>Pregnancy, pre-eclampsia, gestation, and pre-existing</p>
                  </list-item>
                  <list-item>
                    <p>Charcot, gangrene, fungal, limbs, and ulcers</p>
                  </list-item>
                  <list-item>
                    <p>Unconscious, lightheaded, cramping, and sweating</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Risk factors</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Obesity, cardiovascular, and dysfunction</p>
                  </list-item>
                  <list-item>
                    <p>Obese, antipsychotics, adolescents, and teens</p>
                  </list-item>
                  <list-item>
                    <p>Alcoholic, drink, and rum</p>
                  </list-item>
                  <list-item>
                    <p>Drugs, statins, women, waist, and body mass index</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Research</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Mayoclinic.com, lifestyles, and interventions</p>
                  </list-item>
                  <list-item>
                    <p>Immunology, antigen, and enrolls</p>
                  </list-item>
                  <list-item>
                    <p>Variants, explanation, methylation, and blood</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Recipes</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Eggplant and recipe</p>
                  </list-item>
                  <list-item>
                    <p>Cookbook, ultratasty, health, and recipes</p>
                  </list-item>
                  <list-item>
                    <p>Solution, health, and recipe book</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>News</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>HealthDay, Yahoo, health news, share, and boost</p>
                  </list-item>
                  <list-item>
                    <p>CDC<sup>a</sup>, Americans, worldwide, cases, and percent</p>
                  </list-item>
                  <list-item>
                    <p>Rates, CDC rising, and death</p>
                  </list-item>
                  <list-item>
                    <p>Syndrome, metabolic, and diagnosis</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Health care</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Bloodwork, source book, and Dr’s</p>
                  </list-item>
                  <list-item>
                    <p>Payer, insurance, professionals, and telemedicine</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Management</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Glucose, management, monitoring, complications</p>
                  </list-item>
                  <list-item>
                    <p>Nurse, pharmacy, education, clinic, patient system</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Fundraising</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Juvenile, sponsor, walk, annual, research, and donating</p>
                  </list-item>
                  <list-item>
                    <p>Walk, step, cure, register, supporting, and donation</p>
                  </list-item>
                  <list-item>
                    <p>Charities and revamping</p>
                  </list-item>
                  <list-item>
                    <p>Awareness, November, month, national, and advocate</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Diet</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Mediterranean, diet, reverse, low-carb, high-fat, and paleo</p>
                  </list-item>
                  <list-item>
                    <p>Healthy, protein, carbs, meal, and stabilize</p>
                  </list-item>
                  <list-item>
                    <p>Plates, lose, eating, weight, and mindful</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Communication</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Blog, archive, post, and published</p>
                  </list-item>
                  <list-item>
                    <p>Community, topic, advocate, and educators</p>
                  </list-item>
                  <list-item>
                    <p>Support, group, education, self-management, and wellness</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>Supplements/remedies</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>Minerals, raspberries, anti-inflammatory, and chromium</p>
                  </list-item>
                  <list-item>
                    <p>Herbs, natural, and alternative care</p>
                  </list-item>
                  <list-item>
                    <p>Multivitamin, probiotics, and selenium</p>
                  </list-item>
                </list>
              </td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup>CDC: Centers for Disease Control and Prevention.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>Themes and topics about diabetes differed in relation to overall prevalence of diabetes across US geographic divisions. Areas with high prevalence of diabetes, such as the East South Central and South Atlantic divisions, also had topics referencing unhealthy food (standardized beta range=0.073-0.146). However, research and exercise were most highly correlated with diabetes prevalence in the Northeast (standardized beta for research and exercise was .107 and .142, respectively).</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study reveals that (1) there is variation in what people post on Twitter about diabetes and (2) topics vary by county-level prevalence of diabetes. Unhealthy food–related topics were positively associated with high prevalence of diabetes; conversely, topics about research were negatively correlated with the prevalence of diabetes. The causal directions of these associations, if any, are unclear, but the results suggest opportunities to target online health messages relative to the prevalence of the disease.</p>
        <p>This growing body of research utilizing social media platforms to explore public health topics may be helpful for targeting specific patient populations for public health messaging via appropriate language and message content. The ability to relate to different patient populations based on language can better align public health professionals and patients [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Subpopulations of patients, based on geography, disease severity, or other factors, may use different synonyms or metaphors for symptoms not known to the general public or health professionals. Local health care organizations and professionals could, for example, utilize language common to a particular geographic area with high prevalence of diabetes to target healthy messaging on social media and print media. These organizations may also utilize healthy messaging from other areas with low prevalence of diabetes to influence health behaviors. Large national organizations may also utilize regional differences in content and language to better personalize and position tweets within particular geographic contexts [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
        <p>Content may also be enhanced by tweet modifiers (eg, hashtags and emotion) shown to impact dissemination of cardiovascular health–related Twitter posts [<xref ref-type="bibr" rid="ref7">7</xref>]. Mining social media to find these nuances within a population posting about diabetes would be useful for outreach and message targeting. Furthermore, learning how different message types (ie, shocking or humorous) are related to gaining knowledge of serious health effects for particular health behaviors is crucial to influence behavior change [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>This study has several limitations. Twitter users are not nationally representative, and tweets are not a direct proxy for all person-to-person communication. Tweets are short, and content is presumably what users are eager to share broadly (vs what they may be focused on privately). Nevertheless, tweets offer a window into public discourse about diabetes. This study also has strengths: it starts from an enormous sample of tweets, systematically addresses their content via machine learning techniques, and associates that content with disease prevalence. In doing so, it advances our understanding of public perceptions of diabetes.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study demonstrates that the language used to discuss diseases is variable and complex. Systematic assessment of social media about posts on diabetes could suggest targets for promoting healthy lifestyles and behaviors.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">LDA</term>
          <def>
            <p>Latent Dirichlet Allocation</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was supported by grant R01-HL1422457 from the National Heart, Lung, and Blood Institute (RM)</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>HG, HAS, LU, AMB, FKB, NM, and RMM declare no conflicts of interest. DAA owns stock in Berkshire Hathaway. He is a partner in and part owner of VAL Health; and has received compensation and/or travel support for speaking, writing, or consulting from the following organizations: AFYA, MTS Health Partnership, Children’s Hospital of Philadelphia, University of Virginia, Salzburg Global Seminars, GlaxoSmithKline (GSK), John F Kennedy Health System, Cosmetic Boot Camp, Meeting Designs, Capital Consulting, Healthcare Financial Management Association, Joslin Diabetes Center, National Academy of Medicine, the Commonwealth Fund, Massachusetts Medical Society, Endocrine Society, Osteoarthritis research society international, Baystate Medical Center, Weill-Cornell Medical College, Association of American Medical Colleges, Technology, Entertainment, Design(TED) Medical (MED), National Alliance of Health Care Purchaser Coalitions, Deloitte, Harvard University, American Association for Physician Leadership, Brandeis University, University of Rochester, Partner’s Health Care System, John Dolan Lectureship, Johns Hopkins University, and MITRE.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moorhead</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Hazlett</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Harrison</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Irwin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hoving</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A new dimension of health care: systematic review of the uses, benefits, and limitations of social media for health communication</article-title>
          <source>J Med Internet Res</source>
          <year>2013</year>
          <month>04</month>
          <day>23</day>
          <volume>15</volume>
          <issue>4</issue>
          <fpage>e85</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2013/4/e85/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.1933</pub-id>
          <pub-id pub-id-type="medline">23615206</pub-id>
          <pub-id pub-id-type="pii">v15i4e85</pub-id>
          <pub-id pub-id-type="pmcid">PMC3636326</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gough</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hunter</surname>
              <given-names>RF</given-names>
            </name>
            <name name-style="western">
              <surname>Ajao</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Jurek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McKeown</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Barrett</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ferguson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McElwee</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>McCarthy</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kee</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Tweet for behavior change: using social media for the dissemination of public health messages</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2017</year>
          <month>03</month>
          <day>23</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>e14</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2017/1/e14/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.6313</pub-id>
          <pub-id pub-id-type="medline">28336503</pub-id>
          <pub-id pub-id-type="pii">v3i1e14</pub-id>
          <pub-id pub-id-type="pmcid">PMC5383801</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choudhury</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kiciman</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Characterizing Dietary Choices, Nutrition, and Language in Food Deserts via Social Media</article-title>
          <source>Proceedings of the 19th ACM Conference on Computer-Supported Cooperative Work &amp; Social Computing</source>
          <year>2016</year>
          <conf-name>CSCW'16</conf-name>
          <conf-date>February 27–March 2, 2016</conf-date>
          <conf-loc>San Francisco, USA</conf-loc>
          <fpage>1157</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.1145/2818048.2819956</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferrara</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Measuring emotional contagion in social media</article-title>
          <source>PLoS One</source>
          <year>2015</year>
          <volume>10</volume>
          <issue>11</issue>
          <fpage>e0142390</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0142390"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0142390</pub-id>
          <pub-id pub-id-type="medline">26544688</pub-id>
          <pub-id pub-id-type="pii">PONE-D-15-26611</pub-id>
          <pub-id pub-id-type="pmcid">PMC4636231</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Kern</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Dziurzynski</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lucas</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lakshmikanth</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Sneha</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Seligman</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Characterizing Geographic Variation in Well-Being Using Tweets</article-title>
          <source>Proceedings of the Seventh International AAAI Conference on Weblogs and Social Media</source>
          <year>2013</year>
          <conf-name>ICWSM'13</conf-name>
          <conf-date>July 8–11, 2013</conf-date>
          <conf-loc>Cambridge, Massachusetts</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sinnenberg</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>DiSilvestro</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Mancheno</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dailey</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tufts</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Buttenheim</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Barg</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Twitter as a potential data source for cardiovascular disease research</article-title>
          <source>JAMA Cardiol</source>
          <year>2016</year>
          <month>12</month>
          <day>1</day>
          <volume>1</volume>
          <issue>9</issue>
          <fpage>1032</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27680322"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamacardio.2016.3029</pub-id>
          <pub-id pub-id-type="medline">27680322</pub-id>
          <pub-id pub-id-type="pii">2556216</pub-id>
          <pub-id pub-id-type="pmcid">PMC5177459</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Kern</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Labarthe</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Jha</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dziurzynski</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Sap</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weeg</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Larson</surname>
              <given-names>EE</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Seligman</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Psychological language on Twitter predicts county-level heart disease mortality</article-title>
          <source>Psychol Sci</source>
          <year>2015</year>
          <month>02</month>
          <volume>26</volume>
          <issue>2</issue>
          <fpage>159</fpage>
          <lpage>69</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25605707"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/0956797614557867</pub-id>
          <pub-id pub-id-type="medline">25605707</pub-id>
          <pub-id pub-id-type="pii">0956797614557867</pub-id>
          <pub-id pub-id-type="pmcid">PMC4433545</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weeg</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Arango</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Using Twitter to measure public discussion of diseases: a case study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2015</year>
          <month>06</month>
          <day>26</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>e6</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2015/1/e6/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.3953</pub-id>
          <pub-id pub-id-type="medline">26925459</pub-id>
          <pub-id pub-id-type="pii">v1i1e6</pub-id>
          <pub-id pub-id-type="pmcid">PMC4763717</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <source>Nielsen</source>
          <year>2012</year>
          <month>04</month>
          <day>12</day>
          <access-date>2019-12-05</access-date>
          <comment>State of the Media: The Social Media Report 2012<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://blog.nielsen.com/nielsenwire/social/">http://blog.nielsen.com/nielsenwire/social/</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Duggan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brenner</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Pew Research Center</source>
          <year>2013</year>
          <month>02</month>
          <day>14</day>
          <access-date>2019-12-05</access-date>
          <publisher-loc>Washington, DC</publisher-loc>
          <publisher-name>Pew Internet and American Life Project</publisher-name>
          <comment>The Demographics of Social Media Users - 2012<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pewinternet.org/Reports/2013/social-media-users.aspx">http://www.pewinternet.org/Reports/2013/social-media-users.aspx</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Epstein</surname>
              <given-names>JO</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Xing</surname>
              <given-names>EP</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>A Latent Variable Model for Geographic Lexical Variation</article-title>
          <source>Proceedings of the 2010 Conference on Empirical Methods in Natural Language Processing</source>
          <year>2010</year>
          <conf-name>EMNLP'10</conf-name>
          <conf-date>October 9 - 11, 2010</conf-date>
          <conf-loc>Cambridge, MA</conf-loc>
          <fpage>1277</fpage>
          <lpage>87</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mislove</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Onnela</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenquist</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Understanding the Demographics of Twitter Users</article-title>
          <source>Proceedings of the Fifth International Conference on Weblogs and Social Media</source>
          <year>2011</year>
          <conf-name>ICWSM'11</conf-name>
          <conf-date>July 17-21, 2011</conf-date>
          <conf-loc>Barcelona, Catalonia, Spain</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benjamini</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hochberg</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Controlling the false discovery rate: a practical and powerful approach to multiple testing</article-title>
          <source>J R Stat Soc Series B Stat Methodol</source>
          <year>1995</year>
          <volume>57</volume>
          <issue>1</issue>
          <fpage>289</fpage>
          <lpage>300</lpage>
          <pub-id pub-id-type="doi">10.1111/j.2517-6161.1995.tb02031.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Latent dirichlet allocation</article-title>
          <source>Journal of Machine Learning Research</source>
          <year>2003</year>
          <volume>3</volume>
          <fpage>993</fpage>
          <lpage>1022</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmlr.org/papers/volume3/blei03a/blei03a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="book">
          <source>Crude and Age-Adjusted Rates of Diagnosed Diabetes per 100 Civilian, Non-Institutionalized Adult Population, United States, 1980-2014</source>
          <year>2015</year>
          <publisher-loc>Atlanta, GA</publisher-loc>
          <publisher-name>National Center for Health Statistics, Division of Health Interview Statistics</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Giorgi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sap</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Crutchley</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>DLATK: Differential Language Analysis ToolKit</article-title>
          <source>Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing</source>
          <year>2017</year>
          <conf-name>EMNLP'17</conf-name>
          <conf-date>September 7–11, 2017</conf-date>
          <conf-loc>Copenhagen, Denmark</conf-loc>
          <fpage>55</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/d17-2010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Karami</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dahl</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Turner-McGrievy</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kharrazi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Characterizing diabetes, diet, exercise, and obesity comments on Twitter</article-title>
          <source>Int J Inf Manag</source>
          <year>2018</year>
          <month>02</month>
          <volume>38</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijinfomgt.2017.08.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Semino</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Demjén</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Demmen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koller</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Payne</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hardie</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rayson</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The online use of Violence and Journey metaphors by patients with cancer, as compared with health professionals: a mixed methods study</article-title>
          <source>BMJ Support Palliat Care</source>
          <year>2017</year>
          <month>03</month>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>60</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25743439"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjspcare-2014-000785</pub-id>
          <pub-id pub-id-type="medline">25743439</pub-id>
          <pub-id pub-id-type="pii">bmjspcare-2014-000785</pub-id>
          <pub-id pub-id-type="pmcid">PMC5339544</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Reber</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Chon</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Tweeting as health communication: health organizations' use of Twitter for health promotion and public engagement</article-title>
          <source>J Health Commun</source>
          <year>2016</year>
          <volume>21</volume>
          <issue>2</issue>
          <fpage>188</fpage>
          <lpage>98</lpage>
          <pub-id pub-id-type="doi">10.1080/10810730.2015.1058435</pub-id>
          <pub-id pub-id-type="medline">26716546</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
