<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v4i4e37</article-id>
    <article-id pub-id-type="pmid">27836816</article-id>
    <article-id pub-id-type="doi">10.2196/medinform.6328</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Web-based Real-Time Case Finding for the Population Health Management of Patients With Diabetes Mellitus: A Prospective Validation of the Natural Language Processing–Based Algorithm With Statewide Electronic Medical Records</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Eysenbach</surname>
          <given-names>Gunther</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Pourmalek</surname>
          <given-names>Farshad</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Harrison</surname>
          <given-names>James</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1" equal-contrib="yes">
        <name name-style="western">
          <surname>Zheng</surname>
          <given-names>Le</given-names>
        </name>
        <degrees>BS</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4744-367X</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib2" equal-contrib="yes">
        <name name-style="western">
          <surname>Wang</surname>
          <given-names>Yue</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <xref rid="aff3" ref-type="aff">3</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-0981-935X</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3" equal-contrib="yes">
        <name name-style="western">
          <surname>Hao</surname>
          <given-names>Shiying</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7527-2460</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib4" equal-contrib="yes">
        <name name-style="western">
          <surname>Shin</surname>
          <given-names>Andrew Y</given-names>
        </name>
        <degrees>MD</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6713-0609</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib5">
        <name name-style="western">
          <surname>Jin</surname>
          <given-names>Bo</given-names>
        </name>
        <degrees>MS</degrees>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-9268-7134</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib6">
        <name name-style="western">
          <surname>Ngo</surname>
          <given-names>Anh D</given-names>
        </name>
        <degrees>MD, DrPH</degrees>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0593-8420</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib7">
        <name name-style="western">
          <surname>Jackson-Browne</surname>
          <given-names>Medina S</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0219-0744</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib8">
        <name name-style="western">
          <surname>Feller</surname>
          <given-names>Daniel J</given-names>
        </name>
        <degrees>BA</degrees>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-1258-7107</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib9">
        <name name-style="western">
          <surname>Fu</surname>
          <given-names>Tianyun</given-names>
        </name>
        <degrees>BS</degrees>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-8103-8841</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib10">
        <name name-style="western">
          <surname>Zhang</surname>
          <given-names>Karena</given-names>
        </name>
        <degrees>NA</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4065-2882</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib11">
        <name name-style="western">
          <surname>Zhou</surname>
          <given-names>Xin</given-names>
        </name>
        <degrees>MD</degrees>
        <xref rid="aff5" ref-type="aff">5</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-1395-7103</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib12">
        <name name-style="western">
          <surname>Zhu</surname>
          <given-names>Chunqing</given-names>
        </name>
        <degrees>MS</degrees>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0649-4403</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib13">
        <name name-style="western">
          <surname>Dai</surname>
          <given-names>Dorothy</given-names>
        </name>
        <degrees>BS</degrees>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-9778-198X</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib14">
        <name name-style="western">
          <surname>Yu</surname>
          <given-names>Yunxian</given-names>
        </name>
        <degrees>MD PhD</degrees>
        <xref rid="aff6" ref-type="aff">6</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-3394-9832</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib15">
        <name name-style="western">
          <surname>Zheng</surname>
          <given-names>Gang</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff3" ref-type="aff">3</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-5864-2944</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib16">
        <name name-style="western">
          <surname>Li</surname>
          <given-names>Yu-Ming</given-names>
        </name>
        <degrees>MD</degrees>
        <xref rid="aff5" ref-type="aff">5</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-1981-8120</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib17">
        <name name-style="western">
          <surname>McElhinney</surname>
          <given-names>Doff B</given-names>
        </name>
        <degrees>MD</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-7242-0934</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib18">
        <name name-style="western">
          <surname>Culver</surname>
          <given-names>Devore S</given-names>
        </name>
        <degrees>MM</degrees>
        <xref rid="aff7" ref-type="aff">7</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-5826-2079</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib19">
        <name name-style="western">
          <surname>Alfreds</surname>
          <given-names>Shaun T</given-names>
        </name>
        <degrees>MBA</degrees>
        <xref rid="aff7" ref-type="aff">7</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-1752-4823</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib20">
        <name name-style="western">
          <surname>Stearns</surname>
          <given-names>Frank</given-names>
        </name>
        <degrees>MHA</degrees>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-2049-9163</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib21">
        <name name-style="western">
          <surname>Sylvester</surname>
          <given-names>Karl G</given-names>
        </name>
        <degrees>MD</degrees>
        <xref rid="aff2" ref-type="aff">2</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-8559-0155</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib22">
        <name name-style="western">
          <surname>Widen</surname>
          <given-names>Eric</given-names>
        </name>
        <degrees>MHA</degrees>
        <xref rid="aff4" ref-type="aff">4</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-8999-4659</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib23" corresp="yes">
      <name name-style="western">
        <surname>Ling</surname>
        <given-names>Xuefeng Bruce</given-names>
      </name>
      <degrees>PhD</degrees>
      <xref rid="aff2" ref-type="aff">2</xref>
      <address>
        <institution>Stanford University</institution>
        <addr-line>S370 Grant Bldg</addr-line>
        <addr-line>Stanford, CA,</addr-line>
        <country>United States</country>
        <phone>1 650 427 9198</phone>
        <fax>1 650 723 1154</fax>
        <email>bxling@stanford.edu</email>
      </address>  
      <xref rid="aff6" ref-type="aff">6</xref>
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-5386-3884</ext-link></contrib>
    </contrib-group>
    <aff id="aff1">
      <sup>1</sup>
      <institution>Tsinghua University</institution>
      <addr-line>Beijing</addr-line>
      <country>China</country>
    </aff>
    <aff id="aff2">
      <sup>2</sup>
      <institution>Stanford University</institution>
      <addr-line>Stanford, CA</addr-line>
      <country>United States</country>
    </aff>
    <aff id="aff3">
      <sup>3</sup>
      <institution>Zhejiang University</institution>
      <addr-line>Hangzhou</addr-line>
      <country>China</country>
    </aff>
    <aff id="aff4">
      <sup>4</sup>
      <institution>HBI Solutions Inc</institution>
      <addr-line>Palo Alto, CA</addr-line>
      <country>United States</country>
    </aff>
    <aff id="aff5">
    <sup>5</sup>
    <institution>Tianjin Key Laboratory of Cardiovascular Remodeling and Target Organ Injury</institution>
    <institution>Pingjin Hospital Heart Center</institution>  
    <addr-line>Tianjin</addr-line>
    <country>China</country></aff>
    <aff id="aff6">
    <sup>6</sup>
    <institution>School of Medicine</institution>
    <institution>Zhejiang University</institution>  
    <addr-line>Hangzhou</addr-line>
    <country>China</country></aff>
    <aff id="aff7">
      <sup>7</sup>
      <institution>HealthInfoNet</institution>
      <addr-line>Portland, ME</addr-line>
      <country>United States</country>
    </aff>
    <author-notes>
      <corresp>Corresponding Author: Xuefeng Bruce Ling 
      <email>bxling@stanford.edu</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><season>Oct-Dec</season><year>2016</year></pub-date>
    <pub-date pub-type="epub">
      <day>11</day>
      <month>11</month>
      <year>2016</year>
    </pub-date>
    <volume>4</volume>
    <issue>4</issue>
    <elocation-id>e37</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>7</day>
        <month>7</month>
        <year>2016</year>
      </date>
      <date date-type="rev-request">
        <day>2</day>
        <month>8</month>
        <year>2016</year>
      </date>
      <date date-type="rev-recd">
        <day>1</day>
        <month>10</month>
        <year>2016</year>
      </date>
      <date date-type="accepted">
        <day>12</day>
        <month>10</month>
        <year>2016</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Le Zheng, Yue Wang, Shiying Hao, Andrew Y Shin, Bo Jin, Anh D Ngo, Medina S Jackson-Browne, Daniel J Feller, Tianyun Fu, Karena Zhang, Xin Zhou, Chunqing Zhu, Dorothy Dai, Yunxian Yu, Gang Zheng, Yu-Ming Li, Doff B McElhinney, Devore S Culver, Shaun T Alfreds, Frank Stearns, Karl G Sylvester, Eric Widen, Xuefeng Bruce Ling. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 11.11.2016.</copyright-statement>
    <copyright-year>2016</copyright-year>
    <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://medinform.jmir.org/2016/4/e37/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>Diabetes case finding based on structured medical records does not fully identify diabetic patients whose medical histories related to diabetes are available in the form of free text. Manual chart reviews have been used but involve high labor costs and long latency.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>This study developed and tested a Web-based diabetes case finding algorithm using both structured and unstructured electronic medical records (EMRs).</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>This study was based on the health information exchange (HIE) EMR database that covers almost all health facilities in the state of Maine, United States. Using narrative clinical notes, a Web-based natural language processing (NLP) case finding algorithm was retrospectively (July 1, 2012, to June 30, 2013) developed with a random subset of HIE-associated facilities, which was then blind tested with the remaining facilities. The NLP-based algorithm was subsequently integrated into the HIE database and validated prospectively (July 1, 2013, to June 30, 2014).</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>Of the 935,891 patients in the prospective cohort, 64,168 diabetes cases were identified using diagnosis codes alone. Our NLP-based case finding algorithm prospectively found an additional 5756 uncodified cases (5756/64,168, 8.97% increase) with a positive predictive value of .90. Of the 21,720 diabetic patients identified by both methods, 6616 patients (6616/21,720, 30.46%) were identified by the NLP-based algorithm before a diabetes diagnosis was noted in the structured EMR (mean time difference = 48 days).</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>The online NLP algorithm was effective in identifying uncodified diabetes cases in real time, leading to a significant improvement in diabetes case finding. The successful integration of the NLP-based case finding algorithm into the Maine HIE database indicates a strong potential for application of this novel method to achieve a more complete ascertainment of diagnoses of diabetes mellitus.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>electronic medical record</kwd>
      <kwd>natural language processing</kwd>
      <kwd>diabetes mellitus</kwd>
      <kwd>data mining</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Diabetes mellitus (DM) is a leading cause of mortality and morbidity and accounts for significant burden of disease worldwide [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. In the United States, 9.3% of the population or 29.1 million people were reported to have diabetes in 2013, plus an estimate of 8.1 million people with undiagnosed diabetes [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Diabetes is a metabolic disorder caused by a high concentration of glucose in the blood stream. If untreated, diabetic patients will eventually develop a range of complications. Diabetes complications can be prevented through timely application of several measures such as lifestyle modification and control of blood glucose and blood pressure for diabetic patients [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>].</p>
      <p>The identification of persons with diagnosed DM in electronic medical records (EMRs) is essential to quality improvement initiatives, clinical decision support systems, and regional disease prevalence estimates used by public health departments. Although DM diagnoses have typically been captured by International Classification of Diseases (ICD) codes and stored in EMRs, previous studies found that diagnostic codes alone do not adequately represent DM diagnoses across a population, resulting in underestimates of disease prevalence and challenging the development of electronic approaches to clinical management [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. The prevalence of DM in 2014 in Maine was 7.8%, whereas the codified prevalence is 6.8% in our database. It indicates a gap caused by uncodified DM in the structured EMRs of patients. Diabetic patients who have received little or no diabetes care are unlikely to be associated with a diabetes-specific diagnosis code for billing, as are patients who transfer their care between multiple unaffiliated health care systems but receive no DM care for some time. To overcome this shortcoming, manual chart reviews of unstructured clinical notes have been used to identify uncodified DM cases. However, this method involves high labor costs and long latency, which has limited use for large scale datasets [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      <p>One possible solution to the problem and a fully automated alternative and acceptable means of delivering cost-effective case finding is the use of natural language processing (NLP), a Web-based technique. NLP has increasingly been used to enhance case finding for some high-impact chronic diseases such as heart failure and cancer through analyzing narrative text in EMRs [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. The advantage of the automated NLP-based case finding algorithm is that it allows for the rapid real-time identification of uncodified diagnoses from large datasets. It also allows for the rapid preprocessing of unstructured clinical notes for different diseases and clinical conditions before a diagnosis is selected [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. However, the existing NLP applications are mainly based on a small sample of patients with a limited number of clinical notes. Currently, the application of NLP in public health and medicine faces the following challenges [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]: (1) a lack of a comprehensive knowledge base to generate the accumulated domain knowledge from the targeted patient population; (2) a lack of a comprehensive data model to encapsulate the unstructured clinical notes of various formats across different health care facilities; (3) and a lack of a robust and scalable analytics pipeline to process a large number of EMR notes across statewide health care facilities.</p>
      <p>The aim of this study was therefore to develop and integrate an online real-time NLP-based DM case finding algorithm into the health information exchange (HIE) care flow in the state of Maine, United States (<xref ref-type="fig" rid="figure1">Figure 1</xref>). We hypothesized that the algorithm we developed could find additional patients with DM who were not identified by codified diagnoses in structured EMRs. This algorithm was built on a knowledge base that incorporates taxonomies and controlled vocabularies encoding domain knowledge, as well as the task-oriented characteristics of clinical notes. It also used both structured and unstructured information and data available in EMRs, which were treated as variables for statistical learning in identification of uncodified DM diagnoses.</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>A schematic presentation of the natural language processing (NLP)–based algorithm integrated into the statewide diabetes mellitus case finding and surveillance. The clinical note was preprocessed and identified to generate the decision. The knowledge bases, statistical model, and the gold standard datasets form the basis of the NLP engine. ICD: International Classification of Diseases; NLM: US National Library of Medicine; MeSH: Medical Subject Headings; EMR: electronic medical record; HIE: health information exchange; PPV: positive predictive value. SNOMED CT: Systematized Nomenclature of Medicine – Clinical Terms.</p>
        </caption>
        <graphic xlink:href="medinform_v4i4e37_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethics Statements</title>
        <p>Protected personal health information was removed for the purpose of this research. Because this study analyzed deidentified data, it was exempted from ethics review by the Stanford University Institutional Review Board (October 16, 2014).</p>
      </sec>
      <sec>
        <title>Data Sources</title>
        <p>Data for this study were extracted from the HIE dataset administered by HealthInfoNet—an independent nonprofit organization. The dataset contains records of nearly 95% of the population in the state of Maine. There are 35 HIE-associated hospitals, 34 federally qualified health centers, and more than 400 ambulatory practices [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. To identify the DM cohort, clinical notes of all categories in the Maine HIE EMR database were analyzed. Clinical notes are also known as progress notes, which are the part of a medical record where health care professionals document the details of a patient's clinical status or achievements during the course of inpatient care or outpatient care. Clinical notes in our study are encounter based. These notes were divided into 2 subcohorts. The retrospective cohort contained 1,385,280 notes representing 1,129,952 patients covering the period from July 1, 2012, to June 30, 2013, and the prospective cohort comprised 982,211 clinical notes representing 935,891 patients recorded from July 1, 2013, to June 30, 2014 (<xref ref-type="fig" rid="figure2">Figure 2</xref>). Clinical notes were derived from more than 100 different types of clinical reports, including history or physical reports, discharge summaries, and emergency reports.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Cohort construction of the study. ICD9: International Classification of Diseases, Ninth Revision; DM: diabetes mellitus; MDS: multidimensional scaling.</p>
          </caption>
          <graphic xlink:href="medinform_v4i4e37_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Algorithm Overview</title>
        <p>The patients with DM were defined as those who had DM noted as either primary or secondary diagnosis (International Classification of Diseases, Ninth Revision, Clinical Modification, ICD-9-CM, codes: 249, 249.x, 249.xx, 250, 250.x, and 250.xx) in their medical records [<xref ref-type="bibr" rid="ref24">24</xref>]. The case finding algorithm consisted of 3 sequential steps based on both structured and unstructured EMR information (<xref ref-type="fig" rid="figure1">Figure 1</xref>). The first step involved a preprocessing of unstructured clinical notes to remove information indicating the patient did not have DM, such as family history of DM and negation (ie, the patient denied DM). This step removed the misleading information to avoid false-positive errors, thus improving the performance of subsequent steps. The second step entailed a feature extraction that mapped DM risk factors recognized in previous studies [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref29">29</xref>], medications extracted from Unified Medical Language System, and NLP terms into the structured metadata. In the third step, a decision tree–based model based on the retrospective cohort was developed to determine whether a patient had DM. The development procedures are detailed in later sections. To support the whole algorithm pipeline, the NLP engine was created, including knowledge base, statistical models, and gold standard datasets as functional modules. Their construction and utilization are described below.</p>
      </sec>
      <sec>
        <title>Knowledge Base</title>
        <p>The knowledge base consisted of 3 cores: (1) DM-related clinical terms as the controlled vocabularies; (2) antidiabetic medications; and (3) extracted rules in the clinical notes.</p>
        <p>Clinical terms in our NLP knowledge base were derived from the following sources: (1) the description and synonyms of ICD-9-CM codes under 249, 249.x, 249.xx, 250, 250.x, and 250.xx; (2) the comprehensive clinical terminologies within SNOMED CT (Systematized Nomenclature of Medicine – Clinical Terms) [<xref ref-type="bibr" rid="ref30">30</xref>]; (3) a mapping of ICD-9-CM with SNOMED CT proposed by the US National Library of Medicine (NLM) [<xref ref-type="bibr" rid="ref31">31</xref>], based on the concepts and synonyms mapped to ICD codes 249, 249.x, 249.xx, 250, 250.x, and 250.xx; (4) the headings returned by the query of “diabetes” using NLM for article indexing [<xref ref-type="bibr" rid="ref32">32</xref>] in a controlled vocabulary thesaurus, namely, Medical Subject Headings (MeSH). These clinical terms in the knowledge base were further tokenized, combined, and filtered to derive our controlled vocabulary of single and dual tokens. If those controlled vocabularies contained stop words, for example, “the,” “a,” “of,” provided by the text mining (tm) package (R Development Core Team) [<xref ref-type="bibr" rid="ref33">33</xref>], they were removed. In total, 742 final NLP terms were identified (<xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>); of these, 72 were found to be significantly associated with DM diagnosis (Mann-Whitney test <italic>P</italic> value &#60;.05) in the retrospective cohort. Here, the patients who were assigned any of the ICD-9-CM codes 249, 249.x, 249.xx, 250, 250.x, 250.xx during the encounter were defined as having a diagnosis of DM.</p>
        <p>Antidiabetic medications were identified from the Unified Medical Language System database. Out of 36 medications analyzed, 22 were found to be significantly associated with DM diagnosis (Mann-Whitney test <italic>P</italic> value &#60;.05) in the retrospective cohort.</p>
        <p>Because information on DM risk factors (eg, body mass index or BMI, high blood pressure, obesity, smoking history, and alcohol use disorders) might be presented in multiple unstructured formats in EMRs, we developed a series of regular expressions and rules to unify unstructured information and subsequently standardize feature categories. For example, BMI could be available from clinical notes, but in many instances only height and weight were provided. The BMI was then divided into 4 categories: underweight, normal, overweight, and obesity, according to the World Health Organization classification [<xref ref-type="bibr" rid="ref34">34</xref>]. Additionally, to make the knowledge base more compatible with the expression of clinical notes, it was updated iteratively along with development of the retrospective model.</p>
      </sec>
      <sec>
        <title>Preprocessing and Feature Extraction</title>
        <p>Intuitively, DM-related words in the notes can be used to classify a DM case. However, this simpleminded note-processing method ignores negative expressions, for example, “The patient denied DM” in the note. Obviously, such negation will mislead the algorithm to wrongly classify the patient as a DM case. To avoid this kind of error, negation should be handled first before being fed into the pipeline. Preprocessing to remove family DM history is done because of similar considerations: the note with sentence “his mother had diabetes mellitus” does not classify the corresponding patient, “he,” as a diabetic patient. To ensure NLP specificity, segments associated with negation and family history of DM as described above were removed during preprocessing according to the entries in the knowledge base. The vocabulary of negation was populated using the lexicon proposed by NegEX [<xref ref-type="bibr" rid="ref35">35</xref>]. The family-related words [<xref ref-type="bibr" rid="ref36">36</xref>] were used to initiate the vocabulary of family history.</p>
        <p>To break narrative text in clinical notes into smaller pieces, we applied the text semantics. A note was collapsed into paragraphs, sentences, and lines as basic units with nonoverlapping contents. Criteria to define a basic unit were developed on statistics of the text lengths and newline characters. If a paragraph (or a sentence, a line) satisfied criteria of a basic unit, it was regarded as one segment without further decomposition. The parts of speech were annotated and referred for sentence boundary detection against the confusion between periods and decimal points using openNLP (R Development Core Team) [<xref ref-type="bibr" rid="ref33">33</xref>]. When a segment contained a word or a phrase in the vocabularies associated with negation and family history, this segment was removed from the note.</p>
        <p>To map the unstructured text into structured metadata, the knowledge base was applied to the standardized clinical notes after preprocessing. When matching the text with the NLP terms and medications in the knowledge base was successful, the structured data of the notes were coded as “1,” otherwise as “0.” Then DM risk factors were extracted to further enrich the clinical notes metadata using the rules and regular expressions stored in the knowledge base.</p>
      </sec>
      <sec>
        <title>Workflow of Gold Standard Dataset</title>
        <p>Gold standard datasets were created for model development and validation purposes (<xref ref-type="fig" rid="figure2">Figure 2</xref>). The datasets contained a subset of patients with or without DM. The patient DM status was determined by manual chart reviews of clinical notes conducted by 2 physician-curators. If a patient had any notes showing DM diagnosis, he or she was coded as having DM. The 2 physicians reviewed each note individually and assessed whether the note showed the presence of DM. After individual review, the 2 assessments for each note were compared. Any disagreement was discussed by the 2 physicians and an agreement was reached [<xref ref-type="bibr" rid="ref37">37</xref>]. When there was a disagreement on diagnosis that could not be resolved by discussion between the 2 curators, the patient was excluded. The datasets created through this process were used as the gold standard to define the cutoff point, run the blind testing, or to validate our NLP-based case finding algorithm. The cohort construction of the gold standard datasets is shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>.</p>
      </sec>
      <sec>
        <title>Model Development</title>
        <p>A model was developed on the retrospective cohort (<xref ref-type="fig" rid="figure2">Figure 2</xref>). The clinic’s facilities where clinical notes were derived were randomly allocated to 1 of the 2 subsets: one for training and for finding the cutoff point (n=17 facilities) and the other for blind testing (n=18 facilities). Within the subsets for training and finding the cutoff point, all available notes (n=44,368) with codified DM diagnoses, and an equal number of uncodified notes (n=44,368), were selected to construct a training subcohort for model development. In the remaining uncodified subset, a gold standard dataset was constructed by randomly selecting 100 positive (DM) patients and 500 negative (non-DM) patients as the subcohort for finding the cutoff point. A further random sample of 100 positive and 500 negative patients identified from uncodified notes in the blind testing subset were selected to construct the blind testing subcohort.</p>
        <p>By feeding the training subcohort to the preprocessing and feature extraction, each note had a feature vector denoted as <italic>f</italic>. The identification of DM was stated as maximum a posteriori probability (MAP) estimation in <xref ref-type="fig" rid="figure3">Figure 3</xref> (a), where <italic>DM</italic> was a binary random variable indicating whether the sample had a DM diagnosis (<italic>DM</italic>=1). To take diagnosis codes into consideration, a binary variable <italic>ICD</italic> was introduced to indicate whether a note was codified (<italic>ICD</italic>=1). By inserting <italic>ICD</italic> into the posterior and then applying the Bayesian rule, we had the decomposition in <xref ref-type="fig" rid="figure3">Figure 3</xref> (b).</p>
        <p>Because the assignment of diagnosis code was independent of the extracted feature, the model was simplified to the equation in <xref ref-type="fig" rid="figure3">Figure 3</xref> (c).</p>
        <p>The first term on the right side determined the probability of DM for a codified note, while the second term on the right side for an uncodified note. As coding information was known, we had 2 branches to obtain the posterior a shown in <xref ref-type="fig" rid="figure3">Figure 3</xref> (d).</p>
        <p>The great majority of uncodified notes did not include a DM diagnosis, while most DM codified notes were ICD-9-CM DM diagnoses. This led us to develop the following class labeling method:</p>
        <p>1. If a note is codified, this note should have a diagnosis of DM (<xref ref-type="fig" rid="figure3">Figure 3</xref> (e));</p>
        <p>2. If a note is not codified, a model should be built to estimate the probability (<xref ref-type="fig" rid="figure3">Figure 3</xref> (f)).</p>
        <p>As a result, the inference of DM diagnosis for a codified note was only dependent on the ICD code noted in the structured data, whereas for uncodified notes we trained a random forest model [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref38">38</xref>] to obtain T(<italic>f</italic>) (<xref ref-type="fig" rid="figure3">Figure 3</xref> (g)), where <italic>t</italic><sub>n</sub> was the <italic>n</italic> th decision tree in the random forest.</p>
        <p>At the perspective of hierarchical tree, the model could be considered as a combination of a predetermined tree-based model and a random forest-based model. The predetermined tree was developed based on the ICD-9-CM diagnosis codes associated with DM, which represented human prior knowledge. The random forest-based model was developed by extracting information from clinical notes, which represented machine learning knowledge.</p>
        <p>The model was first trained with codified notes, the DM-positive sample, and uncodified notes, the DM-negative sample. The false positives in the training sample were uncodified notes either with or without a DM diagnosis. The former was regarded as the positive sample in the next round of training. By applying the 2 steps iteratively, the model as well as the knowledge base associated with the expression of family history and negation was fine-tuned. All false-positive cases were reviewed manually to understand how these occurred.</p>
        <p>This codified-note–driven iterative training scheme was based on the hypothesis that the notes’ features should be similar between codified notes and uncodified notes where a DM diagnosis was found. To test this hypothesis and validate the method, multidimensional scaling (MDS) plots were constructed with 1000 samples randomly selected from the training subcohort to illustrate the distribution of notes.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Equations describing the modeling process of the natural language processing (NLP)–based algorithm.</p>
          </caption>
          <graphic xlink:href="medinform_v4i4e37_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Patient Classification Cutoff Point Determination</title>
        <p>As the algorithm was developed to find out uncodified DM cases, the proportion of true positives among the identified samples, positive predictive value (PPV), was the most important indicator of performance. With a PPV of ≥90%, the proportion of false-positive cases is less than 10%. On the other hand, given that the method was to identify uncodified cases in addition to the codified cases, maintaining a high level of PPV at the expense of sensitivity is acceptable. The way we located the optimal cutoff by considering the trade-off between PPV and sensitivity was also presented in a previous NLP study [<xref ref-type="bibr" rid="ref39">39</xref>]. Given that our algorithm assigned a classification probability to each subject, we aimed to find an optimal cutoff point to achieve the maximum classification sensitivity with a predefined PPV of 90%. To achieve a 90% PPV, the classification specificity can be calculated through a linear formula, thus forming a straight line overlaid on the receiver operating characteristic (ROC) curve. The combination of sensitivity and specificity in the region above the line allowed for a performance with &#62;90% PPV. Thus, the cutoff point was set at the first intersection between the line and the ROC curve.</p>
        <p>At the final stage of the retrospective model development, the case finding algorithm was blind tested on patients from health care facilities that were not included in the training subset.</p>
      </sec>
      <sec>
        <title>Prospective Case Finding and Validation</title>
        <p>Our NLP-based DM case finding algorithm was then deployed online through integration into the HIE real-time population exploration dashboard system. The clinical notes (N=982,211) covering the period from July 1, 2013, to June 30, 2014, were aggregated for prospective validation of the algorithm. An independent gold standard dataset was constructed based on chart reviews of clinical notes of 200 patients with DM and 1000 patients without DM randomly selected from the prospective cohort (<xref ref-type="fig" rid="figure2">Figure 2</xref>). The prospective classification performance on the gold standard dataset was evaluated using the following parameters: PPV, sensitivity, specificity, negative predictive value (NPV), and the area under the ROC curve. A total of 200 samples were further randomly selected from the uncodified DM cases identified by the algorithm to evaluate the case finding accuracy on the entire prospective cohort. On the basis of the longitudinal records of both clinical notes and diagnosis codes for each patient in the HIE EMR database, a temporal comparison of the 2 sources was analyzed.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Case Finding Algorithm Performance</title>
        <p>An MDS plot was constructed to visualize the classification performance. As shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>, out of 500 uncodified notes, 2 were classified as DM diagnosis. A closer examination revealed that these “false-positive” cases had notes with genuine diagnosis of DM. This MDS plot indicated that (1) our model effectively differentiated the notes from those patients with DM diagnosis and those without DM diagnosis and (2) our NLP-based analysis of clinical notes can identify uncodified notes with diagnosis of DM.</p>
        <p><xref ref-type="fig" rid="figure4">Figure 4</xref> shows that more than 99% of the uncodified notes were linked to patients without DM diagnosis and more than 99% of the codified notes were linked to patients with DM diagnosis. There were only 1% mislabeled samples in the training dataset, which did not alter the model performance [<xref ref-type="bibr" rid="ref40">40</xref>].</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>The multidimensional scaling (MDS) plots of the training result. This analysis was aimed at detecting meaningful underlying dimensions, for example, 1 and 2, which allow the explanation of the observed similarities (distances) between the investigated subjects. The axes of the MDS plots represent no real sizes and thus were marked as dimension 1 and dimension 2 without units. The red dots and blue triangles, indicating the positive and negative samples, were clearly separated. The “false positives” are circled in the plot. Chart reviews showed that these were notes with a genuine diagnosis of diabetes mellitus.</p>
          </caption>
          <graphic xlink:href="medinform_v4i4e37_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Diabetes Mellitus Discriminant Variables</title>
        <p>A total of 100 DM discriminant features were retained in the final model, including demographics (n=2), risk factors (n=5), clinical history (n=1), medications (n=20), and NLP-extracted clinical terms (n=72; <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>). <xref ref-type="fig" rid="figure5">Figure 5</xref> shows the top 30 features ranked by their importance in the model. The importance of each feature was rated according to the mean decrease in algorithm accuracy scaled by standard deviation after randomly permuting the variable values. A higher mean decrease in accuracy (node impurities from splitting on the variables; specifically, the node impurity is measured by the Gini index) corresponds to greater importance of the feature [<xref ref-type="bibr" rid="ref40">40</xref>]. Among the top 30 features, “diabetes” and “type 2,” which directly indicate DM, were the top 2 features, followed by age, an important predictor of DM [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>], and then “metformin,” a first-line antidiabetic drug. The remaining important discriminant features were high blood pressure, cigarette smoking, history of alcohol use, BMI, and “obesity.”</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>List of the top 30 clinical variables included in the diabetes mellitus natural language processing (NLP)–based model. BMI: body mass index.</p>
          </caption>
          <graphic xlink:href="medinform_v4i4e37_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Patient Classification Cutoff Point Determination</title>
        <p>The decision tree–based classification scores were evaluated to determine a cutoff point that allows maximal sensitivity with a ≥90% PPV (<xref ref-type="app" rid="app2">Multimedia Appendix 2</xref>). With this cutoff value (set as .618), the continuous classification scoring outputs were converted to reach a binary decision to identify genuine DM cases.</p>
      </sec>
      <sec>
        <title>Retrospective Blind Testing</title>
        <p>As shown in <xref ref-type="fig" rid="figure6">Figure 6</xref>, in the retrospective blind testing, our NLP-based analysis achieved a 95.4% (62/65) PPV, 62.0% (62/100) sensitivity, 99.4% (497/500) specificity, and 92.9% NPV (497/535). The blind testing results indicate that the knowledge acquired from some hospital facilities could be leveraged to allow prediction in others (eg, learning transfer) [<xref ref-type="bibr" rid="ref43">43</xref>].</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Performance evaluation of the proposed case finding algorithm. Top: the contingency tables on blind test and prospective gold standard datasets. Middle: the positive predictive value (PPV), negative predictive value (NPV), sensitivity, and specificity of the validation based on the retrospective blind testing subcohort and prospective cohort. Bottom: the prospective case finding results in the total population. DM: diabetes mellitus; GS: gold standard; ICD-9-CM: International Classification of Diseases, Ninth Revision, Clinical Modification; NLP: natural language processing.</p>
          </caption>
          <graphic xlink:href="medinform_v4i4e37_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Prospective Validation</title>
        <p>The prospective performance of the algorithm was explored by chart review over a gold standard dataset consisting of randomly selected 200 patients with DM and 1000 patients without DM in the uncodified subcohort (<xref ref-type="fig" rid="figure2">Figure 2</xref>). The PPV was 90.1% (136/151), which was within the 95% CI of the retrospective blind testing PPV (87.3%-98.4%). The sensitivity was 68.0% (136/200). The specificity, NPV, and area under ROC curve were 98.50% (985/1000), 93.90% (985/1049), and .929, respectively (<xref ref-type="fig" rid="figure6">Figure 6</xref>).</p>
        <p>The algorithm was deployed to allow real-time DM case finding on the entire prospective cohort. A total of 64,168 patients with DM were identified from codified DM diagnosis, while our NLP-based algorithm identified an additional 5756 patients, resulting in an 8.97% (5756/64,168) increase in the total patients with DM during the study period. To further explore the case finding accuracy, we randomly selected 200 samples from the 5756 samples. Manual review showed that of the 200 samples there were 183 DM cases and 17 normal patients, resulting in an accuracy of 91.5% (183/200). Such accuracy was above the predetermined PPV (90%) in the calibration phase and was within the 95% CI of the retrospective blind testing PPV (87.3%-98.4%). The consistency of performance shows that it is reasonable to use the results obtained on smaller samples to reflect the performance of the algorithm on a large population.</p>
      </sec>
      <sec>
        <title>Temporal Comparison</title>
        <p>The time point when a patient’s first DM diagnosis was identified by ICD codes was evaluated and compared with the time point when the DM was identified by NLP case finding algorithm. Out of 21,720 patients with DM identified by both methods, 6616 patients (6616/21,720, 30.46%) were identified by the NLP-based algorithm before a DM ICD code was noted in the medical record (mean time difference = 48 days). In particular, 19.86% (1314/6616) of patients were identified by NLP case finding 3 months or more before they were identified by a DM ICD code (<xref ref-type="app" rid="app3">Multimedia Appendix 3</xref>).</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>To the best of our knowledge, this is the first online deployment of a real-time NLP-based case finding method for DM, using both patients’ structured (eg, codified diagnosis) and unstructured (free text) clinical histories from a statewide EMR database. Consistent with our hypothesis, during a 1-year period (from July 1, 2013, to June 30, 2014), our algorithm identified 5756 additional patients with DM (an 8.97% increase in the total patients with DM) who were otherwise left undiagnosed when only code-based case finding was applied. Our finding indicates that the proportion of false negatives decreased using the NLP-based approach compared with the existing ICD-based approach (<italic>P</italic>&#60;.01). Many patients with DM who were misclassified as patients without DM by the code-based case finding were correctly identified by our NLP text searching algorithm, resulting in a more complete ascertainment of DM diagnoses.</p>
        <p>There exist several reasons why patients with diagnosed DM may have not been associated with a DM diagnosis code. Among the uncodified DM patients we identified, 30% had DM noted as secondary, discharged, or other types of diagnosis and 63% had a history of diabetes in clinical records. A possible reason for missing diagnostic codes in those cases might be that if a patient was admitted to the hospital owing to more acute or life-threatening clinical conditions, information related to DM was overlooked when ICD coding was conducted. Therefore, there is a strong need for enhancing the current ICD coding practice in hospitals and other health care facilities in the state of Maine to ensure that all DM diagnoses noted in the patients’ medical records are coded.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>Although several standardized coding systems (eg, ICD, Logical Observation Identifiers Names and Codes) have been used to record diagnoses, procedures, laboratory tests, and medications associated with each patient encounter, a large amount of information related to patients’ clinical histories were also available in the form of unstructured free text in EMRs. In addition to the terms directly describing DM (eg, “diabetic,” “type 1,” “diabetes mellitus”), our NLP algorithm was able to obtain more complete medical histories based on information about risk factors and medications available from clinical notes. A range of conventional DM risk markers (eg, age, smoking, BMI, and blood pressure) [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref44">44</xref>-<xref ref-type="bibr" rid="ref46">46</xref>], emerging risk markers (eg, overweight) [<xref ref-type="bibr" rid="ref47">47</xref>], and antidiabetic drugs (eg, metformin) were identified and used to enhance DM case detection. In particular, metformin, the first-line medication for type 2 diabetes, appeared to be the most important drug in our feature selection process. These findings indicate that our algorithm effectively incorporated a variety of clinically relevant features, leading to a significant improvement in DM case finding in the population of the state of Maine.</p>
        <p>Another strength of our NLP case finding algorithm is the ability to find uncodified DM cases before the assignment of ICD-9-CM codes. The proposed DM case finding methodology used NLP algorithm in parallel with ICD-9-CM codes. In the prospective study, 69,924 patients with DM were identified. Among those 69,924 patients, 21,720 patients were able to be identified by both methods. That is, there were 21,720 DM patients having clinical notes that indicated they had DM. 30.46% (6616/21,720) of those patients had such clinical notes associated with an encounter earlier than the assignment of a DM diagnosis code, while 69.54% (15,104/21,720) of those patients had such clinical notes during the same encounter when a DM diagnosis code was given. Compared with using ICD-9-CM codes alone, the NLP algorithm was able to identify 30.46% (6616/21,720) of patients with DM at an earlier encounter, giving a mean time difference of 48 days. More importantly, a significant proportion of these patients (1314/6616, 19.86%) were identified 3 months or more before a DM diagnosis code was noted. For those patients, this time period is sufficient to initiate aggressive lifestyle interventions that have a long-term impact to delay progression and prevent complications of diabetes [<xref ref-type="bibr" rid="ref48">48</xref>]. Thus, this early detection capability is clearly an advantage of our DM NLP algorithm such that these high-risk individuals can be selected for timely initiation of targeted prevention, care, and treatment.</p>
        <p>We noted that there are some limitations in our study. First, although the use of statistical learning improved the performance of the case finding algorithm, it has inevitable misclassification errors. There were a couple of DM cases located close to the “borderline,” that is, the cutoff point for the algorithm to differentiate between DM cases and normal samples. The DM cases with outputs closed to the cutoff point for the algorithm were those who were susceptible to misclassification errors, compromising false negatives. DM cases at borderline represented DM patients with incomplete DM feature profile, that is, patients having no DM-related risk factors or medication records but having clinical notes confirming DM diagnosis, or patients having no DM-related risk factors or clinical notes but having medication records. Such incomplete profiles could mislead the algorithm. Second, the relatively small sample size of the “gold standard” dataset introduced the possibility that some relatively rare clinical phenotypes of DM—where clinicians documented diabetes in a nonstandard way—might not be accounted for during model training. Third, we were unable to identify whether the patients with DM found by the NLP algorithm were those with newly diagnosed DM or those with a long-standing diagnosis. Fourth, we acknowledge our case finding method’s limitation that it depends on the physician’s diagnosis of the disease and the documentation quality in clinical notes. Finally, the model was developed on the patient data in the state of Maine. Extra risk factors such as sociodemographic factors may need to be considered for adjustment purpose when this learning is transferred and applied to other geographic regions.</p>
      </sec>
      <sec>
        <title>A Web-based Identification Tool</title>
        <p>Our NLP algorithm has been deployed online through integration into the Maine State HIE workflow, currently allowing real-time statewide identification of patients with uncodified DM. It provides doctors, hospitals, and other providers in the state HealthInfoNet network with an effective online utility to achieve a more complete assessment of the DM burden in their location. Incorporating the DM case finding algorithm with the existing health care system makes the best use of information available in EMRs. Together with the previously successful integration of our other NLP case finding algorithms, including that for congestive heart failure [<xref ref-type="bibr" rid="ref14">14</xref>], there is a strong potential to expand the application of this novel method to enhance case finding for other diseases in Maine and other states in the United States and in other countries.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Our NLP-based DM case finding algorithm was developed and validated on a population-based dataset in the state of Maine. The results strongly support our hypothesis that the NLP-based algorithm could identify additional patients with DM to complement the existing ICD-code–based case finding method. Online real-time integration of our DM case finding algorithm into the Maine HIE workflow can enhance DM case detection and facilitate efforts toward timely initiation of targeted management and care for patients with DM. From the patient’s perspective, many patients with DM across the state of Maine, who were not identified from ICD codified diagnosis, would benefit from information we provide by being able to take initiatives to seek care and plan their personal strategies to monitor and control their diabetes status. In this regard, our online real-time DM case finding utility not only benefits all stakeholders including payers, providers, and policy makers in the Maine health care system, but also serves as a demonstrative Web-based project for future application to improve DM case finding for targeted care and treatment in other states and countries, making a contribution to alleviate the DM burden.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>A list of 100 discriminant features used by the final model as well as the feature importance, and a list of 742 natural language processing terms used by the initial modeling process.</p>
        <media xlink:href="medinform_v4i4e37_app1.pdf" xlink:title="PDF File (Adobe PDF File), 55KB"/>
      </app>
      <app id="app2">
        <title>Multimedia Appendix 2</title>
        <p>Determination of the cutoff point of the subject classification probabilities. Top: the receiver operating characteristic curve and the line determined by the prevalence and 90% positive predictive value were intersected at the cutoff point. Bottom: their intersection (dashed rectangle) is magnified and indicated by the circle.</p>
        <media xlink:href="medinform_v4i4e37_app2.pdf" xlink:title="PDF File (Adobe PDF File), 73KB"/>
      </app>
      <app id="app3">
        <title>Multimedia Appendix 3</title>
        <p>The distribution of patients by the time intervals between natural language processing–based diabetes mellitus identification and codified diagnosis.</p>
        <media xlink:href="medinform_v4i4e37_app3.pdf" xlink:title="PDF File (Adobe PDF File), 50KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BMI</term>
          <def>
            <p>body mass index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">DM</term>
          <def>
            <p>diabetes mellitus</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">EMR</term>
          <def>
            <p>electronic medical record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">HIE</term>
          <def>
            <p>health information exchange</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ICD</term>
          <def>
            <p>International Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">ICD-9-CM</term>
          <def>
            <p>International Classification of Diseases, Ninth Revision, Clinical Modification</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">MDS</term>
          <def>
            <p>multidimensional scaling</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">MeSH</term>
          <def>
            <p>Medical Subject Headings</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">NLM</term>
          <def>
            <p>US National Library of Medicine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">NPV</term>
          <def>
            <p>negative predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">PPV</term>
          <def>
            <p>positive predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">ROC</term>
          <def>
            <p>receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">SNOMED CT</term>
          <def>
            <p>Systematized Nomenclature of Medicine – Clinical Terms</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="con">
        <p>LZ, YW, SH, BJ, ADN, MJB, DJF, TF, KZ, XZ, YML, CZ, DD, YY, GZ, and DBM contributed to the analysis and interpretation of data; DSC and STA contributed to the data collection; and AYS, FS, KGS, EW, and XBL contributed to conception or design of the work. LZ, YW, and SH drafted the manuscript; LZ, YW, SH, BJ, ADN, MJB, DJF, TF, KZ, XZ, YML, CZ, DD, YY, GZ, DBM, DSC, STA, AYS, FS, KGS, EW, and XBL critically revised the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>The authors have the following interests: KGS, EW, and XBL are cofounders and equity holders of HBI Solutions, Inc, which is currently developing predictive analytics solutions for health care organizations. From the departments of pediatrics, surgery, and cardiothoracic surgery, Stanford University School of Medicine, Stanford, California, Zhejiang University School of Medicine and School of Management, Pingjin Hospital Heart Center, and Tsinghua University School of Electrical Engineering, LZ, YW, SH, AYS, KZ, XZ, YML, YY, GZ, DBM, KGS, and XBL conducted this research as part of a personal outside consulting arrangement with HBI Solutions, Inc. The research and research results are not, in any way, associated with these institutions. This does not alter the authors' adherence to all the journal policies on sharing data and materials, as detailed online in the guide for authors.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Murray</surname>
            <given-names>CJ</given-names>
          </name>
          <name name-style="western">
            <surname>Vos</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Lozano</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Naghavi</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Flaxman</surname>
            <given-names>AD</given-names>
          </name>
          <name name-style="western">
            <surname>Michaud</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Ezzati</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Shibuya</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Salomon</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Abdalla</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Aboyans</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Abraham</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Ackerman</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Aggarwal</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Ahn</surname>
            <given-names>SY</given-names>
          </name>
          <name name-style="western">
            <surname>Ali</surname>
            <given-names>MK</given-names>
          </name>
          <name name-style="western">
            <surname>Alvarado</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Anderson</surname>
            <given-names>HR</given-names>
          </name>
          <name name-style="western">
            <surname>Anderson</surname>
            <given-names>LM</given-names>
          </name>
          <name name-style="western">
            <surname>Andrews</surname>
            <given-names>KG</given-names>
          </name>
          <name name-style="western">
            <surname>Atkinson</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Baddour</surname>
            <given-names>LM</given-names>
          </name>
          <name name-style="western">
            <surname>Bahalim</surname>
            <given-names>AN</given-names>
          </name>
          <name name-style="western">
            <surname>Barker-Collo</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Barrero</surname>
            <given-names>LH</given-names>
          </name>
          <name name-style="western">
            <surname>Bartels</surname>
            <given-names>DH</given-names>
          </name>
          <name name-style="western">
            <surname>Basáñez</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Baxter</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Bell</surname>
            <given-names>ML</given-names>
          </name>
          <name name-style="western">
            <surname>Benjamin</surname>
            <given-names>EJ</given-names>
          </name>
          <name name-style="western">
            <surname>Bennett</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Bernabé</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Bhalla</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Bhandari</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Bikbov</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Bin</surname>
            <given-names>AA</given-names>
          </name>
          <name name-style="western">
            <surname>Birbeck</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Black</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Blencowe</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Blore</surname>
            <given-names>JD</given-names>
          </name>
          <name name-style="western">
            <surname>Blyth</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Bolliger</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Bonaventure</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Boufous</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Bourne</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Boussinesq</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Braithwaite</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Brayne</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Bridgett</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Brooker</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Brooks</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Brugha</surname>
            <given-names>TS</given-names>
          </name>
          <name name-style="western">
            <surname>Bryan-Hancock</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Bucello</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Buchbinder</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Buckle</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Budke</surname>
            <given-names>CM</given-names>
          </name>
          <name name-style="western">
            <surname>Burch</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Burney</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Burstein</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Calabria</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Campbell</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Canter</surname>
            <given-names>CE</given-names>
          </name>
          <name name-style="western">
            <surname>Carabin</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Carapetis</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Carmona</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Cella</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Charlson</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Cheng</surname>
            <given-names>AT</given-names>
          </name>
          <name name-style="western">
            <surname>Chou</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Chugh</surname>
            <given-names>SS</given-names>
          </name>
          <name name-style="western">
            <surname>Coffeng</surname>
            <given-names>LE</given-names>
          </name>
          <name name-style="western">
            <surname>Colan</surname>
            <given-names>SD</given-names>
          </name>
          <name name-style="western">
            <surname>Colquhoun</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Colson</surname>
            <given-names>KE</given-names>
          </name>
          <name name-style="western">
            <surname>Condon</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Connor</surname>
            <given-names>MD</given-names>
          </name>
          <name name-style="western">
            <surname>Cooper</surname>
            <given-names>LT</given-names>
          </name>
          <name name-style="western">
            <surname>Corriere</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Cortinovis</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>de Vaccaro</surname>
            <given-names>KC</given-names>
          </name>
          <name name-style="western">
            <surname>Couser</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Cowie</surname>
            <given-names>BC</given-names>
          </name>
          <name name-style="western">
            <surname>Criqui</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>Cross</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Dabhadkar</surname>
            <given-names>KC</given-names>
          </name>
          <name name-style="western">
            <surname>Dahiya</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Dahodwala</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Damsere-Derry</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Danaei</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Davis</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>De</surname>
            <given-names>LD</given-names>
          </name>
          <name name-style="western">
            <surname>Degenhardt</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Dellavalle</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Delossantos</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Denenberg</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Derrett</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Des Jarlais</surname>
            <given-names>DC</given-names>
          </name>
          <name name-style="western">
            <surname>Dharmaratne</surname>
            <given-names>SD</given-names>
          </name>
          <name name-style="western">
            <surname>Dherani</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Diaz-Torne</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Dolk</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Dorsey</surname>
            <given-names>ER</given-names>
          </name>
          <name name-style="western">
            <surname>Driscoll</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Duber</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Ebel</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Edmond</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Elbaz</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Ali</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Erskine</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Erwin</surname>
            <given-names>PJ</given-names>
          </name>
          <name name-style="western">
            <surname>Espindola</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Ewoigbokhan</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Farzadfar</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Feigin</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Felson</surname>
            <given-names>DT</given-names>
          </name>
          <name name-style="western">
            <surname>Ferrari</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Ferri</surname>
            <given-names>CP</given-names>
          </name>
          <name name-style="western">
            <surname>Fèvre</surname>
            <given-names>EM</given-names>
          </name>
          <name name-style="western">
            <surname>Finucane</surname>
            <given-names>MM</given-names>
          </name>
          <name name-style="western">
            <surname>Flaxman</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Flood</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Foreman</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Forouzanfar</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>Fowkes</surname>
            <given-names>FG</given-names>
          </name>
          <name name-style="western">
            <surname>Fransen</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Freeman</surname>
            <given-names>MK</given-names>
          </name>
          <name name-style="western">
            <surname>Gabbe</surname>
            <given-names>BJ</given-names>
          </name>
          <name name-style="western">
            <surname>Gabriel</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Gakidou</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Ganatra</surname>
            <given-names>HA</given-names>
          </name>
          <name name-style="western">
            <surname>Garcia</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Gaspari</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Gillum</surname>
            <given-names>RF</given-names>
          </name>
          <name name-style="western">
            <surname>Gmel</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Gonzalez-Medina</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Gosselin</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Grainger</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Grant</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Groeger</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Guillemin</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Gunnell</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Gupta</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Haagsma</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Hagan</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Halasa</surname>
            <given-names>YA</given-names>
          </name>
          <name name-style="western">
            <surname>Hall</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Haring</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Haro</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Harrison</surname>
            <given-names>JE</given-names>
          </name>
          <name name-style="western">
            <surname>Havmoeller</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Hay</surname>
            <given-names>RJ</given-names>
          </name>
          <name name-style="western">
            <surname>Higashi</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Hill</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Hoen</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Hoffman</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Hotez</surname>
            <given-names>PJ</given-names>
          </name>
          <name name-style="western">
            <surname>Hoy</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>JJ</given-names>
          </name>
          <name name-style="western">
            <surname>Ibeanusi</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Jacobsen</surname>
            <given-names>KH</given-names>
          </name>
          <name name-style="western">
            <surname>James</surname>
            <given-names>SL</given-names>
          </name>
          <name name-style="western">
            <surname>Jarvis</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Jasrasaria</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Jayaraman</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Johns</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Jonas</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Karthikeyan</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Kassebaum</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Kawakami</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Keren</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Khoo</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>King</surname>
            <given-names>CH</given-names>
          </name>
          <name name-style="western">
            <surname>Knowlton</surname>
            <given-names>LM</given-names>
          </name>
          <name name-style="western">
            <surname>Kobusingye</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Koranteng</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Krishnamurthi</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Laden</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Lalloo</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Laslett</surname>
            <given-names>LL</given-names>
          </name>
          <name name-style="western">
            <surname>Lathlean</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Leasher</surname>
            <given-names>JL</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>YY</given-names>
          </name>
          <name name-style="western">
            <surname>Leigh</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Levinson</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Lim</surname>
            <given-names>SS</given-names>
          </name>
          <name name-style="western">
            <surname>Limb</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>JK</given-names>
          </name>
          <name name-style="western">
            <surname>Lipnick</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Lipshultz</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Loane</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Ohno</surname>
            <given-names>SL</given-names>
          </name>
          <name name-style="western">
            <surname>Lyons</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Mabweijano</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>MacIntyre</surname>
            <given-names>MF</given-names>
          </name>
          <name name-style="western">
            <surname>Malekzadeh</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Mallinger</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Manivannan</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Marcenes</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>March</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Margolis</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Marks</surname>
            <given-names>GB</given-names>
          </name>
          <name name-style="western">
            <surname>Marks</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Matsumori</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Matzopoulos</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Mayosi</surname>
            <given-names>BM</given-names>
          </name>
          <name name-style="western">
            <surname>McAnulty</surname>
            <given-names>JH</given-names>
          </name>
          <name name-style="western">
            <surname>McDermott</surname>
            <given-names>MM</given-names>
          </name>
          <name name-style="western">
            <surname>McGill</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>McGrath</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Medina-Mora</surname>
            <given-names>ME</given-names>
          </name>
          <name name-style="western">
            <surname>Meltzer</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Mensah</surname>
            <given-names>GA</given-names>
          </name>
          <name name-style="western">
            <surname>Merriman</surname>
            <given-names>TR</given-names>
          </name>
          <name name-style="western">
            <surname>Meyer</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Miglioli</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Miller</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Miller</surname>
            <given-names>TR</given-names>
          </name>
          <name name-style="western">
            <surname>Mitchell</surname>
            <given-names>PB</given-names>
          </name>
          <name name-style="western">
            <surname>Mock</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Mocumbi</surname>
            <given-names>AO</given-names>
          </name>
          <name name-style="western">
            <surname>Moffitt</surname>
            <given-names>TE</given-names>
          </name>
          <name name-style="western">
            <surname>Mokdad</surname>
            <given-names>AA</given-names>
          </name>
          <name name-style="western">
            <surname>Monasta</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Montico</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Moradi-Lakeh</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Moran</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Morawska</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Mori</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Murdoch</surname>
            <given-names>ME</given-names>
          </name>
          <name name-style="western">
            <surname>Mwaniki</surname>
            <given-names>MK</given-names>
          </name>
          <name name-style="western">
            <surname>Naidoo</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Nair</surname>
            <given-names>MN</given-names>
          </name>
          <name name-style="western">
            <surname>Naldi</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Narayan</surname>
            <given-names>KM</given-names>
          </name>
          <name name-style="western">
            <surname>Nelson</surname>
            <given-names>PK</given-names>
          </name>
          <name name-style="western">
            <surname>Nelson</surname>
            <given-names>RG</given-names>
          </name>
          <name name-style="western">
            <surname>Nevitt</surname>
            <given-names>MC</given-names>
          </name>
          <name name-style="western">
            <surname>Newton</surname>
            <given-names>CR</given-names>
          </name>
          <name name-style="western">
            <surname>Nolte</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Norman</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Norman</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>O'Donnell</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>O'Hanlon</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Olives</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Omer</surname>
            <given-names>SB</given-names>
          </name>
          <name name-style="western">
            <surname>Ortblad</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Osborne</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Ozgediz</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Page</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Pahari</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Pandian</surname>
            <given-names>JD</given-names>
          </name>
          <name name-style="western">
            <surname>Rivero</surname>
            <given-names>AP</given-names>
          </name>
          <name name-style="western">
            <surname>Patten</surname>
            <given-names>SB</given-names>
          </name>
          <name name-style="western">
            <surname>Pearce</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Padilla</surname>
            <given-names>RP</given-names>
          </name>
          <name name-style="western">
            <surname>Perez-Ruiz</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Perico</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Pesudovs</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Phillips</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Phillips</surname>
            <given-names>MR</given-names>
          </name>
          <name name-style="western">
            <surname>Pierce</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Pion</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Polanczyk</surname>
            <given-names>GV</given-names>
          </name>
          <name name-style="western">
            <surname>Polinder</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Pope</surname>
            <given-names>CA</given-names>
          </name>
          <name name-style="western">
            <surname>Popova</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Porrini</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Pourmalek</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Prince</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Pullan</surname>
            <given-names>RL</given-names>
          </name>
          <name name-style="western">
            <surname>Ramaiah</surname>
            <given-names>KD</given-names>
          </name>
          <name name-style="western">
            <surname>Ranganathan</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Razavi</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Regan</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Rehm</surname>
            <given-names>JT</given-names>
          </name>
          <name name-style="western">
            <surname>Rein</surname>
            <given-names>DB</given-names>
          </name>
          <name name-style="western">
            <surname>Remuzzi</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Richardson</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Rivara</surname>
            <given-names>FP</given-names>
          </name>
          <name name-style="western">
            <surname>Roberts</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Robinson</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>De Leòn</surname>
            <given-names>FR</given-names>
          </name>
          <name name-style="western">
            <surname>Ronfani</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Room</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Rosenfeld</surname>
            <given-names>LC</given-names>
          </name>
          <name name-style="western">
            <surname>Rushton</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Sacco</surname>
            <given-names>RL</given-names>
          </name>
          <name name-style="western">
            <surname>Saha</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Sampson</surname>
            <given-names>U</given-names>
          </name>
          <name name-style="western">
            <surname>Sanchez-Riera</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Sanman</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Schwebel</surname>
            <given-names>DC</given-names>
          </name>
          <name name-style="western">
            <surname>Scott</surname>
            <given-names>JG</given-names>
          </name>
          <name name-style="western">
            <surname>Segui-Gomez</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Shahraz</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Shepard</surname>
            <given-names>DS</given-names>
          </name>
          <name name-style="western">
            <surname>Shin</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Shivakoti</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Singh</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Singh</surname>
            <given-names>GM</given-names>
          </name>
          <name name-style="western">
            <surname>Singh</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Singleton</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Sleet</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Sliwa</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>JL</given-names>
          </name>
          <name name-style="western">
            <surname>Stapelberg</surname>
            <given-names>NJ</given-names>
          </name>
          <name name-style="western">
            <surname>Steer</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Steiner</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Stolk</surname>
            <given-names>WA</given-names>
          </name>
          <name name-style="western">
            <surname>Stovner</surname>
            <given-names>LJ</given-names>
          </name>
          <name name-style="western">
            <surname>Sudfeld</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Syed</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Tamburlini</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Tavakkoli</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Taylor</surname>
            <given-names>HR</given-names>
          </name>
          <name name-style="western">
            <surname>Taylor</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Taylor</surname>
            <given-names>WJ</given-names>
          </name>
          <name name-style="western">
            <surname>Thomas</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Thomson</surname>
            <given-names>WM</given-names>
          </name>
          <name name-style="western">
            <surname>Thurston</surname>
            <given-names>GD</given-names>
          </name>
          <name name-style="western">
            <surname>Tleyjeh</surname>
            <given-names>IM</given-names>
          </name>
          <name name-style="western">
            <surname>Tonelli</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Towbin</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Truelsen</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Tsilimbaris</surname>
            <given-names>MK</given-names>
          </name>
          <name name-style="western">
            <surname>Ubeda</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Undurraga</surname>
            <given-names>EA</given-names>
          </name>
          <name name-style="western">
            <surname>van der Werf</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>van Os</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Vavilala</surname>
            <given-names>MS</given-names>
          </name>
          <name name-style="western">
            <surname>Venketasubramanian</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Watt</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Weatherall</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Weinstock</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Weintraub</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Weisskopf</surname>
            <given-names>MG</given-names>
          </name>
          <name name-style="western">
            <surname>Weissman</surname>
            <given-names>MM</given-names>
          </name>
          <name name-style="western">
            <surname>White</surname>
            <given-names>RA</given-names>
          </name>
          <name name-style="western">
            <surname>Whiteford</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Wiebe</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Wiersma</surname>
            <given-names>ST</given-names>
          </name>
          <name name-style="western">
            <surname>Wilkinson</surname>
            <given-names>JD</given-names>
          </name>
          <name name-style="western">
            <surname>Williams</surname>
            <given-names>HC</given-names>
          </name>
          <name name-style="western">
            <surname>Williams</surname>
            <given-names>SR</given-names>
          </name>
          <name name-style="western">
            <surname>Witt</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Wolfe</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Woolf</surname>
            <given-names>AD</given-names>
          </name>
          <name name-style="western">
            <surname>Wulf</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Yeh</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Zaidi</surname>
            <given-names>AK</given-names>
          </name>
          <name name-style="western">
            <surname>Zheng</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Zonies</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Lopez</surname>
            <given-names>AD</given-names>
          </name>
          <name name-style="western">
            <surname>AlMazroa</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Memish</surname>
            <given-names>ZA</given-names>
          </name>
        </person-group>
        <article-title>Disability-adjusted life years (DALYs) for 291 diseases and injuries in 21 regions, 1990-2010: a systematic analysis for the Global Burden of Disease Study 2010</article-title>
        <source>Lancet</source>  
        <year>2012</year>  
        <month>12</month>  
        <day>15</day>  
        <volume>380</volume>  
        <issue>9859</issue>  
        <fpage>2197</fpage>  
        <lpage>223</lpage>  
        <pub-id pub-id-type="doi">10.1016/S0140-6736(12)61689-4</pub-id>
        <pub-id pub-id-type="medline">23245608</pub-id>
        <pub-id pub-id-type="pii">S0140-6736(12)61689-4</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Dörhöfer</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Lammert</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Krane</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Gorski</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Banas</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Wanner</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Krämer</surname>
            <given-names>BK</given-names>
          </name>
          <name name-style="western">
            <surname>Heid</surname>
            <given-names>IM</given-names>
          </name>
          <name name-style="western">
            <surname>Böger</surname>
            <given-names>CA</given-names>
          </name>
        </person-group>
        <article-title>Study design of DIACORE (DIAbetes COhoRtE) - a cohort study of patients with diabetes mellitus type 2</article-title>
        <source>BMC Med Genet</source>  
        <year>2013</year>  
        <volume>14</volume>  
        <fpage>25</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bmcmedgenet.biomedcentral.com/articles/10.1186/1471-2350-14-25"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1471-2350-14-25</pub-id>
        <pub-id pub-id-type="medline">23409726</pub-id>
        <pub-id pub-id-type="pii">1471-2350-14-25</pub-id>
        <pub-id pub-id-type="pmcid">PMC3577512</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
        <source>Centers for Disease Control and Prevention</source>  
        <year>2011</year>  
        <access-date>2016-07-03</access-date>
        <publisher-loc>Atlanta, GA</publisher-loc>
        <publisher-name>US Department of Health and Human Services</publisher-name>
        <comment>National Diabetes Fact Sheet: National estimates and general information on diabetes and prediabetes in the United States, 2011 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.cdc.gov/diabetes/pubs/pdf/ndfs_2011.pdf">https://www.cdc.gov/diabetes/pubs/pdf/ndfs_2011.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6io6Wx73s"/></comment> </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
        <source>Centers for Disease Control and Prevention (CDC)</source>  
        <year>2014</year>  
        <access-date>2016-07-04</access-date>
        <publisher-loc>Atlanta, GA</publisher-loc>
        <publisher-name>US Department of Health and Human Services</publisher-name>
        <comment>National Diabetes Statistics Report: Etimates of Diabetes and Its Burden in the United States, 2014 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.cdc.gov/diabetes/pubs/statsreport14/national-diabetes-report-web.pdf">https://www.cdc.gov/diabetes/pubs/statsreport14/national-diabetes-report-web.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6io7cyhpe"/></comment> </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nathan</surname>
            <given-names>DM</given-names>
          </name>
          <name name-style="western">
            <surname>Cleary</surname>
            <given-names>PA</given-names>
          </name>
          <name name-style="western">
            <surname>Backlund</surname>
            <given-names>JC</given-names>
          </name>
          <name name-style="western">
            <surname>Genuth</surname>
            <given-names>SM</given-names>
          </name>
          <name name-style="western">
            <surname>Lachin</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Orchard</surname>
            <given-names>TJ</given-names>
          </name>
          <name name-style="western">
            <surname>Raskin</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Zinman</surname>
            <given-names>B</given-names>
          </name>
          <collab>Diabetes ControlComplications Trial/Epidemiology of Diabetes InterventionsComplications (DCCT/EDIC) Study Research Group</collab>
        </person-group>
        <article-title>Intensive diabetes treatment and cardiovascular disease in patients with type 1 diabetes</article-title>
        <source>N Engl J Med</source>  
        <year>2005</year>  
        <month>12</month>  
        <day>22</day>  
        <volume>353</volume>  
        <issue>25</issue>  
        <fpage>2643</fpage>  
        <lpage>53</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16371630"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1056/NEJMoa052187</pub-id>
        <pub-id pub-id-type="medline">16371630</pub-id>
        <pub-id pub-id-type="pii">353/25/2643</pub-id>
        <pub-id pub-id-type="pmcid">PMC2637991</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gong</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Gregg</surname>
            <given-names>EW</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>An</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Shuai</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Gerzoff</surname>
            <given-names>RB</given-names>
          </name>
          <name name-style="western">
            <surname>Roglic</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Hu</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Bennett</surname>
            <given-names>PH</given-names>
          </name>
        </person-group>
        <article-title>Long-term effects of a randomised trial of a 6-year lifestyle intervention in impaired glucose tolerance on diabetes-related microvascular complications: the China Da Qing Diabetes Prevention Outcome Study</article-title>
        <source>Diabetologia</source>  
        <year>2011</year>  
        <month>02</month>  
        <volume>54</volume>  
        <issue>2</issue>  
        <fpage>300</fpage>  
        <lpage>7</lpage>  
        <pub-id pub-id-type="doi">10.1007/s00125-010-1948-9</pub-id>
        <pub-id pub-id-type="medline">21046360</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Tchobroutsky</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Relation of diabetic control to development of microvascular complications</article-title>
        <source>Diabetologia</source>  
        <year>1978</year>  
        <month>09</month>  
        <volume>15</volume>  
        <issue>3</issue>  
        <fpage>143</fpage>  
        <lpage>52</lpage>  
        <pub-id pub-id-type="medline">359393</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Engerman</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Bloodworth Jr</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Nelson</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Relationship of microvascular disease in diabetes to metabolic control</article-title>
        <source>Diabetes</source>  
        <year>1977</year>  
        <month>08</month>  
        <volume>26</volume>  
        <issue>8</issue>  
        <fpage>760</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="medline">885298</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wei</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Leibson</surname>
            <given-names>CL</given-names>
          </name>
          <name name-style="western">
            <surname>Ransom</surname>
            <given-names>JE</given-names>
          </name>
          <name name-style="western">
            <surname>Kho</surname>
            <given-names>AN</given-names>
          </name>
          <name name-style="western">
            <surname>Chute</surname>
            <given-names>CG</given-names>
          </name>
        </person-group>
        <article-title>The absence of longitudinal data limits the accuracy of high-throughput clinical phenotyping for identifying type 2 diabetes mellitus subjects</article-title>
        <source>Int J Med Inform</source>  
        <year>2013</year>  
        <month>04</month>  
        <volume>82</volume>  
        <issue>4</issue>  
        <fpage>239</fpage>  
        <lpage>47</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22762862"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2012.05.015</pub-id>
        <pub-id pub-id-type="medline">22762862</pub-id>
        <pub-id pub-id-type="pii">S1386-5056(12)00109-8</pub-id>
        <pub-id pub-id-type="pmcid">PMC3478423</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Khokhar</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Jette</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Metcalfe</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Cunningham</surname>
            <given-names>CT</given-names>
          </name>
          <name name-style="western">
            <surname>Quan</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Kaplan</surname>
            <given-names>GG</given-names>
          </name>
          <name name-style="western">
            <surname>Butalia</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Rabi</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Systematic review of validated case definitions for diabetes in ICD-9-coded and ICD-10-coded data in adult populations</article-title>
        <source>BMJ Open</source>  
        <year>2016</year>  
        <month>08</month>  
        <volume>6</volume>  
        <issue>8</issue>  
        <fpage>e009952</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bmjopen.bmj.com/cgi/pmidlookup?view=long&#38;pmid=27496226"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/bmjopen-2015-009952</pub-id>
        <pub-id pub-id-type="medline">27496226</pub-id>
        <pub-id pub-id-type="pii">bmjopen-2015-009952</pub-id>
        <pub-id pub-id-type="pmcid">PMC4985868</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Vassar</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Holzmann</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>The retrospective chart review: important methodological considerations</article-title>
        <source>J Educ Eval Health Prof</source>  
        <year>2013</year>  
        <volume>10</volume>  
        <fpage>12</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.doi.org/10.3352/jeehp.2013.10.12"/>
        </comment>  
        <pub-id pub-id-type="doi">10.3352/jeehp.2013.10.12</pub-id>
        <pub-id pub-id-type="medline">24324853</pub-id>
        <pub-id pub-id-type="pii">jeehp-10-12</pub-id>
        <pub-id pub-id-type="pmcid">PMC3853868</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Shine</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Sundaram</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Torres</surname>
            <given-names>DM</given-names>
          </name>
          <name name-style="western">
            <surname>Johnstone</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Jaeger</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Sanguliano</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Can computerized cost data substitute for chart review?</article-title>
        <source>J Healthc Qual</source>  
        <year>2002</year>  
        <volume>24</volume>  
        <issue>6</issue>  
        <fpage>26</fpage>  
        <lpage>33</lpage>  
        <pub-id pub-id-type="medline">12432860</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Singh</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Singh</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Ahmed</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Wilson</surname>
            <given-names>GA</given-names>
          </name>
          <name name-style="western">
            <surname>Pickering</surname>
            <given-names>BW</given-names>
          </name>
          <name name-style="western">
            <surname>Herasevich</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Gajic</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Derivation and validation of automated electronic search strategies to extract Charlson comorbidities from electronic medical records</article-title>
        <source>Mayo Clin Proc</source>  
        <year>2012</year>  
        <month>09</month>  
        <volume>87</volume>  
        <issue>9</issue>  
        <fpage>817</fpage>  
        <lpage>24</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22958988"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.mayocp.2012.04.015</pub-id>
        <pub-id pub-id-type="medline">22958988</pub-id>
        <pub-id pub-id-type="pii">S0025-6196(12)00679-9</pub-id>
        <pub-id pub-id-type="pmcid">PMC3538495</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Luo</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Hao</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Shin</surname>
            <given-names>AY</given-names>
          </name>
          <name name-style="western">
            <surname>Jin</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Deng</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Zheng</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Hu</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Fu</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Hao</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Dai</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Culver</surname>
            <given-names>DS</given-names>
          </name>
          <name name-style="western">
            <surname>Alfreds</surname>
            <given-names>ST</given-names>
          </name>
          <name name-style="western">
            <surname>Todd</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Stearns</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Sylvester</surname>
            <given-names>KG</given-names>
          </name>
          <name name-style="western">
            <surname>Widen</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Ling</surname>
            <given-names>XB</given-names>
          </name>
        </person-group>
        <article-title>NLP based congestive heart failure case finding: A prospective analysis on statewide electronic medical records</article-title>
        <source>Int J Med Inform</source>  
        <year>2015</year>  
        <month>12</month>  
        <volume>84</volume>  
        <issue>12</issue>  
        <fpage>1039</fpage>  
        <lpage>47</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2015.06.007</pub-id>
        <pub-id pub-id-type="medline">26254876</pub-id>
        <pub-id pub-id-type="pii">S1386-5056(15)30013-7</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pakhomov</surname>
            <given-names>SV</given-names>
          </name>
          <name name-style="western">
            <surname>Buntrock</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Chute</surname>
            <given-names>CG</given-names>
          </name>
        </person-group>
        <article-title>Prospective recruitment of patients with congestive heart failure using an ad-hoc binary classifier</article-title>
        <source>J Biomed Inform</source>  
        <year>2005</year>  
        <month>04</month>  
        <volume>38</volume>  
        <issue>2</issue>  
        <fpage>145</fpage>  
        <lpage>53</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1532-0464(04)00167-4"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2004.11.016</pub-id>
        <pub-id pub-id-type="medline">15797003</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(04)00167-4</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Carrell</surname>
            <given-names>DS</given-names>
          </name>
          <name name-style="western">
            <surname>Halgrim</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Tran</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Buist</surname>
            <given-names>DS</given-names>
          </name>
          <name name-style="western">
            <surname>Chubak</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Chapman</surname>
            <given-names>WW</given-names>
          </name>
          <name name-style="western">
            <surname>Savova</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Using natural language processing to improve efficiency of manual chart abstraction in research: the case of breast cancer recurrence</article-title>
        <source>Am J Epidemiol</source>  
        <year>2014</year>  
        <month>03</month>  
        <day>15</day>  
        <volume>179</volume>  
        <issue>6</issue>  
        <fpage>749</fpage>  
        <lpage>58</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://aje.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=24488511"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/aje/kwt441</pub-id>
        <pub-id pub-id-type="medline">24488511</pub-id>
        <pub-id pub-id-type="pii">kwt441</pub-id>
        <pub-id pub-id-type="pmcid">PMC3939853</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Krumholz</surname>
            <given-names>HM</given-names>
          </name>
        </person-group>
        <article-title>Big data and new knowledge in medicine: the thinking, training, and tools needed for a learning health system</article-title>
        <source>Health Aff (Millwood)</source>  
        <year>2014</year>  
        <month>07</month>  
        <volume>33</volume>  
        <issue>7</issue>  
        <fpage>1163</fpage>  
        <lpage>70</lpage>  
        <pub-id pub-id-type="doi">10.1377/hlthaff.2014.0053</pub-id>
        <pub-id pub-id-type="medline">25006142</pub-id>
        <pub-id pub-id-type="pii">33/7/1163</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jacob</surname>
            <given-names>JA</given-names>
          </name>
        </person-group>
        <article-title>On the Road to Interoperability, Public and Private Organizations Work to Connect Health Care Data</article-title>
        <source>JAMA</source>  
        <year>2015</year>  
        <month>09</month>  
        <volume>314</volume>  
        <issue>12</issue>  
        <fpage>1213</fpage>  
        <lpage>5</lpage>  
        <pub-id pub-id-type="doi">10.1001/jama.2015.5930</pub-id>
        <pub-id pub-id-type="medline">26393833</pub-id>
        <pub-id pub-id-type="pii">2442932</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ng</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Ghoting</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Steinhubl</surname>
            <given-names>SR</given-names>
          </name>
          <name name-style="western">
            <surname>Stewart</surname>
            <given-names>WF</given-names>
          </name>
          <name name-style="western">
            <surname>Malin</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Sun</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>PARAMO: a PARAllel predictive MOdeling platform for healthcare analytic research using electronic health records</article-title>
        <source>J Biomed Inform</source>  
        <year>2014</year>  
        <month>04</month>  
        <volume>48</volume>  
        <fpage>160</fpage>  
        <lpage>70</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1532-0464(13)00203-7"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2013.12.012</pub-id>
        <pub-id pub-id-type="medline">24370496</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(13)00203-7</pub-id>
        <pub-id pub-id-type="pmcid">PMC4075460</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Forrest</surname>
            <given-names>CB</given-names>
          </name>
          <name name-style="western">
            <surname>Margolis</surname>
            <given-names>PA</given-names>
          </name>
          <name name-style="western">
            <surname>Bailey</surname>
            <given-names>LC</given-names>
          </name>
          <name name-style="western">
            <surname>Marsolo</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Del Beccaro</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Finkelstein</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Milov</surname>
            <given-names>DE</given-names>
          </name>
          <name name-style="western">
            <surname>Vieland</surname>
            <given-names>VJ</given-names>
          </name>
          <name name-style="western">
            <surname>Wolf</surname>
            <given-names>BA</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>FB</given-names>
          </name>
          <name name-style="western">
            <surname>Kahn</surname>
            <given-names>MG</given-names>
          </name>
        </person-group>
        <article-title>PEDSnet: a National Pediatric Learning Health System</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2014</year>  
        <volume>21</volume>  
        <issue>4</issue>  
        <fpage>602</fpage>  
        <lpage>6</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=24821737"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/amiajnl-2014-002743</pub-id>
        <pub-id pub-id-type="medline">24821737</pub-id>
        <pub-id pub-id-type="pii">amiajnl-2014-002743</pub-id>
        <pub-id pub-id-type="pmcid">PMC4078288</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sittig</surname>
            <given-names>DF</given-names>
          </name>
          <name name-style="western">
            <surname>Wright</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>What makes an EHR “open” or interoperable?</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2015</year>  
        <month>09</month>  
        <volume>22</volume>  
        <issue>5</issue>  
        <fpage>1099</fpage>  
        <lpage>101</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=26078411"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1093/jamia/ocv060</pub-id>
        <pub-id pub-id-type="medline">26078411</pub-id>
        <pub-id pub-id-type="pii">ocv060</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
        <source>Hinfonet</source>  
        <access-date>2016-09-30</access-date>
        <comment>HealthInfoNet 2016 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://hinfonet.org/">http://hinfonet.org/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6kvKLP6bc"/></comment> </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hao</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Jin</surname>
            <given-names>BO</given-names>
          </name>
          <name name-style="western">
            <surname>Shin</surname>
            <given-names>AY</given-names>
          </name>
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Hu</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Fu</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Ji</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Dai</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Culver</surname>
            <given-names>DS</given-names>
          </name>
          <name name-style="western">
            <surname>Alfreds</surname>
            <given-names>ST</given-names>
          </name>
          <name name-style="western">
            <surname>Rogow</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Stearns</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Sylvester</surname>
            <given-names>KG</given-names>
          </name>
          <name name-style="western">
            <surname>Widen</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Ling</surname>
            <given-names>XB</given-names>
          </name>
        </person-group>
        <article-title>Risk prediction of emergency department revisit 30 days post discharge: a prospective study</article-title>
        <source>PLoS One</source>  
        <year>2014</year>  
        <month>11</month>  
        <volume>9</volume>  
        <issue>11</issue>  
        <fpage>e112944</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0112944"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0112944</pub-id>
        <pub-id pub-id-type="medline">25393305</pub-id>
        <pub-id pub-id-type="pii">PONE-D-14-17606</pub-id>
        <pub-id pub-id-type="pmcid">PMC4231082</pub-id></nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Holt</surname>
            <given-names>TA</given-names>
          </name>
          <name name-style="western">
            <surname>Gunnarsson</surname>
            <given-names>CL</given-names>
          </name>
          <name name-style="western">
            <surname>Cload</surname>
            <given-names>PA</given-names>
          </name>
          <name name-style="western">
            <surname>Ross</surname>
            <given-names>SD</given-names>
          </name>
        </person-group>
        <article-title>Identification of undiagnosed diabetes and quality of diabetes care in the United States: cross-sectional study of 11.5 million primary care electronic records</article-title>
        <source>CMAJ Open</source>  
        <year>2014</year>  
        <month>10</month>  
        <volume>2</volume>  
        <issue>4</issue>  
        <fpage>E248</fpage>  
        <lpage>55</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25485250"/>
        </comment>  
        <pub-id pub-id-type="doi">10.9778/cmajo.20130095</pub-id>
        <pub-id pub-id-type="medline">25485250</pub-id>
        <pub-id pub-id-type="pii">20130095</pub-id>
        <pub-id pub-id-type="pmcid">PMC4251506</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Schulze</surname>
            <given-names>MB</given-names>
          </name>
          <name name-style="western">
            <surname>Hoffmann</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Boeing</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Linseisen</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Rohrmann</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Möhlig</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Pfeiffer</surname>
            <given-names>AF</given-names>
          </name>
          <name name-style="western">
            <surname>Spranger</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Thamer</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Häring</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Fritsche</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Joost</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>An accurate risk score based on anthropometric, dietary, and lifestyle factors to predict the development of type 2 diabetes</article-title>
        <source>Diabetes Care</source>  
        <year>2007</year>  
        <month>03</month>  
        <volume>30</volume>  
        <issue>3</issue>  
        <fpage>510</fpage>  
        <lpage>5</lpage>  
        <pub-id pub-id-type="doi">10.2337/dc06-2089</pub-id>
        <pub-id pub-id-type="medline">17327313</pub-id>
        <pub-id pub-id-type="pii">30/3/510</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Pan</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Jin</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>A Chinese diabetes risk score for screening of undiagnosed diabetes and abnormal glucose tolerance</article-title>
        <source>Diabetes Technol Ther</source>  
        <year>2011</year>  
        <month>05</month>  
        <volume>13</volume>  
        <issue>5</issue>  
        <fpage>501</fpage>  
        <lpage>7</lpage>  
        <pub-id pub-id-type="doi">10.1089/dia.2010.0106</pub-id>
        <pub-id pub-id-type="medline">21406016</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Collins</surname>
            <given-names>GS</given-names>
          </name>
          <name name-style="western">
            <surname>Mallett</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Omar</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>LM</given-names>
          </name>
        </person-group>
        <article-title>Developing risk prediction models for type 2 diabetes: a systematic review of methodology and reporting</article-title>
        <source>BMC Med</source>  
        <year>2011</year>  
        <month>9</month>  
        <volume>9</volume>  
        <fpage>103</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bmcmedicine.biomedcentral.com/articles/10.1186/1741-7015-9-103"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1741-7015-9-103</pub-id>
        <pub-id pub-id-type="medline">21902820</pub-id>
        <pub-id pub-id-type="pii">1741-7015-9-103</pub-id>
        <pub-id pub-id-type="pmcid">PMC3180398</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Balkau</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Lange</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Fezeu</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Tichet</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>de Lauzon-Guillain</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Czernichow</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Fumeron</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Froguel</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Vaxillaire</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Cauchi</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Ducimetière</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Eschwège</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Predicting diabetes: clinical, biological, and genetic approaches: data from the Epidemiological Study on the Insulin Resistance Syndrome (DESIR)</article-title>
        <source>Diabetes Care</source>  
        <year>2008</year>  
        <month>10</month>  
        <volume>31</volume>  
        <issue>10</issue>  
        <fpage>2056</fpage>  
        <lpage>61</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18689695"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2337/dc08-0368</pub-id>
        <pub-id pub-id-type="medline">18689695</pub-id>
        <pub-id pub-id-type="pii">dc08-0368</pub-id>
        <pub-id pub-id-type="pmcid">PMC2551654</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Aekplakorn</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Bunnag</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Woodward</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Sritara</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Cheepudomwit</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Yamwong</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Yipintsoi</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Rajatanavin</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>A risk score for predicting incident diabetes in the Thai population</article-title>
        <source>Diabetes Care</source>  
        <year>2006</year>  
        <month>08</month>  
        <volume>29</volume>  
        <issue>8</issue>  
        <fpage>1872</fpage>  
        <lpage>7</lpage>  
        <pub-id pub-id-type="doi">10.2337/dc05-2141</pub-id>
        <pub-id pub-id-type="medline">16873795</pub-id>
        <pub-id pub-id-type="pii">29/8/1872</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>TY</given-names>
          </name>
          <name name-style="western">
            <surname>Hardiker</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Coenen</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Inter-terminology mapping of nursing problems</article-title>
        <source>J Biomed Inform</source>  
        <year>2014</year>  
        <month>06</month>  
        <volume>49</volume>  
        <fpage>213</fpage>  
        <lpage>20</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1532-0464(14)00058-6"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2014.03.001</pub-id>
        <pub-id pub-id-type="medline">24632297</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(14)00058-6</pub-id></nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nadkarni</surname>
            <given-names>PM</given-names>
          </name>
          <name name-style="western">
            <surname>Darer</surname>
            <given-names>JA</given-names>
          </name>
        </person-group>
        <article-title>Migrating existing clinical content from ICD-9 to SNOMED</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2010</year>  
        <volume>17</volume>  
        <issue>5</issue>  
        <fpage>602</fpage>  
        <lpage>7</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=20819871"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/jamia.2009.001057</pub-id>
        <pub-id pub-id-type="medline">20819871</pub-id>
        <pub-id pub-id-type="pii">17/5/602</pub-id>
        <pub-id pub-id-type="pmcid">PMC2995664</pub-id></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lipscomb</surname>
            <given-names>CE</given-names>
          </name>
        </person-group>
        <article-title>Medical Subject Headings (MeSH)</article-title>
        <source>Bull Med Libr Assoc</source>  
        <year>2000</year>  
        <month>07</month>  
        <volume>88</volume>  
        <issue>3</issue>  
        <fpage>265</fpage>  
        <lpage>6</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/10928714"/>
        </comment>  
        <pub-id pub-id-type="medline">10928714</pub-id>
        <pub-id pub-id-type="pmcid">PMC35238</pub-id></nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <collab>R Development Core Team</collab>
        </person-group>
        <source>R: A language and environment for statistical computing</source>  
        <year>2015</year>  
        <publisher-loc>Vienna, Austria</publisher-loc>
        <publisher-name>the R Foundation for Statistical Computing</publisher-name></nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <collab>WHO Expert Consultation</collab>
        </person-group>
        <article-title>Appropriate body-mass index for Asian populations and its implications for policy and intervention strategies</article-title>
        <source>Lancet</source>  
        <year>2004</year>  
        <month>01</month>  
        <day>10</day>  
        <volume>363</volume>  
        <issue>9403</issue>  
        <fpage>157</fpage>  
        <lpage>63</lpage>  
        <pub-id pub-id-type="doi">10.1016/S0140-6736(03)15268-3</pub-id>
        <pub-id pub-id-type="medline">14726171</pub-id>
        <pub-id pub-id-type="pii">S0140-6736(03)15268-3</pub-id></nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chapman</surname>
            <given-names>WW</given-names>
          </name>
          <name name-style="western">
            <surname>Hillert</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Velupillai</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kvist</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Skeppstedt</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Chapman</surname>
            <given-names>BE</given-names>
          </name>
          <name name-style="western">
            <surname>Conway</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Tharp</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Mowery</surname>
            <given-names>DL</given-names>
          </name>
          <name name-style="western">
            <surname>Deleger</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Extending the NegEx lexicon for multiple languages</article-title>
        <source>Stud Health Technol Inform</source>  
        <year>2013</year>  
        <volume>192</volume>  
        <fpage>677</fpage>  
        <lpage>81</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23920642"/>
        </comment>  
        <pub-id pub-id-type="medline">23920642</pub-id>
        <pub-id pub-id-type="pmcid">PMC3923890</pub-id></nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
        <source>English-for-students</source>  
        <access-date>2016-07-05</access-date>
        <comment>Family Vocabulary Word List 2015 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.english-for-students.com/Family-Vocabulary.html">http://www.english-for-students.com/Family-Vocabulary.html</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6io7Hc6c3"/></comment> </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Doan</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Maehara</surname>
            <given-names>CK</given-names>
          </name>
          <name name-style="western">
            <surname>Chaparro</surname>
            <given-names>JD</given-names>
          </name>
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Graham</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Berry</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Hsu</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Kanegaye</surname>
            <given-names>JT</given-names>
          </name>
          <name name-style="western">
            <surname>Lloyd</surname>
            <given-names>DD</given-names>
          </name>
          <name name-style="western">
            <surname>Ohno-Machado</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Burns</surname>
            <given-names>JC</given-names>
          </name>
          <name name-style="western">
            <surname>Tremoulet</surname>
            <given-names>AH</given-names>
          </name>
          <collab>Pediatric Emergency Medicine Kawasaki Disease Research Group</collab>
        </person-group>
        <article-title>Building a Natural Language Processing Tool to Identify Patients With High Clinical Suspicion for Kawasaki Disease from Emergency Department Notes</article-title>
        <source>Acad Emerg Med</source>  
        <year>2016</year>  
        <month>05</month>  
        <volume>23</volume>  
        <issue>5</issue>  
        <fpage>628</fpage>  
        <lpage>36</lpage>  
        <pub-id pub-id-type="doi">10.1111/acem.12925</pub-id>
        <pub-id pub-id-type="medline">26826020</pub-id>
        <pub-id pub-id-type="pmcid">PMC5031359</pub-id></nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Breiman</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Random forests</article-title>
        <source>Machine Learning</source>  
        <year>2001</year>  
        <volume>45</volume>  
        <issue>1</issue>  
        <fpage>5</fpage>  
        <lpage>32</lpage>  
        <pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id></nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Love</surname>
            <given-names>TJ</given-names>
          </name>
          <name name-style="western">
            <surname>Cai</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Karlson</surname>
            <given-names>EW</given-names>
          </name>
        </person-group>
        <article-title>Validation of psoriatic arthritis diagnoses in electronic medical records using natural language processing</article-title>
        <source>Semin Arthritis Rheum</source>  
        <year>2011</year>  
        <month>04</month>  
        <volume>40</volume>  
        <issue>5</issue>  
        <fpage>413</fpage>  
        <lpage>20</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20701955"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.semarthrit.2010.05.002</pub-id>
        <pub-id pub-id-type="medline">20701955</pub-id>
        <pub-id pub-id-type="pii">S0049-0172(10)00075-2</pub-id>
        <pub-id pub-id-type="pmcid">PMC3691811</pub-id></nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="web">
        <source>Stat.berkeley</source>  
        <access-date>2016-10-01</access-date>
        <comment>Random Forests 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.stat.berkeley.edu/~breiman/RandomForests/cc_home.htm">http://www.stat.berkeley.edu/~breiman/RandomForests/cc_home.htm</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6kvL2QzSq"/></comment> </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nayak</surname>
            <given-names>BS</given-names>
          </name>
          <name name-style="western">
            <surname>Sobrian</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Latiff</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Pope</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Rampersad</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Lourenço</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Samuel</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <article-title>The association of age, gender, ethnicity, family history, obesity and hypertension with type 2 diabetes mellitus in Trinidad</article-title>
        <source>Diabetes Metab Syndr</source>  
        <year>2014</year>  
        <volume>8</volume>  
        <issue>2</issue>  
        <fpage>91</fpage>  
        <lpage>5</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.dsx.2014.04.018</pub-id>
        <pub-id pub-id-type="medline">24907173</pub-id>
        <pub-id pub-id-type="pii">S1871-4021(14)00030-7</pub-id></nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ding</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Chong</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Jalaludin</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Comino</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Bauman</surname>
            <given-names>AE</given-names>
          </name>
        </person-group>
        <article-title>Risk factors of incident type 2-diabetes mellitus over a 3-year follow-up: Results from a large Australian sample</article-title>
        <source>Diabetes Res Clin Pract</source>  
        <year>2015</year>  
        <month>05</month>  
        <volume>108</volume>  
        <issue>2</issue>  
        <fpage>306</fpage>  
        <lpage>15</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.diabres.2015.02.002</pub-id>
        <pub-id pub-id-type="medline">25737033</pub-id>
        <pub-id pub-id-type="pii">S0168-8227(15)00099-6</pub-id></nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wiens</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Guttag</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Horvitz</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>A study in transfer learning: leveraging data from multiple hospitals to enhance hospital-specific predictions</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2014</year>  
        <volume>21</volume>  
        <issue>4</issue>  
        <fpage>699</fpage>  
        <lpage>706</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=24481703"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/amiajnl-2013-002162</pub-id>
        <pub-id pub-id-type="medline">24481703</pub-id>
        <pub-id pub-id-type="pii">amiajnl-2013-002162</pub-id>
        <pub-id pub-id-type="pmcid">PMC4078276</pub-id></nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jerant</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Franks</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Body mass index, diabetes, hypertension, and short-term mortality: a population-based observational study, 2000-2006</article-title>
        <source>J Am Board Fam Med</source>  
        <year>2012</year>  
        <volume>25</volume>  
        <issue>4</issue>  
        <fpage>422</fpage>  
        <lpage>31</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jabfm.org/cgi/pmidlookup?view=long&#38;pmid=22773710"/>
        </comment>  
        <pub-id pub-id-type="doi">10.3122/jabfm.2012.04.110289</pub-id>
        <pub-id pub-id-type="medline">22773710</pub-id>
        <pub-id pub-id-type="pii">25/4/422</pub-id></nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Condliffe</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Link</surname>
            <given-names>CR</given-names>
          </name>
          <name name-style="western">
            <surname>Parasuraman</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Pollack</surname>
            <given-names>MF</given-names>
          </name>
        </person-group>
        <article-title>The effects of hypertension and obesity on total health-care expenditures of diabetes patients in the United States</article-title>
        <source>Applied Economics Letters</source>  
        <year>2013</year>  
        <month>05</month>  
        <volume>20</volume>  
        <issue>7</issue>  
        <fpage>649</fpage>  
        <lpage>652</lpage>  
        <pub-id pub-id-type="doi">10.1080/13504851.2012.727966</pub-id></nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Araneta</surname>
            <given-names>MR</given-names>
          </name>
          <name name-style="western">
            <surname>Kanaya</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Hsu</surname>
            <given-names>WC</given-names>
          </name>
          <name name-style="western">
            <surname>Chang</surname>
            <given-names>HK</given-names>
          </name>
          <name name-style="western">
            <surname>Grandinetti</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Boyko</surname>
            <given-names>EJ</given-names>
          </name>
          <name name-style="western">
            <surname>Hayashi</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Kahn</surname>
            <given-names>SE</given-names>
          </name>
          <name name-style="western">
            <surname>Leonetti</surname>
            <given-names>DL</given-names>
          </name>
          <name name-style="western">
            <surname>McNeely</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Onishi</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Sato</surname>
            <given-names>KK</given-names>
          </name>
          <name name-style="western">
            <surname>Fujimoto</surname>
            <given-names>WY</given-names>
          </name>
        </person-group>
        <article-title>Optimum BMI cut points to screen asian americans for type 2 diabetes</article-title>
        <source>Diabetes Care</source>  
        <year>2015</year>  
        <month>05</month>  
        <volume>38</volume>  
        <issue>5</issue>  
        <fpage>814</fpage>  
        <lpage>20</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25665815"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2337/dc14-2071</pub-id>
        <pub-id pub-id-type="medline">25665815</pub-id>
        <pub-id pub-id-type="pii">dc14-2071</pub-id>
        <pub-id pub-id-type="pmcid">PMC4407753</pub-id></nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <collab>American Diabetes Association</collab>
        </person-group>
        <article-title>Classification and diagnosis of diabetes. Sec. 2. In Standards of Medical Care in Diabetes-2016</article-title>
        <source>Diabetes Care</source>  
        <year>2016</year>  
        <month>01</month>  
        <volume>39</volume>  
        <issue>Suppl 1</issue>  
        <fpage>S13</fpage>  
        <lpage>22</lpage>  
        <pub-id pub-id-type="doi">10.2337/dc16-S005</pub-id>
        <pub-id pub-id-type="medline">26696675</pub-id>
        <pub-id pub-id-type="pii">39/Supplement_1/S13</pub-id></nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Schellenberg</surname>
            <given-names>ES</given-names>
          </name>
          <name name-style="western">
            <surname>Dryden</surname>
            <given-names>DM</given-names>
          </name>
          <name name-style="western">
            <surname>Vandermeer</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Ha</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Korownyk</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Lifestyle interventions for patients with and at risk for type 2 diabetes: a systematic review and meta-analysis</article-title>
        <source>Ann Intern Med</source>  
        <year>2013</year>  
        <month>10</month>  
        <day>15</day>  
        <volume>159</volume>  
        <issue>8</issue>  
        <fpage>543</fpage>  
        <lpage>51</lpage>  
        <pub-id pub-id-type="doi">10.7326/0003-4819-159-8-201310150-00007</pub-id>
        <pub-id pub-id-type="medline">24126648</pub-id>
        <pub-id pub-id-type="pii">1748845</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
