<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i10e17376</article-id>
      <article-id pub-id-type="pmid">33021486</article-id>
      <article-id pub-id-type="doi">10.2196/17376</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Implementation of a Cohort Retrieval System for Clinical Data Repositories Using the Observational Medical Outcomes Partnership Common Data Model: Proof-of-Concept System Validation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Goodwin</surname>
            <given-names>Travis</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Lalor</surname>
            <given-names>John</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Meystre</surname>
            <given-names>Stephane</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Sijia</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9763-1164</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Yanshan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4433-7839</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Wen</surname>
            <given-names>Andrew</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9090-8028</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Liwei</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9970-8604</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Hong</surname>
            <given-names>Na</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6798-1761</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Shen</surname>
            <given-names>Feichen</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7803-2331</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Bedrick</surname>
            <given-names>Steven</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0163-9397</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Hersh</surname>
            <given-names>William</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4114-5148</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Hongfang</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Health Sciences Research</institution>
            <institution>Mayo Clinic</institution>
            <addr-line>200 First Street SW</addr-line>
            <addr-line>Rochester, MN, 55901</addr-line>
            <country>United States</country>
            <phone>1 507 293 0057</phone>
            <email>liu.hongfang@mayo.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2570-3741</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Health Sciences Research</institution>
        <institution>Mayo Clinic</institution>
        <addr-line>Rochester, MN</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Computer Science and Electrical Engineering</institution>
        <institution>Oregon Health &#38; Science University</institution>
        <addr-line>Portland, OR</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Medical Informatics and Clinical Epidemiology</institution>
        <institution>Oregon Health &#38; Science University</institution>
        <addr-line>Portland, OR</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Hongfang Liu <email>liu.hongfang@mayo.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>10</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>6</day>
        <month>10</month>
        <year>2020</year>
      </pub-date>
      <volume>8</volume>
      <issue>10</issue>
      <elocation-id>e17376</elocation-id>
      <history>
        <date date-type="received">
          <day>10</day>
          <month>12</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>29</day>
          <month>2</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>4</day>
          <month>6</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>28</day>
          <month>7</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Sijia Liu, Yanshan Wang, Andrew Wen, Liwei Wang, Na Hong, Feichen Shen, Steven Bedrick, William Hersh, Hongfang Liu. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 06.10.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://medinform.jmir.org/2020/10/e17376/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Widespread adoption of electronic health records has enabled the secondary use of electronic health record data for clinical research and health care delivery. Natural language processing techniques have shown promise in their capability to extract the information embedded in unstructured clinical data, and information retrieval techniques provide flexible and scalable solutions that can augment natural language processing systems for retrieving and ranking relevant records.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>In this paper, we present the implementation of a cohort retrieval system that can execute textual cohort selection queries on both structured data and unstructured text—Cohort Retrieval Enhanced by Analysis of Text from Electronic Health Records (CREATE).</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>CREATE is a proof-of-concept system that leverages a combination of structured queries and information retrieval techniques on natural language processing results to improve cohort retrieval performance using the Observational Medical Outcomes Partnership Common Data Model to enhance model portability. The natural language processing component was used to extract common data model concepts from textual queries. We designed a hierarchical index to support the common data model concept search utilizing information retrieval techniques and frameworks.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our case study on 5 cohort identification queries, evaluated using the precision at 5 information retrieval metric at both the patient-level and document-level, demonstrates that CREATE achieves a mean precision at 5 of 0.90, which outperforms systems using only structured data or only unstructured text with mean precision at 5 values of 0.54 and 0.74, respectively.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The implementation and evaluation of Mayo Clinic Biobank data demonstrated that CREATE outperforms cohort retrieval systems that only use one of either structured data or unstructured text in complex textual cohort queries.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>cohort retrieval</kwd>
        <kwd>information retrieval</kwd>
        <kwd>common data model</kwd>
        <kwd>electronic health records</kwd>
        <kwd>natural language processing</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The widespread adoption of electronic health records has enabled the use of clinical data for clinical research and health care delivery [<xref ref-type="bibr" rid="ref1">1</xref>]. Many institutions have established clinical data repositories in conjunction with cohort retrieval tools (eg, Informatics for Integrating Biology &#38; the Bedside) to support the use of clinical data for research including retrospective studies as well as feasibility assessment or patient recruitment for clinical trials. However, electronic health record–based clinical research has been hampered by poor research reproducibility caused by the heterogeneity and complexity of both health care institutions and electronic health record systems.</p>
      <p>For structured electronic health record data, to ensure a standardized and logically unified representation of electronic health record data across multiple institutions (and across multiple sites), many large-scale clinical research networks such as Accrual to Clinical Trials [<xref ref-type="bibr" rid="ref2">2</xref>], Electronic Medical Records and Genomics [<xref ref-type="bibr" rid="ref3">3</xref>], and National Patient-Centered Clinical Research [<xref ref-type="bibr" rid="ref4">4</xref>] have adopted common data models aimed at producing comparable and reproducible results with the same research methods [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Our prior investigation [<xref ref-type="bibr" rid="ref7">7</xref>] demonstrated the generalizability of one of the common data models, the Observational Medical Outcomes Partnership (OMOP) Common Data Model, in achieving structural and semantic consistency of electronic health record data in multi-institutional research with the Observational Health Data Sciences and Informatics (OHDSI) program [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      <p>In electronic health records, a significant portion of relevant patient information is embedded as unstructured text, and natural language processing techniques such as information extraction are critical when using these data for clinical research [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. Many clinical natural language processing systems have been developed to extract information from text for various downstream applications [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>] but have challenges in performance and portability [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. Information retrieval, a technique used in search engines for storing, retrieving, and ranking documents from a large collection of text documents based on users’ queries, can provide an alternative approach to leverage clinical narratives for cohort retrieval as it is less semantic-dependent and can involve end users in the loop [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. The combination of natural language processing and information retrieval is a promising solution for cohort retrieval from unstructured clinical text, and there are several review articles [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref20">20</xref>] about information retrieval or natural language processing techniques for case detection.</p>
      <p>However, most of the current clinical data repository implementations do not support searches on both structured and unstructured text, seamlessly. An efficient and comprehensive patient-level search engine on both structured and unstructured data from electronic health record is, therefore, still highly demanded by health care practitioners and researchers. In this paper, we describe a proof-of-concept implementation of a cohort retrieval system—Cohort Retrieval Enhanced by Analysis of Text from Electronic Health Records (CREATE)—in which the same query to search both structured (electronic health record represented using the OMOP Common Data Model) and unstructured text (leveraging a concept extraction system) are used. Cohort retrieval in CREATE is conducted in 2 phases: the first phase filters patients using structured data, and the second phase retrieves and ranks results at either a document or a patient level. The functionality of the system was tested using a previously assembled query collection [<xref ref-type="bibr" rid="ref21">21</xref>] on a corpus composed of the electronic health record data from the Mayo Clinic Biobank cohort [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
      <p>There are generally 2 approaches to search unstructured text for purposes such as patient care, clinical research, and traceability of medical care [<xref ref-type="bibr" rid="ref23">23</xref>]. The first approach is based on a text search. For example, the Electronic Medical Record Search Engine (EMERSE) from the University of Michigan [<xref ref-type="bibr" rid="ref24">24</xref>] is a full-text search engine with the goal of facilitating the retrieval of information for clinicians, administrators, and clinical or translational researchers based on clinical narratives. However, EMERSE does not support queries using structured electronic health record data such as demographic information, lab tests, and medications. Dr. Warehouse, proposed by Garcelon et al [<xref ref-type="bibr" rid="ref25">25</xref>], is a free-text search engine using Oracle Text to index its documents. The system is based on relational databases and relies on ranking after retrieval, which may limit its capability to deploy state-of-the-art information retrieval methods such as best match 25 or Markov random fields. The other approach to searching unstructured text is to extract concepts using natural language processing systems. For example, SemEHR [<xref ref-type="bibr" rid="ref26">26</xref>] is a semantic search engine based on a Fast Healthcare Interoperability Resources [<xref ref-type="bibr" rid="ref27">27</xref>] representation of clinical semantic concepts extracted from a clinical natural language processing system named Bio-YODIE. The system showed a high performance in retrieving patients given queries of single concepts, such as Hepatitis C and HIV, in local electronic health record and lab test results when evaluated with the MIMIC-III (Medical Information Mart for Intensive Care) data set [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
      <p>National NLP Clinical Challenges 2018 (Shared-Task Track 1) [<xref ref-type="bibr" rid="ref28">28</xref>] also contributed to standardized evaluations of cohort retrieval systems from electronic health records. The evaluation data set includes clinical narrative texts of 288 patients for concept extraction, temporal reasoning, and inferencing. The official evaluation indicated that the top systems used rule-based and hybrid systems for the problems and led the directions of future system development for similar tasks. The 2018 corpus consists of semistructured and narrative text. The structured data are provided via sections of semistructured text rather than in structured formats. Therefore, cohort retrieval systems for the 2018 corpus require additional components to handle the semistructured metadata, which may not be applicable to systems for real-world electronic health record data.</p>
      <p>Several studies [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref31">31</xref>] have addressed the challenge of how to represent textual cohort criteria or queries via syntactic parsing or sequence labeling. The main focuses of proposed methods were to provide the functions of automatic parsing and modeling of textual queries of end-to-end retrieval systems. To further extend querying to support the customization of parsed results by end users, our cohort retrieval system has the following design principles: (1) the adoption of common data models to facilitate cohort retrieval using both structured and unstructured data for multi-institutional research, (2) the flexibility and ability to apply state-of-the-art information retrieval methods in the retrieval system, (3) the incorporation of relevance judgment for downstream machine learning–based cohort selection methods, and (4) the generation of semantic annotations during the indexing phrase to provide a real-time semantic search experience.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview of System Architecture</title>
        <p>An overview of our cohort retrieval system for clinical data repositories is shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>. Specifically, a textual query is expanded and divided, either automatically or manually, into structured and unstructured data fields according to specific clinical data repository implementations. The query fulfillment for structured data and unstructured text data are managed differently: structured electronic health record data can be retrieved from the corresponding clinical data repositories using Structured Query Language (SQL) on a relational database management system, and the unstructured electronic health record data can be preprocessed by natural language processing and retrieved by leveraging information retrieval techniques. Retrieved results can then be combined and aggregated for clinical research applications, such as clinical trial feasibility assessment or cohort identification. For cohort identification, the retrieved and screened cohort can be treated as a weakly labeled data set. Human relevance judgment is a potential subsequent step to manually validate the results through chart review.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overview of CREATE’s workflow. CDR: clinical data repository; CM: clinical modification; CPT: current procedures terminology; EHR: electronic health record; ICD: International Classification of Diseases; NLP: natural language processing; OHDSI: Observational Health Data Sciences and Informatics; RDBMS: relational database management system.</p>
          </caption>
          <graphic xlink:href="medinform_v8i10e17376_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Adopting OMOP Common Data Model for Patient Retrieval</title>
        <p>To improve the interoperability and portability of our system (use with disparate data sources), we adopted the OMOP Common Data Model (version 5.3.1) [<xref ref-type="bibr" rid="ref32">32</xref>] to index electronic health record data. The hierarchical index structure of clinical data repositories using OMOP Common Data Model for cohort retrieval is shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>. The indexed tables include data from both unstructured and structured sources, consisting of extracted OMOP Common Data Model artifacts from unstructured clinical notes and encounter information, demographic information (represented as a common data model person), and diagnoses, procedures, and lab tests from structured data. The distinction between structured and unstructured data varies between different electronic health record systems. The specifics of implementation in adopters may, therefore, differ from those implemented in this study.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Hierarchical index structure using the OMOP Common Data Model. NLP: natural language processing.</p>
          </caption>
          <graphic xlink:href="medinform_v8i10e17376_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Structured data such as procedures, diagnoses, lab tests, and demographics are directly queried from relational databases and loaded into the index through an extract-transform-load process. We map structured data to Unified Medical Language System (UMLS) concept unique identifiers either through the usage of mapping definitions already in the UMLS Metathesaurus [<xref ref-type="bibr" rid="ref33">33</xref>] (eg, ICD-9-CM or ICD-10-CM, Current Procedural Terminology 4, and SNOMED Clinical Terms) or through the use of natural language processing (eg, local lab test codes). The concepts are subsequently mapped to equivalent OHDSI- or OMOP-compliant vocabulary codes via Athena (version 1.10.0; OHDSI) standardized vocabularies [<xref ref-type="bibr" rid="ref34">34</xref>].</p>
        <p>The clinical texts from Mayo Clinic electronic health records consisted of existing sections that provide brief descriptions of a specific perspective from a patient encounter, such as social history, diagnosis, and chief complaints. We chose to use the document sections to index clinical text for cohort retrieval based on the observation that while retrieval at a sentence level is insufficient for relevance judging relevance in the topic collections that we investigated, document-level retrieval may provide mostly irrelevant information.</p>
        <p>Various common data model concepts were extracted via the dictionary lookup component as entity mentions such as <italic>Drug</italic>, <italic>Procedure</italic>, and <italic>SignSymptom</italic> with their concept identifiers (eg, UMLS concept unique identifiers) by cTAKES (Apache Software Foundation) [<xref ref-type="bibr" rid="ref12">12</xref>] from clinical documents and subsequently indexed into Elasticsearch (Elasticsearch BV). In addition, the entity mention attributes such as <italic>negation</italic>, <italic>certainty</italic>, and <italic>family history</italic> are stored in the field <italic>term_modifiers</italic>.</p>
      </sec>
      <sec>
        <title>Textual Query Formation</title>
        <p>Natural language textual queries are fed into the same concept extraction pipeline used for indexing. Similarly, the normalized concepts and their associated attributes (eg, negation, certainty, experiencer, or status) are extracted from the textual query. Logical concepts such as <italic>must</italic> and <italic>must not</italic> are also used when generating queries from the text for further parsing and interpretation in the query backend. An example of the textual query modeling process is illustrated in <xref rid="figure3" ref-type="fig">Figure 3</xref>. In the query “Adults with inflammatory bowel disease (ulcerative colitis or Crohn's disease), who have not had surgery of the intestines, rectum, or anus entailing excision, ostomy,” the natural language processing component can detect and normalize the raw mentions of “bowel disease,” “ulcerative colitis,” and “Crohn’s disease” into various coding systems including OHDSI IDs, while the demographic information of “adults” and the list of surgeries can be manually added as structured data filters based on the date of birth and Current Procedural Terminology 4 codes.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Textual query modeling example. CUI: concept unique identifier; OHDSI: Observational Health Data Sciences and Informatics; SNOMEDCT: Systematized Nomenclature of Medicine—Clinical Terms; TUI:  (semantic) type unique identifier.</p>
          </caption>
          <graphic xlink:href="medinform_v8i10e17376_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>User Interface</title>
        <p>We developed a web-based user interface for CREATE, the details of which are described in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. All the information extracted is shown to the users by subject for potential insertion, modification, and deletion before query execution. Since the natural language processing component will suggest parsing results and map them into common data model concepts, the users are expected to focus on configuring the logistics between the extracted concepts and removing generic concepts (eg, UMLS concepts of <italic>Drug</italic> or <italic>Treatment</italic>), which do not require searching concepts among standard vocabularies from various sources and are not time consuming.</p>
      </sec>
      <sec>
        <title>Retrieval Methods</title>
        <p>CREATE uses Elasticsearch [<xref ref-type="bibr" rid="ref35">35</xref>] as the search engine of the backend information retrieval component. Since Elasticsearch includes support for hierarchical queries of parent–child relations, the hierarchical index architecture shown in <xref rid="figure2" ref-type="fig">Figure 2</xref> allows for significant flexibility in query strategies. Patients with a certain set of common data model concepts can be retrieved and filtered during the query execution by one of the structured fields (eg, encounter age), one of the unstructured fields (eg, whether the patient has sections containing common data model concepts from unstructured data), or both.</p>
        <p>Given a document <italic>d</italic> and a textual query <italic>q</italic>, the set of common data model concepts extracted from <italic>q</italic> can be represented as <italic>O</italic> = {<italic>o</italic><sub>1</sub>,...,<italic>o</italic><sub>n</sub>} where <italic>o</italic> is a common data model concept. The similarity score between <italic>d</italic> and <italic>o</italic> can then be represented as <italic>s</italic>(<italic>d</italic>,<italic>o</italic>). The total score of each document for each query would then be defined as:</p>
        <graphic xlink:href="medinform_v8i10e17376_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        <p>The first term on the right-hand side of the equation is the mean similarity of all common data model concepts in the query. The second term is the similarity between the document and the full-text query. In extreme use cases, the 2 terms can be weighted to place more emphasis on the contribution of either structured or unstructured data to the query. The patient-level similarity score is the mean of the top 100 document scores. The top rank threshold of 100 was selected based on our experiments on top 10, 20, 50, and 100 from test query results and may be subject to further tuning.</p>
      </sec>
      <sec>
        <title>Functionality Assessment of CREATE</title>
        <p>There are 2 aspects of the system design that require feasibility assessment by real-world implementation for clinical data repository.</p>
        <p>First, the data mapping needs to be created specifically for each clinical data repository architecture. A site-dependent correlation between clinical data repository representation, OMOP Common Data Model tables, and extracted natural language processing concepts has to be established before the data can be indexed into CREATE. Second, retrieved results need to be assessed to validate that the proposed query modeling and retrieval methods can generate meaningful retrieval results.</p>
        <p>The performance was measured using the mean <italic>precision at 5</italic> of 5 queries. As an evaluation of CREATE functionality, we randomly sampled 5 queries from a previously curated query collection [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref36">36</xref>] to evaluate CREATE through manual chart review. The structured query used manually transformed ICD-9-CM or ICD-10-CM codes. There was no ranking of relevance for the retrieved patients from structured electronic health record data, thus we randomly selected 5 patients from the relevant patients to be used as the top 5 in calculating the precision at 5. The top 5 patients from unstructured text queries and CREATE results were retrieved based on best match 25 [<xref ref-type="bibr" rid="ref30">30</xref>]. A medical expert performed complete chart review on the top 5 patients for each retrieval cohort. The patient relevancy was scored into the 3 categories, <italic>definitely relevant</italic>, <italic>partially relevant</italic>, and <italic>not relevant</italic>, by the medical expert. Definitely relevant, partially relevant, and not relevant were assigned scores of 1, 0.5, and 0, respectively, for precision at 5 calculations.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>We implemented CREATE as a feasibility assessment tool for the Mayo Clinic Biobank Rochester cohort, which is a large-scale institutionally funded research resource initiated in 2009 with blood, electronic health record, and patient-provided data on 45,613 Mayo Clinic Rochester patients who had consented to participate. This resource has been used in a wide array of over 250 health-related research and clinical studies [<xref ref-type="bibr" rid="ref22">22</xref>]. In our experiments, we limited inclusion to patients with at least one clinical note in their electronic health record and extracted the corresponding structured data.</p>
      <p>After data extraction, we investigated and compared the electronic health record system implementation at the Mayo Clinic to OMOP Common Data Model tables. During the data exploration stage, we found that the data elements under corresponding tables were generally straightforward to map; therefore, we show the mapping at the granularity of the table level. <xref ref-type="table" rid="table1">Table 1</xref> shows our mapping of several OMOP Common Data Model tables to Mayo Clinic electronic health record tables. The mapping used to transform named entity mention types of the cTAKES-type system to common data model tables is also listed in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Table-level mapping between OMOP Common Data Model and Mayo Clinic electronic health records.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="320"/>
          <col width="160"/>
          <col width="220"/>
          <col width="270"/>
          <thead>
            <tr valign="top">
              <td colspan="2">OMOP<sup>a</sup> Common Data Model and<break/>Mayo Clinic clinical data repository</td>
              <td>Number of records</td>
              <td>Vocabulary</td>
              <td>Natural language processing cTAKES-type system</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="5">
                <bold>Person</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Demographics</td>
              <td>45,613</td>
              <td>—<sup>b</sup></td>
              <td>—</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Condition</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Diagnosis</td>
              <td>9,712,736</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>ICD-9-CM<sup>c</sup></p>
                  </list-item>
                  <list-item>
                    <p>ICD-10-CM<sup>d</sup></p>
                  </list-item>
                </list>
              </td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p>SignSymptom</p>
                  </list-item>
                  <list-item>
                    <p>DiseaseDisorder</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Procedures</td>
              <td>13,014,264</td>
              <td>CPT<sup>e</sup></td>
              <td>Procedure</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Measurement</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Lab</td>
              <td>15,719,203</td>
              <td>Local code system</td>
              <td>Lab</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Vital Signs</td>
              <td>—</td>
              <td>—</td>
              <td>VitalSigns</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Drug_Exposure</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>DrugExposure</td>
              <td>—</td>
              <td>UMLS<sup>f</sup></td>
              <td>Medication</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Note</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Clinical notes</td>
              <td>68,198,499</td>
              <td>—</td>
              <td>—</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup>OMOP: Observational Medical Outcomes Partnership.</p>
          </fn>
          <fn id="table1fn2">
            <p><sup>b</sup>There is no equivalent or no system is used for the equivalent concept.</p>
          </fn>
          <fn id="table1fn3">
            <p><sup>c</sup>ICD-9-CM: International Classification of Diseases, Ninth revision, Clinical Modification.</p>
          </fn>
          <fn id="table1fn4">
            <p><sup>d</sup>ICD-10-CM: International Classification of Diseases, Tenth revision, Clinical Modification.</p>
          </fn>
          <fn id="table1fn5">
            <p><sup>e</sup>CPT: Current Procedural Terminology.</p>
          </fn>
          <fn id="table1fn6">
            <p><sup>f</sup>UMLS: Unified Medical Language System.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p><xref ref-type="table" rid="table2">Table 2</xref> lists the detailed description of the 5 queries and the corresponding keywords used in the manual chart review process for judging patient relevance. The queries were different from the single condition criteria used to evaluate systems in some of the related work with regard to the level of detail, logic, and semantic complexity involved. The complete parsing results of the structured part of the queries and the CREATE query format specification can be found in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>, respectively.</p>
      <p>Precision at 5 results are shown in <xref ref-type="table" rid="table3">Table 3</xref>. The overall comparison shows that CREATE, as a combination of systems using structured and unstructured electronic health record data, outperformed the systems based on using only one of structured or unstructured electronic health record data for full-text queries. For each query, CREATE performs at least as well as the systems using only structured or unstructured electronic health record data.</p>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>The list of tested queries.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="70"/>
          <col width="500"/>
          <col width="430"/>
          <thead>
            <tr valign="top">
              <td>Query</td>
              <td>Description</td>
              <td>Keywords</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>1</td>
              <td>Adults with inflammatory bowel disease (ulcerative colitis or Crohn's disease), who have not had surgery of the intestines, rectum, or anus entailing excision, ostomy</td>
              <td>Ulcerative colitis, Crohn's disease, excision, ostomy, rectal prolapse, anal fistula, stricturoplasty resection</td>
            </tr>
            <tr valign="top">
              <td>2</td>
              <td>Adults 18-100 years old who have a diagnosis of hereditary hemorrhagic telangiectasia (HHT), which is also called Osler-Weber-Rendu syndrome.<break/></td>
              <td>Osler-Weber-Rendu syndrome, hereditary hemorrhagic telangiectasia</td>
            </tr>
            <tr valign="top">
              <td>3</td>
              <td>Children with localization-related (focal) epilepsy with simple or complex partial seizures diagnosed before 4 years old who have had an outpatient neurology visit.</td>
              <td>Epilepsy, partial seizure, neurology</td>
            </tr>
            <tr valign="top">
              <td>4</td>
              <td>Adults 18-70 years old with rheumatoid arthritis currently treated with methotrexate who have never used a biologic disease-modifying antirheumatic drug (DMARD).<break/></td>
              <td>Rheumatoid arthritis biologic methotrexate abatacept, adalimumab, anakinra, certolizumab, etanercept, golimumab, infliximab, rituximab, tocilizumab, tofacitinib</td>
            </tr>
            <tr valign="top">
              <td>5</td>
              <td>Adults who have been treated with an angiotensin-converting-enzyme (ACE) inhibitor and developed an associated cough, consistent with ACE inhibitor–induced cough as an adverse effect of the medication.</td>
              <td>Benazepril, Lotensin, Captopril, Enalapril, Vasotec, Fosinopril, Lisinopril, Prinivil, Zestril, Moexipril, Perindopril, Aceon, Quinapril, Accupril, Ramipril, Altace, Trandolapril, Mavik, cough, angiotensin-converting-enzyme (ACE) inhibitor</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Precision at 5 of sampled queries for electronic health record text.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="160"/>
          <col width="200"/>
          <col width="220"/>
          <col width="420"/>
          <thead>
            <tr valign="bottom">
              <td>Query</td>
              <td>Structured</td>
              <td>Unstructured</td>
              <td>CREATE<sup>a</sup> (unstructured and structured combined)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>1</td>
              <td>0.8</td>
              <td>0.6</td>
              <td>0.8</td>
            </tr>
            <tr valign="top">
              <td>2</td>
              <td>0.7</td>
              <td>1.0</td>
              <td>1.0</td>
            </tr>
            <tr valign="top">
              <td>3</td>
              <td>0.3</td>
              <td>0.5</td>
              <td>0.8</td>
            </tr>
            <tr valign="top">
              <td>4</td>
              <td>0.7</td>
              <td>0.7</td>
              <td>1.0</td>
            </tr>
            <tr valign="top">
              <td>5</td>
              <td>0.2</td>
              <td>0.9</td>
              <td>0.9</td>
            </tr>
            <tr valign="top">
              <td>Mean</td>
              <td>0.54</td>
              <td>0.74</td>
              <td>0.90</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table3fn1">
            <p><sup>a</sup>CREATE: Cohort Retrieval Enhanced by Analysis of Text from Electronic Health Records.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>CREATE is a proof-of-concept for leveraging the combination of structured queries and information retrieval techniques to improve cohort retrieval performance while adopting the OMOP Common Data Model to enhance model portability. The evaluation of the implementation using sample queries supports our hypothesis that using a combination of structured and unstructured electronic health record data outperforms a single-source system in determining the relevance, from an input query, of any given patient electronic health record data for a particular clinical application. CREATE was designed to improve the efficiency of judging patient relevance, by shifting from human-query judgment (pull) to system-feed judgment (push).</p>
        <p>Intuitively, the nature of the queries and how the query-related data are presented in the clinical data repository significantly impact the performance of the data source queried (ie, structured, unstructured, and combined). For instance, one of the major concepts in query 5 is treatment with angiotensin-converting enzyme (ACE) inhibitors. It is effective for information retrieval methods on unstructured text to select patients with ACE inhibitor–related cough, as the keywords <italic>ACE inhibitor</italic> and <italic>cough</italic> usually co-occur in clinical text contexts as adverse drug events. In contrast, it is challenging for structured data queries in this experiment. In our clinical data repository, the medication information is present only as semistructured text generated by computerized provider order entry without normalization into structured data. Therefore, there is no reliable way to obtain the relevant cohort purely on structured data, which leads to very low relevancy of the retrieved cohort. Such a limitation is usually not critical when unstructured text are queried, because most of the clinical data are either presented or summarized in clinical notes.</p>
        <p>However, when querying on a cohort with age or gender criteria, querying solely on unstructured data cannot work effectively. For example, even when the age is mentioned in query 3, all the retrieved patients are adult patients rather than the expected pediatric patients. This is caused by the lack of the extraction the dates and ages from narrative texts, which is not a trivial information extraction task. To build a reliable query system for unstructured texts without providing metadata, such as date of birth or age at encounter, usually requires corpus-dependent engineering efforts to extract the dates and ages from narrative text.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study has multiple limitations that may offer directions for our future work. Our current functionality test is based on 5-query precision at 5 by one annotator, which is not sufficient to cover all cohort retrieval cases and longitudinal patient condition scenarios. Though we acknowledge that a larger number of queries on a fully-annotated patient cohort from annotators and adjudicators would be very helpful in evaluating the performance of the system, it is time consuming to judge complete patient history, especially for negated conditions and treatments (eg, to check if the patient does not have a certain disorder or procedure). With the system in production, the feedback of each study leveraging the system can be then retained and analyzed for more comprehensive statistics of the performance of the system.</p>
        <p>When processing concepts without a global coding system, concept mapping, such as that used in our solution, relies on the output of natural language processing algorithms. Although it is a fast and straightforward solution, current natural language processing tools cannot achieve the same level of accuracy as human assigned codes. Complete mapping from a local vocabulary requires extensive human efforts with data quality assurance [<xref ref-type="bibr" rid="ref37">37</xref>], thus it was not feasible within the scope of this study. A solution for this issue is to utilize value set repositories to manage the concepts. Though a one-to-one mapping may not be found in all semantic spaces, value set repositories can provide a systematic way to manage the concept sets in collections or aggregations [<xref ref-type="bibr" rid="ref38">38</xref>].</p>
        <p>There are also several potential approaches to further improve the information retrieval component in this system's framework. We only used the out-of-box query algorithms to measure the patient similarity and rank the relevancy in this study. More advanced information retrieval methods can be applied to the queries such as case-based reasoning [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref41">41</xref>], pseudo relevance feedback [<xref ref-type="bibr" rid="ref42">42</xref>], and different ranking models [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]. Though the equal weights of common data model concepts and raw text provide information from both sides, the weights can be tuned to meet different retrieval perspectives and demands.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>We developed CREATE, an end-to-end patient-level information retrieval system, with the ability to query both structured and unstructured data by leveraging the OMOP Common Data Model. Implementation and functionality assessment on Mayo Clinic Biobank demonstrated that CREATE outperforms cohort retrieval systems that use only one of either structured or unstructured data in complex textual cohort queries. The source code of the CREATE can be found at <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p>
        <p>In the future, we will refine the evaluation process by adding more query topics and larger cohort of manual chart reviews. An active learning component will be added to the system to enable human-in-the-loop analysis on the system-screened cohort to further improve the efficiency of relevance judgment. In doing so, both machine learning–based or rule-based cohort identification algorithms could be deployed and evaluated in real time. This could potentially then be extended to an active-learning cohort-identification framework [<xref ref-type="bibr" rid="ref45">45</xref>].</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Web-based graphical user interface of CREATE.</p>
        <media xlink:href="medinform_v8i10e17376_app1.docx" xlink:title="DOCX File , 658 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Parsing results of CREATE from textual queries.</p>
        <media xlink:href="medinform_v8i10e17376_app2.docx" xlink:title="DOCX File , 18 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Format specification for CREATE queries.</p>
        <media xlink:href="medinform_v8i10e17376_app3.docx" xlink:title="DOCX File , 16 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Source code of CREATE.</p>
        <media xlink:href="medinform_v8i10e17376_app4.docx" xlink:title="DOCX File , 12 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">CREATE</term>
          <def>
            <p>Cohort Retrieval Enhanced by Analysis of Text from Electronic Health Records</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EMERSE</term>
          <def>
            <p>Electronic Medical Record Search Engine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">ICD-9-CM</term>
          <def>
            <p>International Classification of Diseases, Ninth Revision, Clinical Modification</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ICD-10-CM</term>
          <def>
            <p>International Classification of Diseases, Tenth Revision, Clinical Modification</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">OHDSI</term>
          <def>
            <p>Observational Health Data Sciences and Informatics</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">OMOP</term>
          <def>
            <p>Observational Medical Outcomes Partnership</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">SNOMED</term>
          <def>
            <p>Systematized Nomenclature of Medicine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">UMLS</term>
          <def>
            <p>Unified Medical Language System</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We sincerely thank Donna Ihrke who annotated the query corpus. The work was supported by the National Institutes of Health (grants R01LM011934, R01EB19403, R01LM11829, and U01TR02062). The content of this paper is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Methods and dimensions of electronic health record data quality assessment: enabling reuse for clinical research</article-title>
          <source>Journal of the American Medical Informatics Association</source>
          <year>2013</year>
          <month>01</month>
          <day>01</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>144</fpage>
          <lpage>151</lpage>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000681</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>Accrual to Clinical Trials (ACT) Network</article-title>
          <source>Clinical and Translational Science Institute</source>
          <access-date>2020-08-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ctsi.umn.edu/consultations-and-services/multi-site-study-support/accrual-clinical-trials-act-network">https://www.ctsi.umn.edu/consultations-and-services/multi-site-study-support/accrual-clinical-trials-act-network</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gottesman</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Kuivaniemi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tromp</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Faucett</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Manolio</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Sanderson</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Kannry</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zinberg</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Basford</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Brilliant</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Carey</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chisholm</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Connolly</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Crosslin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Gallego</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Haines</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Hakonarson</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Harley</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jarvik</surname>
              <given-names>GP</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kullo</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Larson</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>McCarty</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ritchie</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Roden</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Böttinger</surname>
              <given-names>EP</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>The Electronic Medical Records and Genomics (eMERGE) Network: past, present, and future</article-title>
          <source>Genet Med</source>
          <year>2013</year>
          <month>6</month>
          <day>6</day>
          <volume>15</volume>
          <issue>10</issue>
          <fpage>761</fpage>
          <lpage>771</lpage>
          <pub-id pub-id-type="doi">10.1038/gim.2013.72</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <source>PCORnet: the National Patient-Centered Clinical Research Network</source>
          <access-date>2020-08-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pcornet.org/clinical-research-network/">https://pcornet.org/clinical-research-network/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meystre</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Lovis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bürkle</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tognola</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Budrionis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lehmann</surname>
              <given-names>CU</given-names>
            </name>
          </person-group>
          <article-title>Clinical Data Reuse or Secondary Use: Current Status and Potential Future Progress</article-title>
          <source>Yearb Med Inform</source>
          <year>2017</year>
          <month>08</month>
          <volume>26</volume>
          <issue>1</issue>
          <fpage>38</fpage>
          <lpage>52</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.15265/IY-2017-007"/>
          </comment>
          <pub-id pub-id-type="doi">10.15265/IY-2017-007</pub-id>
          <pub-id pub-id-type="medline">28480475</pub-id>
          <pub-id pub-id-type="pmcid">PMC6239225</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bycroft</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Freeman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Petkova</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Band</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Elliott</surname>
              <given-names>LT</given-names>
            </name>
            <name name-style="western">
              <surname>Sharp</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Motyer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vukcevic</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Delaneau</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>O’Connell</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cortes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Welsh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Effingham</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McVean</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Leslie</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Donnelly</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Marchini</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The UK Biobank resource with deep phenotyping and genomic data</article-title>
          <source>Nature</source>
          <year>2018</year>
          <month>10</month>
          <day>10</day>
          <volume>562</volume>
          <issue>7726</issue>
          <fpage>203</fpage>
          <lpage>209</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-018-0579-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hersh</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>On Mapping Textual Queries to a Common Data Model</article-title>
          <year>2017</year>
          <conf-name>2017 IEEE International Conference on Healthcare Informatics (ICHI)</conf-name>
          <conf-date>23-26 Aug. 2017</conf-date>
          <conf-loc>Park City, UT, USA</conf-loc>
          <fpage>21</fpage>
          <lpage>25</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1109/ICHI.2017.63"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rastegar-Mojarad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moon</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Afzal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mehrabi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Clinical information extraction applications: A literature review</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2018</year>
          <month>01</month>
          <volume>77</volume>
          <fpage>34</fpage>
          <lpage>49</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2017.11.011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>P-Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>C-W</given-names>
            </name>
            <name name-style="western">
              <surname>Kaddi</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Venugopalan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>MD</given-names>
            </name>
          </person-group>
          <article-title>-Omic and Electronic Health Record Big Data Analytics for Precision Medicine</article-title>
          <source>IEEE Trans Biomed Eng</source>
          <year>2017</year>
          <month>02</month>
          <volume>64</volume>
          <issue>2</issue>
          <fpage>263</fpage>
          <lpage>273</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27740470"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/TBME.2016.2573285</pub-id>
          <pub-id pub-id-type="medline">27740470</pub-id>
          <pub-id pub-id-type="pmcid">PMC5859562</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Murff</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>FitzHenry</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Matheny</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Gentry</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kotter</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Crimin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dittus</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Rosen</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Elkin</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Speroff</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Automated identification of postoperative complications within an electronic medical record using natural language processing</article-title>
          <source>JAMA</source>
          <year>2011</year>
          <month>08</month>
          <day>24</day>
          <volume>306</volume>
          <issue>8</issue>
          <fpage>848</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2011.1204</pub-id>
          <pub-id pub-id-type="medline">21862746</pub-id>
          <pub-id pub-id-type="pii">306/8/848</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maddox</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Albert</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Borden</surname>
              <given-names>WB</given-names>
            </name>
            <name name-style="western">
              <surname>Curtis</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Ferguson</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Kao</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Marcus</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Redberg</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rumsfeld</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Tcheng</surname>
              <given-names>JE</given-names>
            </name>
          </person-group>
          <article-title>The Learning Healthcare System and Cardiovascular Care: A Scientific Statement From the American Heart Association</article-title>
          <source>Circulation</source>
          <year>2017</year>
          <month>04</month>
          <day>04</day>
          <volume>135</volume>
          <issue>14</issue>
          <pub-id pub-id-type="doi">10.1161/cir.0000000000000480</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Masanz</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ogren</surname>
              <given-names>PV</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kipper-Schuler</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
          </person-group>
          <article-title>Mayo clinical Text Analysis and Knowledge Extraction System (cTAKES): architecture, component evaluation and applications</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2010</year>
          <month>09</month>
          <day>01</day>
          <volume>17</volume>
          <issue>5</issue>
          <fpage>507</fpage>
          <lpage>513</lpage>
          <pub-id pub-id-type="doi">10.1136/jamia.2009.001560</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aronson</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Lang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>An overview of MetaMap: historical perspective and recent advances</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2010</year>
          <month>05</month>
          <day>01</day>
          <volume>17</volume>
          <issue>3</issue>
          <fpage>229</fpage>
          <lpage>236</lpage>
          <pub-id pub-id-type="doi">10.1136/jamia.2009.002733</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pradhan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>Wendy</given-names>
            </name>
            <name name-style="western">
              <surname>Manandhar</surname>
              <given-names>Suresh</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>Guergana</given-names>
            </name>
          </person-group>
          <article-title>SemEval-2014 Task 7: Analysis of Clinical Text</article-title>
          <year>2014</year>
          <conf-name>8th International Workshop on Semantic Evaluation (SemEval 2014)</conf-name>
          <conf-date>August 23-24, 2014</conf-date>
          <conf-loc>Dublin, Ireland</conf-loc>
          <fpage>54</fpage>
          <lpage>62</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/s14-2007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pradhan</surname>
              <given-names>Sameer</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>Noemie</given-names>
            </name>
            <name name-style="western">
              <surname>South</surname>
              <given-names>Brett</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez</surname>
              <given-names>David</given-names>
            </name>
            <name name-style="western">
              <surname>Christensen</surname>
              <given-names>Lee</given-names>
            </name>
            <name name-style="western">
              <surname>Vogel</surname>
              <given-names>Amy</given-names>
            </name>
            <name name-style="western">
              <surname>Suominen</surname>
              <given-names>Hanna</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>Wendy</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>Guergana</given-names>
            </name>
          </person-group>
          <article-title>Task 1: ShARe/CLEF eHealth Evaluation Lab 2013</article-title>
          <source>CLEF (Working Notes)</source>
          <year>2013</year>
          <conf-name>ShARe/CLEF eHealth Evaluation Lab</conf-name>
          <conf-date>September 23-26, 2013</conf-date>
          <conf-loc>Valencia, Spain</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>Will K</given-names>
            </name>
            <name name-style="western">
              <surname>Eyler</surname>
              <given-names>Anne E</given-names>
            </name>
            <name name-style="western">
              <surname>Mandelin</surname>
              <given-names>Arthur M</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Tianxi</given-names>
            </name>
            <name name-style="western">
              <surname>Zink</surname>
              <given-names>Raquel M</given-names>
            </name>
            <name name-style="western">
              <surname>Pacheco</surname>
              <given-names>Jennifer A</given-names>
            </name>
            <name name-style="western">
              <surname>Boomershine</surname>
              <given-names>Chad S</given-names>
            </name>
            <name name-style="western">
              <surname>Lasko</surname>
              <given-names>Thomas A</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Hua</given-names>
            </name>
            <name name-style="western">
              <surname>Karlson</surname>
              <given-names>Elizabeth W</given-names>
            </name>
            <name name-style="western">
              <surname>Perez</surname>
              <given-names>Raul G</given-names>
            </name>
            <name name-style="western">
              <surname>Gainer</surname>
              <given-names>Vivian S</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>Shawn N</given-names>
            </name>
            <name name-style="western">
              <surname>Ruderman</surname>
              <given-names>Eric M</given-names>
            </name>
            <name name-style="western">
              <surname>Pope</surname>
              <given-names>Richard M</given-names>
            </name>
            <name name-style="western">
              <surname>Plenge</surname>
              <given-names>Robert M</given-names>
            </name>
            <name name-style="western">
              <surname>Kho</surname>
              <given-names>Abel Ngo</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>Katherine P</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>Joshua C</given-names>
            </name>
          </person-group>
          <article-title>Portability of an algorithm to identify rheumatoid arthritis in electronic health records</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2012</year>
          <month>06</month>
          <volume>19</volume>
          <issue>e1</issue>
          <fpage>e162</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22374935"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000583</pub-id>
          <pub-id pub-id-type="medline">22374935</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000583</pub-id>
          <pub-id pub-id-type="pmcid">PMC3392871</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mehrabi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Roch</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kesterson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Beesley</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dexter</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Palakal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Identification of Patients with Family History of Pancreatic Cancer--Investigation of an NLP System Portability</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2015</year>
          <volume>216</volume>
          <fpage>604</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26262122"/>
          </comment>
          <pub-id pub-id-type="medline">26262122</pub-id>
          <pub-id pub-id-type="pmcid">PMC5863760</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goodwin</surname>
              <given-names>Travis R</given-names>
            </name>
            <name name-style="western">
              <surname>Harabagiu</surname>
              <given-names>Sanda M</given-names>
            </name>
          </person-group>
          <article-title>Multi-modal Patient Cohort Identification from EEG Report and Signal Data</article-title>
          <source>Annual Symposium proceedings</source>
          <year>2016</year>
          <conf-name>American Medical Informatics Association</conf-name>
          <conf-date>Nov 12-16, 2016</conf-date>
          <conf-loc>Chicago, IL, USA</conf-loc>
          <fpage>1794</fpage>
          <lpage>1803</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hanauer</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Law</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Khanna</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Supporting information retrieval from electronic health records: A report of University of Michigan’s nine-year experience in developing and using the Electronic Medical Record Search Engine (EMERSE)</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2015</year>
          <month>06</month>
          <volume>55</volume>
          <fpage>290</fpage>
          <lpage>300</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.05.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ford</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>HE</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cassell</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Extracting information from the text of electronic medical records to improve case detection: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2016</year>
          <month>02</month>
          <day>05</day>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>1007</fpage>
          <lpage>1015</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocv180</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Timmons</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Uppili</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bedrick</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hersh</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Intrainstitutional EHR collections for patient-level information retrieval</article-title>
          <source>Journal of the Association for Information Science and Technology</source>
          <year>2017</year>
          <month>09</month>
          <day>18</day>
          <volume>68</volume>
          <issue>11</issue>
          <fpage>2636</fpage>
          <lpage>2648</lpage>
          <pub-id pub-id-type="doi">10.1002/asi.23884</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Olson</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Koenig</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Maschke</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Morrisette</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Liebow</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>PY</given-names>
            </name>
            <name name-style="western">
              <surname>Fredericksen</surname>
              <given-names>ZS</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Hathcock</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Carnahan</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lindor</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Beebe</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Thibodeau</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Cerhan</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>The Mayo Clinic Biobank: A Building Block for Individualized Medicine</article-title>
          <source>Mayo Clinic Proceedings</source>
          <year>2013</year>
          <month>9</month>
          <volume>88</volume>
          <issue>9</issue>
          <fpage>952</fpage>
          <lpage>962</lpage>
          <pub-id pub-id-type="doi">10.1016/j.mayocp.2013.06.006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Biron</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Metzger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pezet</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sebban</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Barthuet</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Durand</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>An information retrieval system for computerized patient records in the context of a daily hospital practice: the example of the Léon Bérard Cancer Center (France)</article-title>
          <source>Appl Clin Inform</source>
          <year>2017</year>
          <month>12</month>
          <day>20</day>
          <volume>05</volume>
          <issue>01</issue>
          <fpage>191</fpage>
          <lpage>205</lpage>
          <pub-id pub-id-type="doi">10.4338/aci-2013-08-cr-0065</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hanauer</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Law</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Khanna</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Supporting information retrieval from electronic health records: A report of University of Michigan’s nine-year experience in developing and using the Electronic Medical Record Search Engine (EMERSE)</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2015</year>
          <month>06</month>
          <volume>55</volume>
          <fpage>290</fpage>
          <lpage>300</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.05.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Garcelon</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Neuraz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Salomon</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Faour</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Benoit</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Delapalme</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Munnich</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Burgun</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rance</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>A clinician friendly data warehouse oriented toward narrative reports: Dr. Warehouse</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2018</year>
          <month>04</month>
          <volume>80</volume>
          <fpage>52</fpage>
          <lpage>63</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2018.02.019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Toti</surname>
              <given-names>Giulia</given-names>
            </name>
            <name name-style="western">
              <surname>Morley</surname>
              <given-names>Katherine I</given-names>
            </name>
            <name name-style="western">
              <surname>Ibrahim</surname>
              <given-names>Zina M</given-names>
            </name>
            <name name-style="western">
              <surname>Folarin</surname>
              <given-names>Amos</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>Richard</given-names>
            </name>
            <name name-style="western">
              <surname>Kartoglu</surname>
              <given-names>Ismail</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>Asha</given-names>
            </name>
            <name name-style="western">
              <surname>Stringer</surname>
              <given-names>Clive</given-names>
            </name>
            <name name-style="western">
              <surname>Gale</surname>
              <given-names>Darren</given-names>
            </name>
            <name name-style="western">
              <surname>Gorrell</surname>
              <given-names>Genevieve</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>Angus</given-names>
            </name>
            <name name-style="western">
              <surname>Broadbent</surname>
              <given-names>Matthew</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>Robert</given-names>
            </name>
            <name name-style="western">
              <surname>Dobson</surname>
              <given-names>Richard J B</given-names>
            </name>
          </person-group>
          <article-title>SemEHR: A general-purpose semantic search system to surface semantic data from clinical notes for tailored care, trial recruitment, and clinical research</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2018</year>
          <month>05</month>
          <day>01</day>
          <volume>25</volume>
          <issue>5</issue>
          <fpage>530</fpage>
          <lpage>537</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29361077"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocx160</pub-id>
          <pub-id pub-id-type="medline">29361077</pub-id>
          <pub-id pub-id-type="pii">4817428</pub-id>
          <pub-id pub-id-type="pmcid">PMC6019046</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>FHIR (Fast Healthcare Interoperability Resources)</collab>
          </person-group>
          <source>FHIR Overview</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hl7.org/fhir/overview.html">https://www.hl7.org/fhir/overview.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stubbs</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Filannino</surname>
              <given-names>Michele</given-names>
            </name>
            <name name-style="western">
              <surname>Soysal</surname>
              <given-names>Ergin</given-names>
            </name>
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>Samuel</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>Özlem</given-names>
            </name>
          </person-group>
          <article-title>Cohort selection for clinical trials: n2c2 2018 shared task track 1</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>11</month>
          <day>01</day>
          <volume>26</volume>
          <issue>11</issue>
          <fpage>1163</fpage>
          <lpage>1171</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz163</pub-id>
          <pub-id pub-id-type="medline">31562516</pub-id>
          <pub-id pub-id-type="pii">5575392</pub-id>
          <pub-id pub-id-type="pmcid">PMC6798568</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Sim</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Richesson</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Formal representation of eligibility criteria: A literature review</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2010</year>
          <month>06</month>
          <volume>43</volume>
          <issue>3</issue>
          <fpage>451</fpage>
          <lpage>467</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2009.12.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Boland</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Theodoratos</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SB</given-names>
            </name>
          </person-group>
          <article-title>EliXR: an approach to eligibility criteria extraction and representation</article-title>
          <source>Journal of the American Medical Informatics Association</source>
          <year>2011</year>
          <month>12</month>
          <day>01</day>
          <volume>18</volume>
          <issue>Supplement 1</issue>
          <fpage>i116</fpage>
          <lpage>i124</lpage>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000321</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hruby</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Rusanov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>EliIE: An open-source information extraction system for clinical trial eligibility criteria</article-title>
          <source>Journal of the American Medical Informatics Association</source>
          <year>2017</year>
          <volume>24</volume>
          <issue>6</issue>
          <fpage>1062</fpage>
          <lpage>1071</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocx019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <article-title>OMOP Common Data Model v5.3.1</article-title>
          <source>GitHub</source>
          <access-date>2020-08-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/OHDSI/CommonDataModel/tree/v5.3.1">https://github.com/OHDSI/CommonDataModel/tree/v5.3.1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <article-title>Metathesaurus</article-title>
          <source>UMLS</source>
          <access-date>2020-08-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nlm.nih.gov/research/umls/knowledge_sources/metathesaurus/index.html">https://www.nlm.nih.gov/research/umls/knowledge_sources/metathesaurus/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <source>ATHENA standardized vocabularies - OHDSI</source>
          <access-date>2020-08-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ohdsi.org/analytic-tools/athena-standardized-vocabularies/">https://www.ohdsi.org/analytic-tools/athena-standardized-vocabularies/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <source>Elasticsearch: The Official Distributed Search &#38; Analytics Engine</source>
          <access-date>2020-08-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.elastic.co/elasticsearch/">https://www.elastic.co/elasticsearch/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Yanshan</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>Andrew</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Sijia</given-names>
            </name>
            <name name-style="western">
              <surname>Hersh</surname>
              <given-names>William</given-names>
            </name>
            <name name-style="western">
              <surname>Bedrick</surname>
              <given-names>Steven</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Hongfang</given-names>
            </name>
          </person-group>
          <article-title>Test collections for electronic health record-based clinical information retrieval</article-title>
          <source>JAMIA Open</source>
          <year>2019</year>
          <month>10</month>
          <volume>2</volume>
          <issue>3</issue>
          <fpage>360</fpage>
          <lpage>368</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31709390"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooz016</pub-id>
          <pub-id pub-id-type="medline">31709390</pub-id>
          <pub-id pub-id-type="pii">ooz016</pub-id>
          <pub-id pub-id-type="pmcid">PMC6824517</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huser</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>DeFalco</surname>
              <given-names>FJ</given-names>
            </name>
            <name name-style="western">
              <surname>Schuemie</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Velez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Boyce</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Duke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Khare</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Utidjian</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Multisite Evaluation of a Data Quality Tool for Patient-Level Clinical                        Datasets</article-title>
          <source>eGEMs</source>
          <year>2016</year>
          <month>11</month>
          <day>30</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>24</fpage>
          <pub-id pub-id-type="doi">10.13063/2327-9214.1239</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>KJ</given-names>
            </name>
          </person-group>
          <article-title>Mining Hierarchies Similarity Clusters from Value Set Repositories</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <conf-name>AMIA Annual Symposium</conf-name>
          <conf-date>Nov 4-8, 2017</conf-date>
          <conf-loc>Washington, DC, USA</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marling</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Whitehouse</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Aha</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Watson</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Case-Based Reasoning in the Care of Alzheimer's Disease Patients</article-title>
          <source>International Conference on Case-Based Reasoning. Lecture Notes in Computer Science</source>
          <year>2001</year>
          <publisher-loc>Berlin</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>702</fpage>
          <lpage>715</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van den Branden</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wiratunga</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Burton</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Craw</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Integrating case-based reasoning with an electronic patient record system</article-title>
          <source>Artificial Intelligence in Medicine</source>
          <year>2011</year>
          <month>2</month>
          <volume>51</volume>
          <issue>2</issue>
          <fpage>117</fpage>
          <lpage>123</lpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2010.12.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miotto</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Case-based reasoning using electronic health records efficiently identifies eligible patients for clinical trials</article-title>
          <source>Journal of the American Medical Informatics Association</source>
          <year>2015</year>
          <month>03</month>
          <day>13</day>
          <volume>22</volume>
          <issue>e1</issue>
          <fpage>e141</fpage>
          <lpage>e150</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocu050</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Buckley</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Singhal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mitra</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Salton</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>New Retrieval Approaches Using SMART: TREC 4</article-title>
          <source>The Fourth Text REtrieval Conference (TREC-4)</source>
          <year>1995</year>
          <conf-name>Fourth text retrieval conference (TREC-4)</conf-name>
          <conf-date>November 1-3</conf-date>
          <conf-loc>Gaithersburg, Maryland</conf-loc>
          <publisher-name>NIST Special Publication 500-236</publisher-name>
          <fpage>25</fpage>
          <lpage>48</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://trec.nist.gov/pubs/trec4/papers/Cornell_trec4.ps.gz"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Ranking with recursive neural networks and its application to multi-document summarization</article-title>
          <year>2015</year>
          <conf-name>Proceedings of the Twenty-Ninth AAAI Conference on Artificial Intelligence</conf-name>
          <conf-date>2015</conf-date>
          <conf-loc>Austin, TX, USA</conf-loc>
          <fpage>2153</fpage>
          <lpage>2159</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Unsupervised ensemble ranking of terms in electronic health record notes based on their importance to patients</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2017</year>
          <month>04</month>
          <volume>68</volume>
          <fpage>121</fpage>
          <lpage>131</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2017.02.016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lasko</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A study of active learning methods for named entity recognition in clinical text</article-title>
          <source>Journal of Biomedical Informatics</source>
          <year>2015</year>
          <month>12</month>
          <volume>58</volume>
          <fpage>11</fpage>
          <lpage>18</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2015.09.010</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
