<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i11e19612</article-id>
      <article-id pub-id-type="pmid">33151150</article-id>
      <article-id pub-id-type="doi">10.2196/19612</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Viewpoint</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Viewpoint</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Amplifying Domain Expertise in Clinical Data Pipelines</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Afzal</surname>
            <given-names>Muhammad</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Benis</surname>
            <given-names>Arriel</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Spiliopoulou</surname>
            <given-names>Myra</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Rahman</surname>
            <given-names>Protiva</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>The Ohio State University</institution>
            <addr-line>1800 Cannon Drive</addr-line>
            <addr-line>Columbus, OH, 43210</addr-line>
            <country>United States</country>
            <phone>1 3056135087</phone>
            <email>rahman.92@osu.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0000-8558</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Nandi</surname>
            <given-names>Arnab</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4138-603X</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Hebert</surname>
            <given-names>Courtney</given-names>
          </name>
          <degrees>MSc, MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1646-702X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>The Ohio State University</institution>
        <addr-line>Columbus, OH</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Protiva Rahman <email>rahman.92@osu.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>11</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>5</day>
        <month>11</month>
        <year>2020</year>
      </pub-date>
      <volume>8</volume>
      <issue>11</issue>
      <elocation-id>e19612</elocation-id>
      <history>
        <date date-type="received">
          <day>24</day>
          <month>4</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>25</day>
          <month>5</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>7</day>
          <month>7</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>22</day>
          <month>7</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Protiva Rahman, Arnab Nandi, Courtney Hebert. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 05.11.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2020/11/e19612" xlink:type="simple"/>
      <abstract>
        <p>Digitization of health records has allowed the health care domain to adopt data-driven algorithms for decision support. There are multiple people involved in this process: a data engineer who processes and restructures the data, a data scientist who develops statistical models, and a domain expert who informs the design of the data pipeline and consumes its results for decision support. Although there are multiple data interaction tools for data scientists, few exist to allow domain experts to interact with data meaningfully. Designing systems for domain experts requires careful thought because they have different needs and characteristics from other end users. There should be an increased emphasis on the system to optimize the experts’ interaction by directing them to high-impact data tasks and reducing the total task completion time. We refer to this optimization as amplifying domain expertise. Although there is active research in making machine learning models more explainable and usable, it focuses on the final outputs of the model. However, in the clinical domain, expert involvement is needed at every pipeline step: curation, cleaning, and analysis. To this end, we review literature from the database, human-computer information, and visualization communities to demonstrate the challenges and solutions at each of the data pipeline stages. Next, we present a taxonomy of expertise amplification, which can be applied when building systems for domain experts. This includes summarization, guidance, interaction, and acceleration. Finally, we demonstrate the use of our taxonomy with a case study.</p>
      </abstract>
      <kwd-group>
        <kwd>review</kwd>
        <kwd>data analysis</kwd>
        <kwd>data science</kwd>
        <kwd>clinical informatics</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Recent advancements in data availability (eg, digitization of health records) and deep neural networks [<xref ref-type="bibr" rid="ref1">1</xref>] have led to the resurgence of artificial intelligence. This has served as a catalyst for data-driven decision making in many domains. However, for high-stakes applications, such as financial and health care domains, it is rare for domain experts to execute decisions solely based on artificial intelligence algorithms [<xref ref-type="bibr" rid="ref2">2</xref>]. Domain experts in this context are individuals who are not necessarily trained in computational fields but inform the design and are end users of data-driven algorithms (eg, health care providers, hospital administrators). Note that domain experts can have different levels of expertise in their specific domain (eg, interns, residents, attendings), and we do not differentiate between these levels in this work. Although the role of experts has been studied in clinical decision support (CDS), we find a gap in their involvement in the data analysis pipeline, which we focus on in this work.</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Domain expertise amplification.</p>
        </caption>
        <graphic xlink:href="medinform_v8i11e19612_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>Domain expert involvement remains necessary in the health care domain, but this involvement brings significant challenges and implications for data-driven applications. Domain experts are expensive resources with limited time for these efforts, and excessive reliance on domain expertise could potentially lead to systems that are overly customized and not reproducible or scalable. Owing to these challenges, designing systems for them requires careful consideration. To address these challenges, we present a framework for amplified intelligence that identifies the points in the process where expertise can be effectively leveraged. <italic>Amplification of expertise</italic> then refers to the process of automating redundant or inferable tasks, so that domain experts can focus their efforts on tasks that require domain knowledge. This is a synergy between the domain expert and the system, which involves summarization of data and decisions, guidance toward insights, interaction by the domain expert, and acceleration of input (<xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
      <sec>
        <title>Prior Work</title>
        <p>There is active research on interactive and human-in-the-loop systems in many computer science disciplines. The database and visualization communities have produced numerous tools [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref8">8</xref>] to aid data scientists with data wrangling and analysis. At the decision-making stage, the machine learning community has looked at making black box models explainable [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref12">12</xref>], while the human-computer interaction (HCI) community has been studying how differences in explainability affect decision making [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Finally, the crowdsourcing community has concentrated on human-powered computation by optimizing tasks (eg, simplifying tasks [<xref ref-type="bibr" rid="ref15">15</xref>], minimizing the number of questions [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>], optimizing workflows [<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref20">20</xref>]). However, we focus on data-powered experts by amplifying expertise. Although we draw from prior work, systems designed for health care domain experts require special consideration because they have characteristics that distinguish them from data scientists and crowdworkers.</p>
      </sec>
      <sec>
        <title>Special Considerations in the Health Care Domain</title>
        <p>First, domain expert input is usually needed for data tasks that require experiential knowledge and judgment (such as medical diagnoses and forensic analysis [<xref ref-type="bibr" rid="ref21">21</xref>]). The critical and subjective nature of these decisions necessitates transparency, both from the algorithm and domain experts. Hence, the system needs to summarize the impact of algorithmic or experts’ manipulation of the data [<xref ref-type="bibr" rid="ref22">22</xref>]. Second, due to their specialized training, domain experts’ time is expensive and limited [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. This constraint makes it imperative that we build tools that provide insights while reducing physical and cognitive effort [<xref ref-type="bibr" rid="ref25">25</xref>]. Third, as domain experts are trained in noncomputational fields, systems designed for them should provide high-level interaction capabilities. This is referred to as <italic>editable shared representations</italic> between computers and humans [<xref ref-type="bibr" rid="ref26">26</xref>]. Examples include natural language interfaces and form-based input [<xref ref-type="bibr" rid="ref27">27</xref>]. Finally, domain experts are highly trained individuals, which allows systems to accelerate their input by using domain-specific assumptions and ontologies [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. Keeping these factors in mind, expertise amplification involves summarization, guidance, interaction, and acceleration (<xref rid="figure1" ref-type="fig">Figure 1</xref>). We will explore each of these in detail in the following sections.</p>
      </sec>
      <sec>
        <title>The Data Pipeline</title>
        <p>There are opportunities to amplify expertise at all stages of the pipeline. The data pipeline refers to the different stages that the data need to go through before they can provide decision support. It can roughly be broken into 3 stages: curation, cleaning, and analysis. Tools at the end of the pipeline have only looked at explaining models but not at amplification. In contrast, tools at earlier pipeline stages have been designed mainly for data scientists and not for experts. However, domain experts are involved at every stage of the pipeline [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref31">31</xref>], especially in clinical research settings where data sets contain specialized information. Thus, there is a need to amplify domain expertise throughout the pipeline. In this work, we provide examples from the informatics literature to highlight the need for expert involvement at each pipeline step. We then review literature from the database, HCI, and visualization communities about challenges and current approaches at different stages. On the basis of our review, we present a novel taxonomy for amplifying domain expertise and demonstrate its use with a case study in empiric antibiotic treatment. Our review can serve as a guide to new clinical research projects, and our taxonomy can be applied when designing systems for experts, especially for low-budget projects when there are limited resources and availability of domain experts.</p>
      </sec>
    </sec>
    <sec>
      <title>Challenges in the Data Pipeline</title>
      <p>This section is organized to reflect the clinical data pipeline, which often involves the following steps: data are curated from the electronic health record (EHR) data warehouse and annotated with external data sources, cleaned and validated, and analyzed. Multiple people are involved in various stages of the pipeline. The prevalent notion of the workflow is that a data engineer restructures, cleans, and sets up the infrastructure for data analysis, and a data scientist then analyzes and models the data, which a software engineer implements into a decision support system. A domain expert then consumes the end product to make decisions. However, in clinical settings, domain expert involvement is required at every step of the pipeline. Allowing domain experts to directly and efficiently interact with data removes the need for them to rely on a data engineer or data scientist who can then focus on infrastructure and model construction. Moreover, since domain experts are the stakeholders in the output of data pipelines, in our experience, they tend to be engaged users who want to interact with data and leverage their expertise. In this section, we motivate domain expert involvement with examples from the past five years of research presented at the American Medical Informatics Association’s annual symposiums. We then review the computer science literature to identify current tools and opportunities for expertise amplification at the 3 stages of the data pipeline: data curation, data cleaning, and data analysis, as each of these corresponds to a research area of its own.</p>
      <sec>
        <title>Data Curation</title>
        <p>Curating data sets for analysis can be a laborious process that can involve combining multiple data sources and identifying relevant attributes. Data integration and data discovery address these problems.</p>
        <sec>
          <title>Data Integration</title>
          <p>Medical data pipelines often involve data that were collected for purposes other than answering the research question at hand. This usually implies that information is not captured in a manner fit for analysis [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>], with issues such as missing metadata information [<xref ref-type="bibr" rid="ref34">34</xref>]. Moreover, in some situations such as rare disease studies, the cohort size is too small for analysis [<xref ref-type="bibr" rid="ref35">35</xref>], while in other cases, external features such as air quality or drug components [<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref39">39</xref>] might be needed. One possible solution to these data quality issues is to curate data from multiple institutions and external sources. However, the different data representations [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref40">40</xref>] pose challenges in entity matching, metadata inference, and data integrity [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. Data integration aims to automatically resolve schema matching and entity matching problems during data curation. For biomedical data sets, integration can involve standardization by mapping to ontologies with controlled vocabularies [<xref ref-type="bibr" rid="ref43">43</xref>-<xref ref-type="bibr" rid="ref45">45</xref>]. Although current approaches use deep learning for integration [<xref ref-type="bibr" rid="ref46">46</xref>-<xref ref-type="bibr" rid="ref50">50</xref>], generating a training corpus and validating results require domain expert input. For example, Cui et al [<xref ref-type="bibr" rid="ref35">35</xref>] require domain experts to validate data curation efforts for studying sudden death in epilepsy. In another example, building an automatic concept annotator for standardizing biomedical literature [<xref ref-type="bibr" rid="ref50">50</xref>] required experts to manually annotate different concepts [<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref54">54</xref>]. Furthermore, a domain expert will be able to catch inconsistencies or errors made by an automated integration tool much faster than a data engineer who is unfamiliar with the domain. Thus, there is a need to build interactive data integration tools for domain experts.</p>
        </sec>
        <sec>
          <title>Data Discovery</title>
          <p>Data discovery refers to the process of finding relevant attributes or cohorts for analysis. This is especially true for multidisciplinary teams where the domain expert knows the disease definition but is not familiar with the database schema. At the same time, the data engineer can explore the schema but might not recognize that a field is relevant. Integrating data from multiple sources only exacerbates this problem. In the informatics community, DIVA [<xref ref-type="bibr" rid="ref55">55</xref>] aids in cohort discovery by ingesting expert-defined constraints, while visual analytic systems [<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref57">57</xref>] such as CAVA provide an interactive interface. In the database community, Nargesian et al [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref59">59</xref>] have looked at finding unionable (more data points) and joinable (more attributes) data for a given data set. These algorithms are useful when trying to augment data sets with publicly available data sets such as MIMIC [<xref ref-type="bibr" rid="ref60">60</xref>] or even for exploring a complex schema such as the Unified Medical Language System (UMLS) [<xref ref-type="bibr" rid="ref61">61</xref>]. In addition to using properties of the data to find possible attribute matches, domain rules can be useful for identifying relevant data subsets. This requires an interactive interface where domain experts can look at subsets of interest and iteratively join and filter the data [<xref ref-type="bibr" rid="ref62">62</xref>] to find the required cohort. Recently, query logs have been used to design precision interfaces [<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref64">64</xref>] that customize the interface for the user’s task.</p>
        </sec>
      </sec>
      <sec>
        <title>Data Cleaning</title>
        <p>After curating relevant data sets, data still need to go through multiple preprocessing steps before they are analysis-ready. These include identifying and fixing incorrect data, data augmentation, and data transformation [<xref ref-type="bibr" rid="ref65">65</xref>], all of which benefit from domain expert involvement.</p>
        <sec>
          <title>Error Fixes</title>
          <p>EHR data are known to be messy and have errors and missing values [<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref68">68</xref>]. A typical data cleaning method is the use of rule-based systems that identify dirty data by detecting violations of user-specified rules or known functional dependencies [<xref ref-type="bibr" rid="ref69">69</xref>-<xref ref-type="bibr" rid="ref78">78</xref>]. These systems do not optimize the expert’s rule specification process. Crowdsourcing systems have also been used to correct values [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref79">79</xref>], although they are not always an option due to data complexity or confidentiality. Another approach to identify and clean data is to augment the data with external knowledge bases [<xref ref-type="bibr" rid="ref80">80</xref>-<xref ref-type="bibr" rid="ref82">82</xref>]. More recently, there have been many approaches [<xref ref-type="bibr" rid="ref83">83</xref>-<xref ref-type="bibr" rid="ref85">85</xref>] that use deep learning for automated data cleaning. Of note is Holoclean [<xref ref-type="bibr" rid="ref84">84</xref>], which uses a statistical model to combine various data repair signals such as violation of integrity constraints, functional dependencies, and knowledge bases. Although this achieves higher performance than using each method in isolation, there is scope for identifying which of the signals are performing the poorest or what additional information would help improve the system’s performance. Identifying this information, incorporating domain knowledge, and presenting it succinctly to a domain expert remain open problems.</p>
        </sec>
        <sec>
          <title>Data Augmentation</title>
          <p>Although data entry errors [<xref ref-type="bibr" rid="ref86">86</xref>] and missing information can be imputed by semiautomated methods, a more difficult problem is that of creating a gold standard for training data, which is referred to as data augmentation. Many health care applications require annotating training data, for example, clinical text annotation [<xref ref-type="bibr" rid="ref87">87</xref>-<xref ref-type="bibr" rid="ref89">89</xref>], CDS [<xref ref-type="bibr" rid="ref90">90</xref>-<xref ref-type="bibr" rid="ref92">92</xref>], identifying new terms for ontologies [<xref ref-type="bibr" rid="ref93">93</xref>], index terms for articles [<xref ref-type="bibr" rid="ref94">94</xref>], and disease-specific annotations [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref95">95</xref>,<xref ref-type="bibr" rid="ref96">96</xref>]. However, very few applications focus on optimizing the domain expert’s data augmentation effort, which is eventually crucial to model performance. A notable approach to this is the Snorkel system [<xref ref-type="bibr" rid="ref97">97</xref>], which automates data augmentation by learning the labeling function, thus accelerating the domain expert’s input. However, there are opportunities to make the initial labeling process more interactive, as domain experts are required to write code in Snorkel. Furthermore, the system does not provide feedback on how labels affect the data set or final model, which is crucial for building trust in medical pipelines. Examples of interactive solutions include Icarus [<xref ref-type="bibr" rid="ref28">28</xref>] for augmenting microbiology data and Halpern et al's system [<xref ref-type="bibr" rid="ref98">98</xref>] for annotating clinical anchors. Both systems use an ontology to interactively amplify domain expertise.</p>
        </sec>
        <sec>
          <title>Data Transformation</title>
          <p>Other than fixing incorrect values and augmenting data sets, often, data need to be restructured (eg, splitting values in a column, reformatting dates). Data wrangling has emerged as a separate field in the past decade because of data diversity. Potter’s Wheel [<xref ref-type="bibr" rid="ref99">99</xref>] is one of the first interactive data transformation systems. It allows the user to specify data transforms that are encoded as constraints and used to detect errors. Building on this idea, systems such as Polaris [<xref ref-type="bibr" rid="ref100">100</xref>] and Trifacta [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref101">101</xref>] infer syntactic rules from user edits. Similarly, programming-by-example systems [<xref ref-type="bibr" rid="ref102">102</xref>,<xref ref-type="bibr" rid="ref103">103</xref>] learn transformations from a set of input-output pairs. These techniques have informed the autofill function of Microsoft Excel. As many domain experts employ Excel for data transformations and analysis [<xref ref-type="bibr" rid="ref104">104</xref>], spreadsheet interfaces should consider incorporating domain knowledge.</p>
        </sec>
      </sec>
      <sec>
        <title>Data Analysis</title>
        <p>We now move to the final step of the pipeline. This includes exploratory analysis to identify attributes of interest and explainability of models for decision making.</p>
        <sec>
          <title>Data Exploration</title>
          <p>During the exploration step, it is crucial for the domain expert to be able to directly interact with the data for effective hypothesis generation. However, domain experts often must go through a data engineer to execute the relevant query [<xref ref-type="bibr" rid="ref105">105</xref>,<xref ref-type="bibr" rid="ref106">106</xref>] or extract information from unstructured notes [<xref ref-type="bibr" rid="ref107">107</xref>]. The data are then validated by the domain expert through manual chart review, since data engineers without domain knowledge may apply naive filters that hide insights or find spurious correlations. To address these challenges, the informatics community has built tools to accelerate chart review [<xref ref-type="bibr" rid="ref108">108</xref>] and allow interactive filtering and analysis [<xref ref-type="bibr" rid="ref109">109</xref>,<xref ref-type="bibr" rid="ref110">110</xref>]. Finalizing an analysis data set can then take multiple iterations of requests and validations between the domain expert and data engineer. In some cases, data engineers create custom dashboards for domain experts [<xref ref-type="bibr" rid="ref111">111</xref>-<xref ref-type="bibr" rid="ref113">113</xref>], but the latter are then limited to brushing and linking on the provided view. Mixed-initiative interfaces such as Tableau [<xref ref-type="bibr" rid="ref100">100</xref>] and Dive [<xref ref-type="bibr" rid="ref5">5</xref>] recommend visualizations based on statistical properties of the data but do not use domain-specific ontologies that can enrich the domain experts’ interaction and accelerate their workflow.</p>
          <p>Visualizations, when used appropriately, can provide effective summaries and reveal patterns not immediately evident by statistical overviews [<xref ref-type="bibr" rid="ref114">114</xref>]. Summaries reduce the cognitive load on domain experts during multidimensional data exploration, allowing them to drill down to specific instances as needed [<xref ref-type="bibr" rid="ref115">115</xref>]. Although many visualization recommendation systems exist for analyzing numerical data [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref116">116</xref>-<xref ref-type="bibr" rid="ref118">118</xref>], visualizations in health care often include categorical and text data [<xref ref-type="bibr" rid="ref119">119</xref>-<xref ref-type="bibr" rid="ref122">122</xref>]. As such, node-link diagrams are a common data representation and have been used for tracking family history [<xref ref-type="bibr" rid="ref123">123</xref>], decision making [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref124">124</xref>], and identifying hidden variables [<xref ref-type="bibr" rid="ref125">125</xref>]. Visual interfaces thus amplify expertise by summarizing data. However, they can be more powerful if they allow interaction, provide guidance by highlighting interesting regions for exploration [<xref ref-type="bibr" rid="ref126">126</xref>], and accelerate workflows by extrapolating domain expert interactions based on properties of the data [<xref ref-type="bibr" rid="ref22">22</xref>]. Thus, there is a need to provide domain experts with tools that allow for more sophisticated data interaction.</p>
        </sec>
        <sec>
          <title>Explainability</title>
          <p>Finally, we cannot discuss clinical pipelines without discussing explainability. The interpretability of rule-based systems has made them popular in a variety of clinical applications, including decision support [<xref ref-type="bibr" rid="ref127">127</xref>,<xref ref-type="bibr" rid="ref128">128</xref>], antibiotic recommendation [<xref ref-type="bibr" rid="ref129">129</xref>], updating annotations [<xref ref-type="bibr" rid="ref130">130</xref>], and auditing [<xref ref-type="bibr" rid="ref131">131</xref>]. Interpretability is essential because domain experts want a cause-and-effect relationship, based on which actionable decisions can be made [<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref132">132</xref>]. Furthermore, health care providers may not use models they do not trust, and building trust requires providing context and explanations [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
          <p>Current approaches in health care research use weights and activation of features to characterize attribute importance [<xref ref-type="bibr" rid="ref133">133</xref>-<xref ref-type="bibr" rid="ref135">135</xref>]. RuleMatrix [<xref ref-type="bibr" rid="ref136">136</xref>] provides an alternate approach where a set of rules represents the deep learning model. The expert can explore various facets of each rule, such as data affected, distribution, and errors. In another example, Cai et al [<xref ref-type="bibr" rid="ref29">29</xref>] built a tool to help pathologists find similar images to aid in diagnoses. The tool allows domain experts to search for similar images and then interactively refine the search results. It allows refinement by region (crop an image), refinement by concept (filter by extracted concepts from image embeddings), and refinement by example (select multiple images as examples). These refinement techniques are examples of acceleration, where interactions are interpolated to the entire data set by learning general functions. Explainability is thus key to the adoption of deep learning models. Although they have mainly been applied in the analysis stage of the pipeline, they are equally important when applying automated algorithms to curation and cleaning.</p>
          <p>Therefore, amplifying domain experts’ abilities in the analysis stage requires interactive data systems using a combination of statistical algorithms and compelling visualizations. Moreover, these systems need to follow design-study principles [<xref ref-type="bibr" rid="ref137">137</xref>]. They need to allow interaction with domain experts for a needs assessment and an empirical evaluation to ensure that correct information is portrayed effectively. Otherwise, the system can end up burdening and biasing the domain expert instead of helping [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref101">101</xref>].</p>
          <p>We have highlighted the need for domain expert involvement in the pipeline and describe some of the challenges they encounter. Although we have briefly expanded on some available solutions, <xref ref-type="table" rid="table1">Table 1</xref> provides a more comprehensive list of references. Summarizing each technique is outside the scope of this paper, but it provides a guide to interested readers for further reading.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Review of current approaches for each data pipeline stage.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="30"/>
              <col width="360"/>
              <col width="0"/>
              <col width="580"/>
              <thead>
                <tr valign="top">
                  <td colspan="3">Current solutions</td>
                  <td colspan="2">Domain expert role</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="5">
                    <bold>Data curation</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Data integration</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <list list-type="bullet">
                      <list-item>
                        <p>Schema matching [<xref ref-type="bibr" rid="ref138">138</xref>-<xref ref-type="bibr" rid="ref143">143</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Interactive integration [<xref ref-type="bibr" rid="ref144">144</xref>,<xref ref-type="bibr" rid="ref145">145</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Webtables integration [<xref ref-type="bibr" rid="ref146">146</xref>-<xref ref-type="bibr" rid="ref151">151</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Machine learning [<xref ref-type="bibr" rid="ref46">46</xref>-<xref ref-type="bibr" rid="ref49">49</xref>]</p>
                      </list-item>
                    </list>
                  </td>
                  <td>Domain experts are needed to validate results of integration, and interactively correct automated methods, which can then update their algorithm</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Data discovery</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <list list-type="bullet">
                      <list-item>
                        <p>Attribute search [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref152">152</xref>,<xref ref-type="bibr" rid="ref153">153</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Interactive querying [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref62">62</xref>-<xref ref-type="bibr" rid="ref64">64</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Visual analytics [<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref57">57</xref>]</p>
                      </list-item>
                    </list>
                  </td>
                  <td>Domain expert feedback is needed to finalize the analysis data set</td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>Data cleaning</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Error fixes</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <list list-type="bullet">
                      <list-item>
                        <p>Rule-based [<xref ref-type="bibr" rid="ref69">69</xref>-<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref154">154</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Crowdbased [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref79">79</xref>,<xref ref-type="bibr" rid="ref155">155</xref>,<xref ref-type="bibr" rid="ref156">156</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Knowledgebase [<xref ref-type="bibr" rid="ref80">80</xref>-<xref ref-type="bibr" rid="ref82">82</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Machine learning [<xref ref-type="bibr" rid="ref83">83</xref>-<xref ref-type="bibr" rid="ref85">85</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Functional dependency [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref165">165</xref>]</p>
                      </list-item>
                    </list>
                  </td>
                  <td>Domain expert input can be used to identify and fix errors</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Augmentation</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <list list-type="bullet">
                      <list-item>
                        <p>Machine learning [<xref ref-type="bibr" rid="ref97">97</xref>,<xref ref-type="bibr" rid="ref166">166</xref>,<xref ref-type="bibr" rid="ref167">167</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Interactive [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref98">98</xref>,<xref ref-type="bibr" rid="ref168">168</xref>-<xref ref-type="bibr" rid="ref170">170</xref>]</p>
                      </list-item>
                    </list>
                  </td>
                  <td>Domain experts can augment missing data with domain-specific rules</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Transformation</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <list list-type="bullet">
                      <list-item>
                        <p>Programming by example [<xref ref-type="bibr" rid="ref102">102</xref>,<xref ref-type="bibr" rid="ref103">103</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Interactive rules [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref99">99</xref>-<xref ref-type="bibr" rid="ref101">101</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Foreign-key detection [<xref ref-type="bibr" rid="ref153">153</xref>,<xref ref-type="bibr" rid="ref171">171</xref>-<xref ref-type="bibr" rid="ref175">175</xref>]</p>
                      </list-item>
                    </list>
                  </td>
                  <td>Domain experts can restructure the data to make it semantically valid</td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>Data analysis</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Exploration</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <list list-type="bullet">
                      <list-item>
                        <p>Optimize performance [<xref ref-type="bibr" rid="ref176">176</xref>-<xref ref-type="bibr" rid="ref179">179</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Optimize insight [<xref ref-type="bibr" rid="ref126">126</xref>,<xref ref-type="bibr" rid="ref180">180</xref>,<xref ref-type="bibr" rid="ref181">181</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Provenance [<xref ref-type="bibr" rid="ref182">182</xref>,<xref ref-type="bibr" rid="ref183">183</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Visualizations [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref116">116</xref>-<xref ref-type="bibr" rid="ref118">118</xref>,<xref ref-type="bibr" rid="ref184">184</xref>-<xref ref-type="bibr" rid="ref188">188</xref>]</p>
                      </list-item>
                    </list>
                  </td>
                  <td>Domain experts interact with summaries and outliers to draw insight</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Explainable</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <list list-type="bullet">
                      <list-item>
                        <p>Systems [<xref ref-type="bibr" rid="ref189">189</xref>,<xref ref-type="bibr" rid="ref190">190</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Visualizations [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref136">136</xref>]</p>
                      </list-item>
                      <list-item>
                        <p>Empirical studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]</p>
                      </list-item>
                    </list>
                  </td>
                  <td>Domain experts inform the model design to ensure explainability</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
        </sec>
      </sec>
    </sec>
    <sec>
      <title>Taxonomy of Expertise Amplification</title>
      <p>The previous section elucidated the need for domain expert involvement throughout the clinical data pipeline. In all steps, domain expert involvement can improve automated methods but must be implemented appropriately to ensure that the process remains robust and reproducible. Taking this into consideration, we propose a taxonomy that can be employed when designing systems to amplify expertise in the clinical pipeline. Domain expertise amplification by a system can broadly be categorized into 4 dimensions: summarization, guidance, interactivity, and acceleration, as shown in <xref rid="figure1" ref-type="fig">Figures 1</xref> and <xref rid="figure2" ref-type="fig">2</xref>. Thus, a system that wishes to amplify expertise should apply one or more of these dimensions. We demonstrate these categories with examples from computer science literature.</p>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Taxonomy of expertise amplification: the first level shows the 4 dimensions that should be employed by a system for expertise amplification. The second level enumerates the subdimensions along which amplification can be done, while the fourth level in gray shows tools that can be applied.</p>
        </caption>
        <graphic xlink:href="medinform_v8i11e19612_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <sec>
        <title>Summarization</title>
        <p>The time constraints of experts along with transparency requirements in the clinical domain motivate the need for effective summaries of data and human decisions. Although data summaries are important for analysis, summaries of human decisions allow for improved explainability and reproducibility.</p>
        <sec>
          <title>Data</title>
          <p>An amplification system should summarize large and complex data sets so that experts can meaningfully consume them. This is relevant for identifying inconsistencies as well as for open-ended exploration during analysis. It can be overwhelming for an expert to go through large and wide tables. Therefore, amplification systems should automatically summarize complex data [<xref ref-type="bibr" rid="ref191">191</xref>]. Although providing data samples [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref76">76</xref>] and statistical summaries such as mean, variance, and standard deviation can be useful for providing a bird’s eye view, they are not always enough to reveal patterns [<xref ref-type="bibr" rid="ref114">114</xref>]. In such cases, <italic>visual summaries</italic> can provide additional insight, as done by the CAVA system [<xref ref-type="bibr" rid="ref56">56</xref>]. Multidimensional data can be visually summarized by presenting each dimension as a coordinated histogram with linked brushing and filtering [<xref ref-type="bibr" rid="ref176">176</xref>].</p>
        </sec>
        <sec>
          <title>Human Decisions</title>
          <p>In addition to data, amplification systems need to summarize algorithmic and human decisions as well. This is because domain expert involvement is usually required in situations where it is necessary to have high-quality data [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. Hence, amplification systems also require high transparency [<xref ref-type="bibr" rid="ref189">189</xref>,<xref ref-type="bibr" rid="ref192">192</xref>]. To support algorithm transparency, amplification systems can show visual activation of features that led to the recommendation [<xref ref-type="bibr" rid="ref9">9</xref>] or similar cases in the data that serve as evidence for the current recommendation [<xref ref-type="bibr" rid="ref193">193</xref>]. Summarizing human decisions can involve expressing data transformations as natural language rules [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref28">28</xref>] and visual node-link diagrams [<xref ref-type="bibr" rid="ref22">22</xref>]. Furthermore, as summarized data provide an abstract or aggregate view, there is a need for data transparency, meaning that experts should be able to trace individual data points, which contributed to the aggregate summary. This involves incorporating ideas from <italic>provenance systems</italic> such as Smoke [<xref ref-type="bibr" rid="ref182">182</xref>] and Scorpion [<xref ref-type="bibr" rid="ref183">183</xref>], which provide fast data lineage tracking. Finally, for each application, empirical studies are needed to see what and how information should be presented or summarized because too much transparency can overwhelm and negatively impact the expert [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        </sec>
      </sec>
      <sec>
        <title>Guidance</title>
        <p>Although summaries provide a global view of the data, the goals of exploratory analysis include finding insights and data quality issues [<xref ref-type="bibr" rid="ref191">191</xref>], which might require looking at a more detailed view. Systems can guide experts by navigating to informative subsets and by suggesting data transformations and edits.</p>
        <sec>
          <title>Data Subset</title>
          <p>Amplification systems should guide the expert’s navigation to meaningful subsets. For example, SeeDB [<xref ref-type="bibr" rid="ref116">116</xref>] automatically finds interesting visualizations. Given a query, it defines <italic>interestingness</italic> as the deviation of the query’s result set from a baseline data set. In a similar vein<bold>,</bold> TPFlow [<xref ref-type="bibr" rid="ref194">194</xref>] uses tensor decomposition to guide users to interesting regions in spatiotemporal exploration. For data cleaning, error detection algorithms such as Uguide [<xref ref-type="bibr" rid="ref78">78</xref>] and DataProf [<xref ref-type="bibr" rid="ref76">76</xref>] use <italic>functional dependencies</italic> and Armstrong samples, respectively, to find incorrect tuples for human validation, while Icarus [<xref ref-type="bibr" rid="ref28">28</xref>] presents the expert with impactful subsets for data completion. Visual summary tools such as Profiler [<xref ref-type="bibr" rid="ref184">184</xref>] use statistics to find data quality issues. When guiding users with visual summaries, it is important to select optimal visual encodings to reveal relevant insights or <italic>outliers</italic>. This can be informed from recent work by Correll et al [<xref ref-type="bibr" rid="ref185">185</xref>], which empirically evaluated different visual encodings on their effectiveness in revealing data quality issues.</p>
        </sec>
        <sec>
          <title>Edits</title>
          <p>In addition to navigating data sets, amplification systems can also guide experts by suggesting data transformations to edit the data during the cleaning and preparation stage [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref103">103</xref>]. However, even in this case, transparency is required. This is evidenced by the fact that in empirical studies of Proactive Wrangler [<xref ref-type="bibr" rid="ref101">101</xref>], users often ignored the suggested transformation but then manually performed the same one because the semantics of the operation were unclear. Methods to aid in data transformation transparency include showing previews and transitions of the data changes [<xref ref-type="bibr" rid="ref195">195</xref>] resulting from the transformation operation.</p>
        </sec>
      </sec>
      <sec>
        <title>Interaction</title>
        <p>Along with making system internals explainable [<xref ref-type="bibr" rid="ref10">10</xref>], allowing experts to interact and modify data and the output of algorithms increases their trust in amplification systems [<xref ref-type="bibr" rid="ref11">11</xref>]. For empiric antibiotic recommendation [<xref ref-type="bibr" rid="ref196">196</xref>], this can involve allowing the health care provider to edit model features. Providing interaction comes at the cost of maintaining strict latency constraints since experts expect to see the results of interaction almost immediately [<xref ref-type="bibr" rid="ref137">137</xref>]. Techniques for maintaining interactive performance include sampling [<xref ref-type="bibr" rid="ref197">197</xref>] and predictive prefetching [<xref ref-type="bibr" rid="ref198">198</xref>]. Interaction modes can include data transformation suggestions and what-if analysis.</p>
        <sec>
          <title>Data Transformation</title>
          <p>The mode of interaction for data transformation in expertise amplification systems also needs to cater to their background and training. For example, transformations should be presented as <italic>natural language</italic> statements [<xref ref-type="bibr" rid="ref4">4</xref>] as opposed to code snippets [<xref ref-type="bibr" rid="ref97">97</xref>,<xref ref-type="bibr" rid="ref154">154</xref>]. Although graphical user interfaces can decrease trust and control for system administrators [<xref ref-type="bibr" rid="ref199">199</xref>], they are needed in amplification systems. Gestural query systems, such as GestureDB [<xref ref-type="bibr" rid="ref62">62</xref>] and DBTouch [<xref ref-type="bibr" rid="ref200">200</xref>], and <italic>direct manipulation interfaces</italic> might be preferable to domain experts who are unfamiliar with SQL. Furthermore, domain experts’ affinity for spreadsheet tools [<xref ref-type="bibr" rid="ref104">104</xref>] motivates designing systems with spreadsheet interfaces but advanced querying capabilities such as Dataspread [<xref ref-type="bibr" rid="ref201">201</xref>] and Sieuferd [<xref ref-type="bibr" rid="ref202">202</xref>].</p>
        </sec>
        <sec>
          <title>What-if Analysis</title>
          <p>To support collaborative decision making, amplification systems should allow for what-if analysis, where domain experts can apply or test different <italic>decisions</italic> and <italic>assumptions</italic> and see how it affects the data set. Collaborative decision making is important for consensus and conflict resolution. Domain experts are highly trained and experienced individuals in their fields, which affects how they interact with systems [<xref ref-type="bibr" rid="ref203">203</xref>,<xref ref-type="bibr" rid="ref204">204</xref>]. Data pipeline tasks that require their input need them to apply knowledge from training and experience [<xref ref-type="bibr" rid="ref28">28</xref>]. Such tasks inherently require judgment, which can be biased and can vary between and within domain experts [<xref ref-type="bibr" rid="ref205">205</xref>]. To account for this bias, consensus from multiple experts is needed. However, unlike crowdworkers, where differences in results can indicate bad actors entering random choices [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref206">206</xref>,<xref ref-type="bibr" rid="ref207">207</xref>], in the case of domain experts, they reveal differing judgments. As such, automatic conflict resolution [<xref ref-type="bibr" rid="ref208">208</xref>], such as majority voting, cannot be used because disagreements require expert discussion [<xref ref-type="bibr" rid="ref22">22</xref>]. Collaboration is required for conflict resolution, and what-if analysis can speed up this process. Capturing and sharing metadata is also useful for collaboration [<xref ref-type="bibr" rid="ref209">209</xref>-<xref ref-type="bibr" rid="ref212">212</xref>].</p>
        </sec>
      </sec>
      <sec>
        <title>Acceleration</title>
        <p>Time constraints of domain experts necessitate the need to accelerate their input provision. This involves designing interfaces that aid the expert’s task and building interactions that interpolate from edits to generalize to multiple data points.</p>
        <sec>
          <title>Interface Design</title>
          <p>Most experts use structured interfaces such as forms [<xref ref-type="bibr" rid="ref213">213</xref>] or free-text notes [<xref ref-type="bibr" rid="ref214">214</xref>] for data entry or querying and spreadsheet interfaces for data exploration [<xref ref-type="bibr" rid="ref104">104</xref>]. Following <italic>user-centered interface</italic> design and adhering to latency constraints is even more essential for these systems. Query interface layouts can be optimized by using statistical properties of the data [<xref ref-type="bibr" rid="ref215">215</xref>-<xref ref-type="bibr" rid="ref217">217</xref>] and prior query logs [<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref218">218</xref>], while spreadsheet interfaces can be improved by incorporating higher expressibility [<xref ref-type="bibr" rid="ref201">201</xref>,<xref ref-type="bibr" rid="ref202">202</xref>]. The Usher [<xref ref-type="bibr" rid="ref216">216</xref>] system, an example of the former, uses a probabilistic model on prior input form data to optimize the form structure. This involves showing highly selective data attributes at the beginning of the form to reduce the complexity at later stages, thus reducing the scope of error and accelerating input provision.</p>
        </sec>
        <sec>
          <title>Generalize</title>
          <p>An advantage of building systems for domain experts is that domain-specific information can be used to accelerate their input. For example, Icarus [<xref ref-type="bibr" rid="ref28">28</xref>] uses the organism and antibiotic hierarchy encoded as foreign-key relations in the database to generalize a single edit to a rule that fills in multiple cells, accelerating the data completion process. In another example, the system by Cai et al [<xref ref-type="bibr" rid="ref29">29</xref>] allows domain experts to refine result sets with domain-specific concepts extracted from image embeddings.</p>
        </sec>
      </sec>
    </sec>
    <sec>
      <title>Case Study</title>
      <p>We illustrate our taxonomy with a case study from a representative clinical data project: modeling empiric antibiotic treatment (<xref rid="figure3" ref-type="fig">Figure 3</xref>). We apply the 4 dimensions of amplification to the 3 stages of the pipeline. This is summarized in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>Data pipeline for empiric antibiotic prediction. EHR: electronic health record.</p>
        </caption>
        <graphic xlink:href="medinform_v8i11e19612_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Applying 4 dimensions of amplification to the clinical data pipeline for empiric antibiotic prediction.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="0"/>
          <col width="30"/>
          <col width="440"/>
          <col width="0"/>
          <col width="500"/>
          <thead>
            <tr valign="top">
              <td colspan="4">Domain expert task</td>
              <td colspan="2">Amplification</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="6">
                <bold>Data curation</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Identify variables of interest, validate patients included in the cohort, and make domain-specific exclusionary rules</td>
              <td colspan="2">
                <list list-type="bullet">
                  <list-item>
                    <p><italic>Summarization</italic>: present distribution of variables of interest</p>
                  </list-item>
                  <list-item>
                    <p><italic>Guidance</italic>: suggesting additional variables based on the selected ones</p>
                  </list-item>
                  <list-item>
                    <p><italic>Interactions</italic>: allow expert to select and remove data points</p>
                  </list-item>
                  <list-item>
                    <p><italic>Acceleration</italic>: suggest criteria based on the domain expert’s inclusion and exclusion</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="6">
                <bold>Data cleaning</bold>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="2">
                <break/>
              </td>
              <td colspan="4">
                <bold>Augmentation</bold>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="2">
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td colspan="2">Fill in unreported microbiology susceptibilities with rules</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p><italic>Summarization</italic>: preview a rule by showing distribution of the cells that will be impacted</p>
                  </list-item>
                  <list-item>
                    <p><italic>Guidance</italic>: show high-impact data subsets for edits</p>
                  </list-item>
                  <list-item>
                    <p><italic>Interactions</italic>: direct edits on interface and indirect edits via rules</p>
                  </list-item>
                  <list-item>
                    <p><italic>Acceleration</italic>: suggest general rules based on the domain expert’s single edit</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="2">
                <break/>
              </td>
              <td colspan="4">
                <bold>Validation</bold>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="2">
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td colspan="2">Validate data augmentation by examining rule set and consolidating them to remove conflicts</td>
              <td>
                <list list-type="bullet">
                  <list-item>
                    <p><italic>Summarization</italic>: visual summary of rules and their relations</p>
                  </list-item>
                  <list-item>
                    <p><italic>Guidance</italic>: node size guides user to high-conflict areas</p>
                  </list-item>
                  <list-item>
                    <p><italic>Interactions</italic>: edit rule set by accepting and rejecting rules</p>
                  </list-item>
                  <list-item>
                    <p><italic>Acceleration</italic>: automatically remove redundant rules</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="6">
                <bold>Data analysis</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Understand the model and its predictions for individuals and different patient subpopulations</td>
              <td colspan="2">
                <list list-type="bullet">
                  <list-item>
                    <p><italic>Summarization</italic>: show probability of coverage with confidence interval</p>
                  </list-item>
                  <list-item>
                    <p><italic>Guidance</italic>: highlight covariates of concern</p>
                  </list-item>
                  <list-item>
                    <p><italic>Interactions</italic>: allow domain expert to select covariates to include</p>
                  </list-item>
                  <list-item>
                    <p><italic>Acceleration</italic>: show similar patients for who the model should be updated</p>
                  </list-item>
                </list>
              </td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>At the data curation level, our domain expert, Lucy, must provide the cohort definition along with variables of interest (eg, demographics, comorbidities, allergies, etc) to a data engineer, who pulls the relevant data from the EHR data warehouse. After the data pull, Lucy looks through the initial set and formulates additional exclusion rules to ensure that it matches the clinical case definition. To implement these rules, the data engineer annotates the data with microbiology classification information of the UMLS metathesaurus [<xref ref-type="bibr" rid="ref61">61</xref>]. This process could be improved with an expertise amplification system. The system should <italic>summarize</italic> data by showing the distribution of variables with linked brushing and filtering so that Lucy could see how the variable distributions are correlated. It could <italic>guide</italic> Lucy by suggesting correlated variables to the ones she selects. During validation of the cohort, Lucy should <italic>interactively</italic> be able to select data points to include. Finally, the system should be able to <italic>accelerate</italic> Lucy’s validation by suggesting exclusion rules based on her interactions.</p>
      <p>After the cohort is finalized, Lucy faces a data cleaning task. The microbiology laboratory provides data for only a subset of antibiotics based on domain characteristics and institutional preferences. When using these data for predictive modeling, the unreported values must be filled by domain experts. To address this, we built Icarus [<xref ref-type="bibr" rid="ref28">28</xref>] to amplify expertise in data augmentation. Icarus <italic>guides</italic> the domain expert by showing them high-impact data subsets for edits. It allows both direct <italic>interactions</italic> via edits and indirect <italic>interactions</italic> via rules. Finally, Icarus <italic>accelerates</italic> task completion by leveraging the UMLS classification to suggest general rules based on the domain expert’s single edit. It also allows the domain expert to preview the impact of a rule by <italic>summarizing</italic> the cells that will be impacted.</p>
      <p>Owing to the subjective nature of this task, multiple domain experts need to come to consensus on unreported values. To amplify the consensus process, we designed Delphi [<xref ref-type="bibr" rid="ref22">22</xref>], which visualizes the conflicts and redundancies in domain expert rules. It provides an overview of the data by visually <italic>summarizing</italic> the antibiotics and related rules in a node-link diagram. The node sizes <italic>guide</italic> the expert to regions of high conflict by encoding the number of data points affected. It allows domain experts to <italic>interactively</italic> edit the rule set by accepting and rejecting rules. Finally, it <italic>accelerates</italic> the domain experts’ task completion by automatically removing redundant rules after each edit.</p>
      <p>Once domain experts have come to a consensus, the data set is ready for analysis. Our data scientist uses penalized logistic regression to model resistance [<xref ref-type="bibr" rid="ref219">219</xref>]. During this stage, Lucy provides insights on the different variables and their relations. After model creation, Lucy can analyze and validate the results of the interactive analysis. For a given patient, the system should <italic>summarize</italic> its results by showing the probability of coverage along with confidence intervals. It should <italic>guide</italic> Lucy by drawing attention to any abnormal covariates whose value significantly deviates from others in the cohort. It should allow Lucy to <italic>interactively</italic> select covariates and rerun the model for a specific patient. It should <italic>accelerate</italic> the analysis by showing similar patients for whom the model should also be updated.</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>We have provided examples from the informatics literature to motivate the need for domain expert involvement in all steps of clinical data pipelines, from curation to analysis. Although this work is based on our experiences, we have done our best to do a targeted interdisciplinary review that can serve as a guide to clinical data projects. Our work is related to previous surveys in visual analytics in health care [<xref ref-type="bibr" rid="ref188">188</xref>] and interactive systems [<xref ref-type="bibr" rid="ref137">137</xref>]. Our survey is unique in that it provides a taxonomy on designing systems for amplifying expertise and focuses on the clinical data pipeline. Specifically, expertise amplification involves summarization, guidance, interactivity, and acceleration. Our case study illustrates how these can be applied to a clinical data pipeline.</p>
      <sec>
        <title>Conclusions</title>
        <p>Effectively engaging domain experts is crucial for the success of data-driven workflows. We provide a novel framework for developing systems that amplify domain expertise. Amplification systems should summarize data, guide domain experts’ data navigation, allow domain experts to interact and update algorithms, and finally accelerate their task by learning from their interactions. This framework draws on research from multiple computer science disciplines. As we move toward data-driven workflows, interdisciplinary methods are necessary for the greatest impact. Empowering stakeholders to interact with the data directly can lead to faster and more impactful insights and decision making, which is vital for democratizing data to benefit society.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">CDS</term>
          <def>
            <p>clinical decision support</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">HCI</term>
          <def>
            <p>human-computer interaction</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">NIH</term>
          <def>
            <p>National Institute of Health</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">UMLS</term>
          <def>
            <p>Unified Medical Language System</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The research reported in this paper was supported by the National Institute of Allergy and Infectious Diseases of National Institute of Health (NIH) under R01AI116975. The content is solely the responsibility of the authors and does not necessarily represent the official views of the NIH. The National Science Foundation also supports this work under awards IIS-1422977, IIS-1527779, and CAREER IIS-1453582.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Iandola</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moskewicz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ashraf</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dally</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Keutzer</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Squeezenet: alexnet-level accuracy with 50x fewer parameters and¡ 0.5 mb model size</article-title>
          <source>arXiv</source>
          <year>2016</year>
          <comment>epub ahead of print<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1602.07360"/></comment>
          <pub-id pub-id-type="doi">10.1109/CVPRW.2018.00215</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ribeiro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Why Should I Trust You: Explaining the Predictions of Any Classifier</article-title>
          <source>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
          <year>2016</year>
          <conf-name>KDD'16</conf-name>
          <conf-date>August 13-17, 2016</conf-date>
          <conf-loc>San Francisco, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2939672.2939778</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zarifis</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Papakonstantinou</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>ViDeTTe Interactive Notebooks</article-title>
          <source>Proceedings of the Workshop on Human-In-the-Loop Data Analytics</source>
          <year>2018</year>
          <conf-name>HILDA'18</conf-name>
          <conf-date>June 1-5, 2018</conf-date>
          <conf-loc>Houston, TX, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3209900.3209907</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kandel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Paepcke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hellerstein</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Wrangler: Interactive Visual Specification of Data Transformation Scripts</article-title>
          <source>Proceedings of the SIGCHI Conference on Human Factors in Computing Systems</source>
          <year>2011</year>
          <conf-name>CHI'11</conf-name>
          <conf-date>March 15-17, 2011</conf-date>
          <conf-loc>Vancouver BC Canada</conf-loc>
          <fpage>3363</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1145/1978942.1979444</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Orghian</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hidalgo</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>DIVE: A Mixed-Initiative System Supporting Integrated Data Exploration Workflows</article-title>
          <source>Proceedings of the Workshop on Human-In-the-Loop Data Analytics</source>
          <year>2018</year>
          <conf-name>HILDA'18</conf-name>
          <conf-date>June 1-5, 2018</conf-date>
          <conf-loc>Houston, TX, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3209900.3209910</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kraska</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Northstar: an interactive data science system</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>08</month>
          <day>1</day>
          <volume>11</volume>
          <issue>12</issue>
          <fpage>2150</fpage>
          <lpage>64</lpage>
          <pub-id pub-id-type="doi">10.14778/3229863.3240493</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wongsuphasawat</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Moritz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Anand</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mackinlay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Howe</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Voyager: exploratory analysis via faceted browsing of visualization recommendations</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2016</year>
          <month>1</month>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>649</fpage>
          <lpage>58</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2015.2467191</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Macke</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Parameswaran</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Helix: holistic optimization for accelerating iterative machine learning</article-title>
          <source>Pro. VLDB Endow</source>
          <year>2018</year>
          <month>12</month>
          <day>1</day>
          <volume>12</volume>
          <issue>4</issue>
          <fpage>446</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.14778/3297753.3297763</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Olah</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Satyanarayan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Carter</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schubert</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mordvintsev</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The building blocks of interpretability</article-title>
          <source>Distill</source>
          <year>2018</year>
          <month>03</month>
          <volume>3</volume>
          <issue>3</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://distill.pub/2018/building-blocks/"/>
          </comment>
          <pub-id pub-id-type="doi">10.23915/distill.00010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yeomans</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mullainathan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kleinberg</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Making sense of recommendations</article-title>
          <source>J Behav Dec Making</source>
          <year>2019</year>
          <month>02</month>
          <day>14</day>
          <volume>32</volume>
          <issue>4</issue>
          <fpage>403</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.1002/bdm.2118</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dietvorst</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Simmons</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Massey</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Overcoming algorithm aversion: people will use imperfect algorithms if they can (even slightly) modify them</article-title>
          <source>Manag Sci</source>
          <year>2018</year>
          <month>03</month>
          <volume>64</volume>
          <issue>3</issue>
          <fpage>1155</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.1287/mnsc.2016.2643</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Molino</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ebert</surname>
              <given-names>DS</given-names>
            </name>
          </person-group>
          <article-title>Manifold: a model-agnostic framework for interpretation and diagnosis of machine learning models</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2019</year>
          <month>01</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>364</fpage>
          <lpage>73</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2018.2864499</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Poursabzi-Sangdeh</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hofman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vaughan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wallach</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Manipulating and measuring model interpretability</article-title>
          <source>arXiv preprint</source>
          <year>2018</year>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vaughan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wallach</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Understanding the effect of accuracy on trust in machine learning models</article-title>
          <source>Proceedings of CHI Conference on Human Factors in Computing Systems</source>
          <year>2019</year>
          <conf-name>Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>May 4-9, 2019</conf-date>
          <conf-loc>Scottish Event Campus Ltd, Glasgow, United Kingdom</conf-loc>
          <fpage>1</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1145/3290605.3300509</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haas</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ansel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Marcus</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Argonaut: macrotask crowdsourcing for complex data processing</article-title>
          <source>Proc VLDB Endow</source>
          <year>2015</year>
          <month>08</month>
          <volume>8</volume>
          <issue>12</issue>
          <fpage>1642</fpage>
          <lpage>53</lpage>
          <pub-id pub-id-type="doi">10.14778/2824032.2824062</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Parameswaran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sarma</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia-Molina</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Polyzotis</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Widom</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Human-assisted graph search: it's okay to ask questions</article-title>
          <source>Proceedings of the VLDB Endowment</source>
          <year>2011</year>
          <month>02</month>
          <conf-name>International Conference on Very Large Databased</conf-name>
          <conf-date>2011</conf-date>
          <conf-loc>Seattle Washington</conf-loc>
          <fpage>267</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.14778/1952376.1952377</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Parameswaran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia-Molina</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Polyzotis</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ramesh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Widom</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Crowdscreen: Algorithms for filtering data with humans</article-title>
          <source>Proceedings of the ACM SIGMOD International Conference on Management of Data</source>
          <year>2012</year>
          <conf-name>ACM SIGMOD/PODS conference</conf-name>
          <conf-date>2012</conf-date>
          <conf-loc>Scottsdale, Arizona, USA</conf-loc>
          <fpage>361</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1145/2213836.2213878</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Par</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Parameswaran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia-Molina</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Polyzotis</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Widom</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>An overview of the deco system: data model and query language; query processing and optimization</article-title>
          <source>ACM SIGMOD Record</source>
          <year>2013</year>
          <month>01</month>
          <day>17</day>
          <volume>41</volume>
          <issue>4</issue>
          <fpage>22</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1145/2430456.2430462</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lasecki</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Rzeszotarski</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Marcus</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bigham</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The effects of sequence delay on crowd work</article-title>
          <source>Proceedings of the 33rd Annual ACM Conference on Human Factors in Computing Systems</source>
          <year>2015</year>
          <conf-name>CHI '15: CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>2015</conf-date>
          <conf-loc>Seoul Republic of Korea</conf-loc>
          <fpage>1375</fpage>
          <lpage>1378</lpage>
          <pub-id pub-id-type="doi">10.1145/2702123.2702594</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Retelny</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Robaszkiewicz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>To</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lasecki</surname>
              <given-names>WS</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rahmati</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Doshi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Valentine</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Expert Crowdsourcing With Flash Teams</article-title>
          <source>Proceedings of the 27th annual ACM symposium on User interface software and technology</source>
          <year>2014</year>
          <conf-name>UIST'14</conf-name>
          <conf-date>October 5-8, 2014</conf-date>
          <conf-loc>Honolulu, Hawaii, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2642918.2647409</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dror</surname>
              <given-names>IE</given-names>
            </name>
            <name name-style="western">
              <surname>Kukucka</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kassin</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Zapf</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>When expert decision making goes wrong: consensus, bias, the role of experts, and accuracy</article-title>
          <source>J Appl Res Memory Cogn</source>
          <year>2018</year>
          <month>03</month>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>162</fpage>
          <lpage>3</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jarmac.2018.01.007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hebert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pancholi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lustberg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stevenson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Exploratory Visualizations of Rules for Validation of Expert Decisions</article-title>
          <source>DSIA Workshop, IEEE VIS</source>
          <year>2018</year>
          <conf-name>Workshop on Data Systems for Interactive Analysis (DSIA)</conf-name>
          <conf-date>October 2018</conf-date>
          <conf-loc>Berlin, Germany</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchgate.net/publication/331177971_Exploratory_Visualizations_of_Rules_for_Validation_of_Expert_Decisions"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Robbins</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Physicians generate an average 2.4 million a year per hospital</article-title>
          <source>Southwest J Pulm Crit Care</source>
          <year>2019</year>
          <volume>18</volume>
          <fpage>61</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.swjpcc.com/news/2019/3/4/physicians-generate-an-average-24-million-a-year-per-hospita.html"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dzau</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kirch</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Nasca</surname>
              <given-names>TJ</given-names>
            </name>
          </person-group>
          <article-title>To care is human — collectively confronting the clinician-burnout crisis</article-title>
          <source>N Engl J Med</source>
          <year>2018</year>
          <month>01</month>
          <day>25</day>
          <volume>378</volume>
          <issue>4</issue>
          <fpage>312</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.1056/nejmp1715127</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saitwal</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Walji</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Assessing performance of an electronic health record (EHR) using cognitive task analysis</article-title>
          <source>Int J Med Inform</source>
          <year>2010</year>
          <month>07</month>
          <volume>79</volume>
          <issue>7</issue>
          <fpage>501</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2010.04.001</pub-id>
          <pub-id pub-id-type="medline">20452274</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(10)00074-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Agency plus automation: designing artificial intelligence into interactive systems</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2019</year>
          <month>02</month>
          <day>5</day>
          <volume>116</volume>
          <issue>6</issue>
          <fpage>1844</fpage>
          <lpage>50</lpage>
          <pub-id pub-id-type="doi">10.1073/pnas.1807184115</pub-id>
          <pub-id pub-id-type="medline">30718389</pub-id>
          <pub-id pub-id-type="pii">1807184115</pub-id>
          <pub-id pub-id-type="pmcid">PMC6369770</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krishnan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Haas</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Franklin</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Towards reliable interactive data cleaning: a user survey and recommendations</article-title>
          <source>Proceedings of the Workshop on Human-In-the-Loop Data Analytics</source>
          <year>2016</year>
          <conf-name>SIGMOD/PODS'16: International Conference on Management of Data</conf-name>
          <conf-date>June, 2016</conf-date>
          <conf-loc>San Francisco California</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2939502.2939511</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hebert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>ICARUS: minimizing human effort in iterative data completion</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>09</month>
          <day>01</day>
          <volume>11</volume>
          <issue>13</issue>
          <fpage>2263</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.14778/3275366.3275374</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Reif</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hegde</surname>
              <given-names>N</given-names>
            </name>
            <collab>et al</collab>
          </person-group>
          <article-title>Human-Centered Tools for Coping with Imperfect Algorithms During Medical Decision-Making</article-title>
          <source>Proceedings of the 2019 CHI Conference on Human Factors in Computing Systems</source>
          <year>2019</year>
          <conf-name>CHI'19</conf-name>
          <conf-date>May 4-9, 2019</conf-date>
          <conf-loc>Glasgow, Scotland, UK</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3290605.3300234</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Clayton</surname>
              <given-names>PD</given-names>
            </name>
            <name name-style="western">
              <surname>Naus</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Bowes</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Madsen</surname>
              <given-names>TS</given-names>
            </name>
            <name name-style="western">
              <surname>Wilcox</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Orsmond</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rocha</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Thornton</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jacobsen</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Udall</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Rhodes</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Cannon</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huff</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Leckman</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Physician use of electronic medical records: issues and successes with direct data entry and physician productivity</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2005</year>
          <fpage>141</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16779018"/>
          </comment>
          <pub-id pub-id-type="medline">16779018</pub-id>
          <pub-id pub-id-type="pii">58944</pub-id>
          <pub-id pub-id-type="pmcid">PMC1560588</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ganapathi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Data Quality: Experiences and Lessons From Operationalizing Big Data</article-title>
          <source>IEEE International Conference on Big Data</source>
          <year>2016</year>
          <conf-name>Big Data'16</conf-name>
          <conf-date>December 5-8, 2016</conf-date>
          <conf-loc>Washington, DC, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/bigdata.2016.7840769</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Gesner</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Mar</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Colburn</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Rocha</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Prioritization and refinement of clinical data elements within EHR systems</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>421</fpage>
          <lpage>30</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28269837"/>
          </comment>
          <pub-id pub-id-type="medline">28269837</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333277</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blaisure</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Ceusters</surname>
              <given-names>WM</given-names>
            </name>
          </person-group>
          <article-title>Improving the 'Fitness for Purpose' of common data models through realism based ontology</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>440</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854108"/>
          </comment>
          <pub-id pub-id-type="medline">29854108</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977618</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cimino</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Identifying the clinical laboratory tests from unspecified "Other Lab Test" data for secondary use</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2015</year>
          <volume>2015</volume>
          <fpage>1018</fpage>
          <lpage>23</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26958239"/>
          </comment>
          <pub-id pub-id-type="medline">26958239</pub-id>
          <pub-id pub-id-type="pmcid">PMC4765675</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lhatoo</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>GQ</given-names>
            </name>
          </person-group>
          <article-title>ODaCCI: ontology-guided data curation for multisite clinical research data integration in the NINDS center for SUDEP research</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>441</fpage>
          <lpage>450</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28269839"/>
          </comment>
          <pub-id pub-id-type="medline">28269839</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333343</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Connolly</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>DeFranco</surname>
              <given-names>EA</given-names>
            </name>
          </person-group>
          <article-title>Integrating public data sets for analysis of maternal airborne environmental exposures and stillbirth</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>599</fpage>
          <lpage>605</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954365"/>
          </comment>
          <pub-id pub-id-type="medline">25954365</pub-id>
          <pub-id pub-id-type="pmcid">PMC4419928</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gouripeddi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Facelli</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Bradshaw</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Schultz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>LaSalle</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Warner</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Butcher</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Madsen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mo</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>FURTHeR: an infrastructure for clinical, translational and comparative effectiveness research</article-title>
          <source>AMIA</source>
          <year>2013</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://knowledge.amia.org/amia-55142-a2013e-1.580047/t-10-1.581994/f-010-1.581995/a-184-1.582011/ap-247-1.582014?qr=1">https://knowledge.amia.org/amia-55142-a2013e-1.580047/t-10-1.581994/f-010-1.581995/a-184-1.582011/ap-247-1.582014?qr=1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Integrative spatial data analytics for public health studies of New York state</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>391</fpage>
          <lpage>400</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28269834"/>
          </comment>
          <pub-id pub-id-type="medline">28269834</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333201</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ying</surname>
              <given-names>Li</given-names>
            </name>
          </person-group>
          <article-title>Combining Heterogeneous Databases to Detect Adverse Drug Reactions</article-title>
          <source>Columbia University</source>
          <year>2015</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academiccommons.columbia.edu/doi/10.7916/D8Z60ND1">https://academiccommons.columbia.edu/doi/10.7916/D8Z60ND1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Clarkson</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Whipple</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Variation in the representation of human anatomy within digital resources: implications for data integration</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>330</fpage>
          <lpage>339</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30815072"/>
          </comment>
          <pub-id pub-id-type="medline">30815072</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371295</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berrios</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Beheshti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Costes</surname>
              <given-names>SV</given-names>
            </name>
          </person-group>
          <article-title>Fairness and usability for open-access omics data systems</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>232</fpage>
          <lpage>241</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30815061"/>
          </comment>
          <pub-id pub-id-type="medline">30815061</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371294</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farach</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>McGettrick</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tirrell</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mesa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rozenblit</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>RexMart: An Open Source Tool for Exploring and Sharing Research Data without Compromising Data Integrity</article-title>
          <source>AMIA</source>
          <year>2014</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://figshare.com/articles/RexMart_An_Open_Source_Tool_for_Exploring_and_Sharing_Research_Data_without_Compromising_Data_Integrity/1262228/1">https://figshare.com/articles/RexMart_An_Open_Source_Tool_for_Exploring_and_Sharing_Research_Data_without_Compromising_Data_Integrity/1262228/1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maldonado</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Marcos</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fernández-Breis</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Parcero</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Boscá</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Legaz-García</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez-Salvador</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Robles</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A platform for exploration into chaining of web services for clinical data transformation and reasoning</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>854</fpage>
          <lpage>63</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28269882"/>
          </comment>
          <pub-id pub-id-type="medline">28269882</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Domain adaptation for semantic role labeling of clinical text</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2015</year>
          <month>09</month>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>967</fpage>
          <lpage>79</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26063745"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocu048</pub-id>
          <pub-id pub-id-type="medline">26063745</pub-id>
          <pub-id pub-id-type="pii">ocu048</pub-id>
          <pub-id pub-id-type="pmcid">PMC4986662</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>GQ</given-names>
            </name>
          </person-group>
          <article-title>A semantic-based approach for exploring consumer health questions using UMLS</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>432</fpage>
          <lpage>41</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954347"/>
          </comment>
          <pub-id pub-id-type="medline">25954347</pub-id>
          <pub-id pub-id-type="pmcid">PMC4419919</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>XL</given-names>
            </name>
            <name name-style="western">
              <surname>Rekatsinas</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Data Integration and Machine Learning: A Natural Synergy</article-title>
          <source>Proceedings of the 2018 International Conference on Management of Data</source>
          <year>2018</year>
          <conf-name>SIGMOD'18</conf-name>
          <conf-date>June 1-5, 2018</conf-date>
          <conf-loc>Houston, Texas</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3183713.3197387</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stonebraker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ilyas</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Data integration: the current status and the way forward</article-title>
          <source>IEEE Data Eng Bull</source>
          <year>2018</year>
          <volume>41</volume>
          <fpage>3</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://uwaterloo.ca/data-systems-group/publications/data-integration-current-status-and-way-forward"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fernandez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Madden</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Termite: a system for tunneling through heterogeneous data</article-title>
          <source>ArXiv</source>
          <year>2019</year>
          <comment>epub ahead of print</comment>
          <pub-id pub-id-type="doi">10.1145/3329859.3329877</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thirumuruganathan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ouzzani</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Data curation with deep learning vision: towards self-driving data curation</article-title>
          <source>arXiv</source>
          <year>2018</year>
          <fpage>1384</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.semanticscholar.org/paper/Data-Curation-with-Deep-Learning-%5BVision%5D%3A-Towards-Thirumuruganathan-Tang/da182e52b0c8a95d97bf3088561db466e86247f5"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Leaman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>TaggerOne: joint named entity recognition and normalization with semi-Markov models</article-title>
          <source>Bioinformatics</source>
          <year>2016</year>
          <month>09</month>
          <day>15</day>
          <volume>32</volume>
          <issue>18</issue>
          <fpage>2839</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27283952"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btw343</pub-id>
          <pub-id pub-id-type="medline">27283952</pub-id>
          <pub-id pub-id-type="pii">btw343</pub-id>
          <pub-id pub-id-type="pmcid">PMC5018376</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doğan</surname>
              <given-names>RI</given-names>
            </name>
            <name name-style="western">
              <surname>Leaman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>NCBI disease corpus: a resource for disease name recognition and concept normalization</article-title>
          <source>J Biomed Inform</source>
          <year>2014</year>
          <month>02</month>
          <volume>47</volume>
          <fpage>1</fpage>
          <lpage>10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(13)00197-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2013.12.006</pub-id>
          <pub-id pub-id-type="medline">24393765</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(13)00197-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC3951655</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>GNormPlus: an integrative approach for tagging genes, gene families, and protein domains</article-title>
          <source>Biomed Res Int</source>
          <year>2015</year>
          <volume>2015</volume>
          <fpage>918710</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1155/2015/918710"/>
          </comment>
          <pub-id pub-id-type="doi">10.1155/2015/918710</pub-id>
          <pub-id pub-id-type="medline">26380306</pub-id>
          <pub-id pub-id-type="pmcid">PMC4561873</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krallinger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rabal</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Leitner</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Vazquez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Salgado</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Leaman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lowe</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Sayle</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Batista-Navarro</surname>
              <given-names>RT</given-names>
            </name>
            <name name-style="western">
              <surname>Rak</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Huber</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Rocktäschel</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Matos</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Campos</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Munkhdalai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Ramanan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nathan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Žitnik</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bajec</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weber</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Irmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Akhondi</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Kors</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Sikdar</surname>
              <given-names>UK</given-names>
            </name>
            <name name-style="western">
              <surname>Ekbal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yoshioka</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dieb</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Verspoor</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Khabsa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Giles</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ravikumar</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Lamurias</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Couto</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>RT</given-names>
            </name>
            <name name-style="western">
              <surname>Ata</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Can</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Usié</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alves</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Segura-Bedmar</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Oyarzabal</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Valencia</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The CHEMDNER corpus of chemicals and drugs and its annotation principles</article-title>
          <source>J Cheminform</source>
          <year>2015</year>
          <month>01</month>
          <day>19</day>
          <volume>7</volume>
          <issue>S1</issue>
          <pub-id pub-id-type="doi">10.1186/1758-2946-7-s1-s2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Kao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>tmVar: a text mining approach for extracting sequence variants in biomedical literature</article-title>
          <source>Bioinformatics</source>
          <year>2013</year>
          <month>06</month>
          <day>1</day>
          <volume>29</volume>
          <issue>11</issue>
          <fpage>1433</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23564842"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btt156</pub-id>
          <pub-id pub-id-type="medline">23564842</pub-id>
          <pub-id pub-id-type="pii">btt156</pub-id>
          <pub-id pub-id-type="pmcid">PMC3661051</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hielscher</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Niemann</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Preim</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Völzke</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ittermann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Spiliopoulou</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A framework for expert-driven subpopulation discovery and evaluation using subspace clustering for epidemiological data</article-title>
          <source>Expert Syst Appl</source>
          <year>2018</year>
          <month>12</month>
          <volume>113</volume>
          <fpage>147</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1016/j.eswa.2018.07.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gotz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Perer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Iterative cohort analysis and exploration</article-title>
          <source>Inf Vis</source>
          <year>2014</year>
          <month>03</month>
          <day>19</day>
          <volume>14</volume>
          <issue>4</issue>
          <fpage>289</fpage>
          <lpage>307</lpage>
          <pub-id pub-id-type="doi">10.1177/1473871614526077</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Malik</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Monroe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Onukwugha</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Plaisant</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shneiderman</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>An evaluation of visual analytics approaches to comparing cohorts of event sequences</article-title>
          <year>2014</year>
          <conf-name>InEHRVis Workshop on Visualizing Electronic Health Record Data at VIS  (Vol. 14)</conf-name>
          <conf-date>2014 Nov 9</conf-date>
          <conf-loc>-</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nargesian</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Pu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bashardoost</surname>
              <given-names>BG</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Optimizing organizations for navigating data lakes</article-title>
          <source>arXiv</source>
          <year>2018</year>
          <fpage>7024</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.semanticscholar.org/paper/Optimizing-Organizations-for-Navigating-Data-Lakes-Nargesian-Pu/2d480586a0d065eec2b8510a841ff824a2bdef72"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nargesian</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Pu</surname>
              <given-names>KQ</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>Table union search on open data</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>03</month>
          <volume>11</volume>
          <issue>7</issue>
          <fpage>813</fpage>
          <lpage>25</lpage>
          <pub-id pub-id-type="doi">10.14778/3192965.3192973</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lehman</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-III, a freely accessible critical care database</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <month>05</month>
          <day>24</day>
          <volume>3</volume>
          <fpage>160035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27219127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id>
          <pub-id pub-id-type="medline">27219127</pub-id>
          <pub-id pub-id-type="pii">sdata201635</pub-id>
          <pub-id pub-id-type="pmcid">PMC4878278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bodenreider</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>The unified medical language system (UMLS): integrating biomedical terminology</article-title>
          <source>Nucleic Acids Res</source>
          <year>2004</year>
          <month>01</month>
          <day>1</day>
          <volume>32</volume>
          <issue>Database issue</issue>
          <fpage>D267</fpage>
          <lpage>70</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14681409"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkh061</pub-id>
          <pub-id pub-id-type="medline">14681409</pub-id>
          <pub-id pub-id-type="pii">32/suppl_1/D267</pub-id>
          <pub-id pub-id-type="pmcid">PMC308795</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mandel</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Gestural query specification</article-title>
          <source>Proc VLDB Endow</source>
          <year>2013</year>
          <month>12</month>
          <volume>7</volume>
          <issue>4</issue>
          <fpage>289</fpage>
          <lpage>300</lpage>
          <pub-id pub-id-type="doi">10.14778/2732240.2732247</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Raj</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Sellam</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Precision Interfaces for Different Modalities</article-title>
          <source>Proceedings of the 2018 International Conference on Management of Data</source>
          <year>2018</year>
          <conf-name>SIGMOD'18</conf-name>
          <conf-date>June 1-5, 2018</conf-date>
          <conf-loc>Houston, Texas</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3183713.3193570</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Mining precision interfaces from query logs</article-title>
          <source>ArXiv</source>
          <year>2019</year>
          <comment>epub ahead of print</comment>
          <pub-id pub-id-type="doi">10.1145/3299869.3319872</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Brue</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Leveraging terminology services for extract-transform-load processes: a user-centered approach</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>1010</fpage>
          <lpage>1019</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28269898"/>
          </comment>
          <pub-id pub-id-type="medline">28269898</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333225</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shickel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tighe</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bihorac</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rashidi</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Deep EHR: a survey of recent advances in deep learning techniques for electronic health record (EHR) analysis</article-title>
          <source>IEEE J Biomed Health Inform</source>
          <year>2018</year>
          <month>09</month>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>1589</fpage>
          <lpage>604</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2017.2767063</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Che</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Purushotham</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khemani</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Interpretable deep models for ICU outcome prediction</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>371</fpage>
          <lpage>380</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28269832"/>
          </comment>
          <pub-id pub-id-type="medline">28269832</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333206</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adibuzzaman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>DeLaurentis</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Benneyworth</surname>
              <given-names>BD</given-names>
            </name>
          </person-group>
          <article-title>Big data in healthcare - the promises, challenges and opportunities from a research perspective: a case study with a model database</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>384</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854102"/>
          </comment>
          <pub-id pub-id-type="medline">29854102</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977694</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dallachiesa</surname>
              <given-names>A</given-names>
            </name>
            <collab>Ebaid, A</collab>
            <collab>Eldawy, A</collab>
            <collab>Elmagarmid, A</collab>
            <collab>Ilyas, I</collab>
            <collab>Ouzzani M</collab>
            <collab>Tang N</collab>
          </person-group>
          <article-title>NADEEF: a commodity data cleaning system</article-title>
          <source>Proceedings of the 2013 ACM SIGMOD International Conference on Management of Data</source>
          <year>2013</year>
          <conf-name>SIGMOD '13</conf-name>
          <conf-date>2013</conf-date>
          <conf-loc>New York</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2463676.2465327</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mayfield</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Neville</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Prabhakar</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>Eracer: a database approach for statistical inference and data cleaning</source>
          <year>2010</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://orion.cs.purdue.edu/docs/eracer.pdf">https://orion.cs.purdue.edu/docs/eracer.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meduri</surname>
              <given-names>VV</given-names>
            </name>
            <name name-style="western">
              <surname>Papotti</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Towards user-aware rule discovery</article-title>
          <source>Information Search, Integration, and Personalization</source>
          <year>2017</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>3</fpage>
          <lpage>17</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Dependable data repairing with fixing rules</article-title>
          <source>J Data and Information Quality</source>
          <year>2017</year>
          <month>07</month>
          <day>17</day>
          <volume>8</volume>
          <issue>3-4</issue>
          <fpage>1</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="doi">10.1145/3041761</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Franklin</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kraska</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Milo</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>A sample-and-clean framework for fast and accurate query processing on dirty data</article-title>
          <source>Proceedings of the 2014 ACM SIGMOD International Conference on Management of Data</source>
          <year>2014</year>
          <conf-name>SIGMOD'14</conf-name>
          <conf-date>June 2014</conf-date>
          <conf-loc>Snowbird Utah USA</conf-loc>
          <fpage>469</fpage>
          <lpage>80</lpage>
          <pub-id pub-id-type="doi">10.1145/2588555.2610505</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krishnan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Franklin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Activeclean: interactive data cleaning while learning convex loss models</article-title>
          <source>arXiv</source>
          <year>2016</year>
          <fpage>2117</fpage>
          <lpage>20</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/2882903.2899409"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2882903.2899409</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kalashnikov</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Mehrotra</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Query aware determinization of uncertain objects</article-title>
          <source>IEEE Trans Knowl Data Eng</source>
          <year>2015</year>
          <month>01</month>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>207</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1109/tkde.2013.170</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wie</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Link</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>DataProf: Semantic Profiling for Iterative Data Cleansing and Business Rule Acquisition</article-title>
          <source>Proceedings of the 2018 International Conference on Management of Data</source>
          <year>2018</year>
          <conf-name>SIGMOD'18</conf-name>
          <conf-date>June 1-5, 2018</conf-date>
          <conf-loc>Houston, Texas</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3183713.3193544</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yakout</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elmagarmid</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Neville</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ouzzani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ilyas</surname>
              <given-names>IF</given-names>
            </name>
          </person-group>
          <article-title>Guided data repair</article-title>
          <source>Proc VLDB Endow</source>
          <year>2011</year>
          <month>02</month>
          <volume>4</volume>
          <issue>5</issue>
          <fpage>279</fpage>
          <lpage>89</lpage>
          <pub-id pub-id-type="doi">10.14778/1952376.1952378</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thirumuruganathan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Berti-Equille</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ouzzani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Quiane-Ruiz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>UGuide: user-guided discovery of FD-detectable errors</article-title>
          <source>Proceedings of the 2017 ACM International Conference on Management of Data</source>
          <year>2017</year>
          <conf-name>SIGMOD'17</conf-name>
          <conf-date>May 14-19, 2017</conf-date>
          <conf-loc>Chicago, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3035918.3064024</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Widom</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Crowdfill: collecting structured data from the crowd</article-title>
          <source>ACM SIGMOD</source>
          <year>2014</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://ilpubs.stanford.edu:8090/1079/1/crowdfill.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2588555.2610503</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Auto-Detect: Data-Driven Error Detection in Tables</article-title>
          <source>Proceedings of the 2018 International Conference on Management of Data</source>
          <year>2018</year>
          <conf-name>SIGMOD'18</conf-name>
          <conf-date>June 1-5, 2018</conf-date>
          <conf-loc>Houston, Texas</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3183713.3196889</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Morcos</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ilyas</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ouzzani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Papotti</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Katara: A data cleaning system powered by knowledge bases and crowdsourcing</article-title>
          <source>ACM SIGMOD</source>
          <year>2015</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/2723372.2749431"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2723372.2749431</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Cleaning Relations Using Knowledge Bases</article-title>
          <source>IEEE 33rd International Conference on Data Engineering</source>
          <year>2017</year>
          <conf-name>ICDE'17</conf-name>
          <conf-date>April 19-22, 2017</conf-date>
          <conf-loc>San Diego, CA, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icde.2017.141</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Biessmann</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Salinas</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Schelter</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lange</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>'Deep' Learning for Missing Value Imputationin Tables with Non-Numerical Data</article-title>
          <source>Proceedings of the 27th ACM International Conference on Information and Knowledge Management</source>
          <year>2018</year>
          <conf-name>CIKM'18</conf-name>
          <conf-date>October 22-26, 2018</conf-date>
          <conf-loc>Turin, Italy</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3269206.3272005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rekatsinas</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ilyas</surname>
              <given-names>IF</given-names>
            </name>
            <name name-style="western">
              <surname>Ré</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>HoloClean: holistic data repairs with probabilistic inference</article-title>
          <source>Proc VLDB Endow</source>
          <year>2017</year>
          <month>08</month>
          <day>1</day>
          <volume>10</volume>
          <issue>11</issue>
          <fpage>1190</fpage>
          <lpage>201</lpage>
          <pub-id pub-id-type="doi">10.14778/3137628.3137631</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ilyas</surname>
              <given-names>IF</given-names>
            </name>
            <name name-style="western">
              <surname>Papotti</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Holistic Data Cleaning: Putting Violations Into Context</article-title>
          <source>29th International Conference on Data Engineering</source>
          <year>2013</year>
          <conf-name>ICDE'13</conf-name>
          <conf-date>April 8-12, 2013</conf-date>
          <conf-loc>Brisbane, QLD, Australia</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icde.2013.6544847</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schreibstein</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Newton-Dame</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>McVeigh</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Perlman</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Singer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Missing data in an electronic health record-based population health surveillance system</article-title>
          <source>AMIA</source>
          <year>2014</year>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Divita</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>QT</given-names>
            </name>
            <name name-style="western">
              <surname>Gundlapalli</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Duvall</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nebeker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Samore</surname>
              <given-names>MH</given-names>
            </name>
          </person-group>
          <article-title>Sophia: a expedient UMLS concept extraction annotator</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2014</year>
          <fpage>467</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="medline">25954351</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rumeng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jagannatha Abhyuday</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A hybrid neural network model for joint prediction of presence and period assertions of medical events in clinical notes</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <fpage>1149</fpage>
          <lpage>58</lpage>
          <pub-id pub-id-type="medline">29854183</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref89">
        <label>89</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Browne</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Kayaalp</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dodd</surname>
              <given-names>ZA</given-names>
            </name>
            <name name-style="western">
              <surname>Sagan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>McDonald</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <article-title>The challenges of creating a gold standard for de-identification research</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>353</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954338"/>
          </comment>
          <pub-id pub-id-type="medline">25954338</pub-id>
          <pub-id pub-id-type="pmcid">PMC4420002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref90">
        <label>90</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bowles</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Ratcliffe</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Naylor</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Keim</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Flores</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>Nurse generated EHR data supports post-acute care referral decision making: development and validation of a two-step algorithm</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>465</fpage>
          <lpage>74</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854111"/>
          </comment>
          <pub-id pub-id-type="medline">29854111</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977719</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref91">
        <label>91</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shivade</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hebert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Regan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fosler-Lussier</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Automatic data source identification for clinical trial eligibility criteria resolution</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>1149</fpage>
          <lpage>1158</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28269912"/>
          </comment>
          <pub-id pub-id-type="medline">28269912</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref92">
        <label>92</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Norman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Leeflang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Névéol</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Data extraction and synthesis in systematic reviews of diagnostic test accuracy: a corpus for automating and evaluating the process</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>817</fpage>
          <lpage>26</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30815124"/>
          </comment>
          <pub-id pub-id-type="medline">30815124</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371350</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref93">
        <label>93</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chandar</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Yaman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hoxha</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Similarity-based recommendation of new concepts to a terminology</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2015</year>
          <volume>2015</volume>
          <fpage>386</fpage>
          <lpage>95</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26958170"/>
          </comment>
          <pub-id pub-id-type="medline">26958170</pub-id>
          <pub-id pub-id-type="pmcid">PMC4765685</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref94">
        <label>94</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kavuluru</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rios</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Automatic assignment of non-leaf MeSH terms to biomedical articles</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2015</year>
          <volume>2015</volume>
          <fpage>697</fpage>
          <lpage>706</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26958205"/>
          </comment>
          <pub-id pub-id-type="medline">26958205</pub-id>
          <pub-id pub-id-type="pmcid">PMC4765689</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref95">
        <label>95</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Feller</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zucker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Don't Walk</surname>
              <given-names>OB</given-names>
            </name>
            <name name-style="western">
              <surname>Srikishan</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Gordon</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Towards the inference of social and behavioral determinants of sexual health: development of a gold-standard corpus with semi-supervised learning</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>422</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30815082"/>
          </comment>
          <pub-id pub-id-type="medline">30815082</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371339</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref96">
        <label>96</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Afshar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Joyce</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Oakey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Formanek</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Churpek</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Zelisko</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Price</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dligach</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A computable phenotype for acute respiratory distress syndrome using natural language processing and machine learning</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>157</fpage>
          <lpage>65</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30815053"/>
          </comment>
          <pub-id pub-id-type="medline">30815053</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371271</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref97">
        <label>97</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ratner</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bach</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Ehrenberg</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Ré</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Snorkel: Fast Training Set Generation for Information Extraction</article-title>
          <source>Proceedings of the 2017 ACM International Conference on Management of Data</source>
          <year>2017</year>
          <conf-name>SIGMOD'17</conf-name>
          <conf-date>May 14-19, 2017</conf-date>
          <conf-loc>Chicago, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3035918.3056442</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref98">
        <label>98</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Horng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sontag</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Using anchors to estimate clinical state without labeled data</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>606</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954366"/>
          </comment>
          <pub-id pub-id-type="medline">25954366</pub-id>
          <pub-id pub-id-type="pmcid">PMC4419996</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref99">
        <label>99</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Raman</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Hellerstein</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Potter's Wheel: an Interactive Framework for Data Cleaning</article-title>
          <source>Univesity of Berkeley</source>
          <access-date>2020-09-28</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www/ cs. berkeley. edu/? rshankar/papers/pwheel. pdf, 2000">http://www/ cs. berkeley. edu/? rshankar/papers/pwheel. pdf, 2000</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref100">
        <label>100</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stolte</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hanrahan</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Polaris: a system for query, analysis, and visualization of multidimensional relational databases</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2002</year>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>52</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1109/2945.981851</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref101">
        <label>101</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kandel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hellerstein</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Proactive Wrangling: Mixed-initiative End-user Programming of Data Transformation Scripts</article-title>
          <source>Proceedings of the 24th Annual ACM Symposium on User Interface Software and Technology</source>
          <year>2011</year>
          <conf-name>UIST'11</conf-name>
          <conf-date>March 17, 2011</conf-date>
          <conf-loc>New York, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2047196.2047205</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref102">
        <label>102</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gulwani</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Learning semantic string transformations from examples</article-title>
          <source>Proc VLDB Endow</source>
          <year>2012</year>
          <month>04</month>
          <volume>5</volume>
          <issue>8</issue>
          <fpage>740</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="doi">10.14778/2212351.2212356</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref103">
        <label>103</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Cafarella</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jagadish</surname>
              <given-names>HV</given-names>
            </name>
          </person-group>
          <article-title>Foofah: transforming data by example</article-title>
          <source>Proceedings of the 2017 ACM International Conference on Management of Data</source>
          <year>2017</year>
          <conf-name>SIGMOD'17</conf-name>
          <conf-date>May 14-19, 2017</conf-date>
          <conf-loc>Chicago, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3035918.3064034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref104">
        <label>104</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Costabile</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Fogli</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Letondal</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mussio</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Piccinno</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Domain-expert users and their needs of software development</article-title>
          <source>HCI 2003 End-User Development Session</source>
          <year>2003</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://giove.cnuce.cnr.it/projects/EUD-NET/pdf/Costabile-et-alCameraReady.pdf">http://giove.cnuce.cnr.it/projects/EUD-NET/pdf/Costabile-et-alCameraReady.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref105">
        <label>105</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hanauer</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Hruby</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Fort</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Rasmussen</surname>
              <given-names>LV</given-names>
            </name>
            <name name-style="western">
              <surname>Mendonça</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>What is asked in clinical data request forms? A multi-site thematic analysis of forms towards better data access support</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>616</fpage>
          <lpage>25</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954367"/>
          </comment>
          <pub-id pub-id-type="medline">25954367</pub-id>
          <pub-id pub-id-type="pmcid">PMC4419980</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref106">
        <label>106</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hruby</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Hoxha</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ravichandran</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Mendonça</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Hanauer</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A data-driven concept schema for defining clinical research data needs</article-title>
          <source>Int J Med Inform</source>
          <year>2016</year>
          <month>07</month>
          <volume>91</volume>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27185504"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2016.03.008</pub-id>
          <pub-id pub-id-type="medline">27185504</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(16)30049-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC4873775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref107">
        <label>107</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Edinger</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Bedrick</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hersh</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of clinical text segmentation to facilitate cohort retrieval</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>660</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854131"/>
          </comment>
          <pub-id pub-id-type="medline">29854131</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977655</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref108">
        <label>108</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Moeller</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Arsoniadis</surname>
              <given-names>EG</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kwaan</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>GJ</given-names>
            </name>
          </person-group>
          <article-title>Accelerating chart review using automated methods on electronic health record data for postoperative complications</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>1822</fpage>
          <lpage>1831</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28269941"/>
          </comment>
          <pub-id pub-id-type="medline">28269941</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333220</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref109">
        <label>109</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Major</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Tanna</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aphinyanaphongs</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Reusable filtering functions for application in ICU data: a case study</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>844</fpage>
          <lpage>853</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28269881"/>
          </comment>
          <pub-id pub-id-type="medline">28269881</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333239</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref110">
        <label>110</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Controlling False Discoveries During Interactive Data Exploration</article-title>
          <source>Proceedings of the 2017 ACM International Conference on Management of Data</source>
          <year>2017</year>
          <conf-name>SIGMOD'17</conf-name>
          <conf-date>May 14-17, 2017</conf-date>
          <conf-loc>Chicago, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3035918.3064019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref111">
        <label>111</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Romero-Brufau</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kostandy</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Maass</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Wutthisirisart</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sir</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bartholmai</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Stuve</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pasupathy</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Development of data integration and visualization tools for the Department of Radiology to display operational and strategic metrics</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>942</fpage>
          <lpage>951</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30815137"/>
          </comment>
          <pub-id pub-id-type="medline">30815137</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371359</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref112">
        <label>112</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pore</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sengeh</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Mugambi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Purswani</surname>
              <given-names>NV</given-names>
            </name>
            <name name-style="western">
              <surname>Sesay</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Arnold</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Myers</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Design and evaluation of a web-based decision support tool for district-level disease surveillance in a low-resource setting</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>1401</fpage>
          <lpage>10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854209"/>
          </comment>
          <pub-id pub-id-type="medline">29854209</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977610</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref113">
        <label>113</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Iyer</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>DuttaDuwarah</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>DataScope: Interactive Visual Exploratory Dashboards for Large Multidimensional Data</article-title>
          <source>Workshop on Visual Analytics in Healthcare</source>
          <year>2017</year>
          <conf-name>VAHC'17</conf-name>
          <conf-date>October 1, 2017</conf-date>
          <conf-loc>Phoenix, AZ, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/vahc.2017.8387496</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref114">
        <label>114</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anscombe</surname>
              <given-names>FJ</given-names>
            </name>
          </person-group>
          <article-title>Graphs in statistical analysis</article-title>
          <source>Am Stat</source>
          <year>1973</year>
          <month>02</month>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>17</fpage>
          <pub-id pub-id-type="doi">10.2307/2682899</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref115">
        <label>115</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shneiderman</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The eyes have it: a task by data type taxonomy for information visualizations</article-title>
          <source>Proceedings 1996 IEEE Symposium on Visual Languages</source>
          <year>2003</year>
          <conf-name>IEEE Symposium on Visual Languages</conf-name>
          <conf-date>August 6, 2002</conf-date>
          <conf-loc>Boulder, CO, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1016/b978-155860915-0/50046-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref116">
        <label>116</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vartak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Madden</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Parameswaran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Polyzotis</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>SeeDB: automatically generating query visualizations</article-title>
          <source>Proc VLDB Endow</source>
          <year>2014</year>
          <month>08</month>
          <volume>7</volume>
          <issue>13</issue>
          <fpage>1581</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.14778/2733004.2733035</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref117">
        <label>117</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moritz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Howe</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Formalizing visualization design knowledge as constraints: actionable and extensible models in draco</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2019</year>
          <month>01</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>438</fpage>
          <lpage>48</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2018.2865240</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref118">
        <label>118</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Demiralp</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haas</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Parthasarathy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pedapati</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Foresight: recommending visual insights</article-title>
          <source>Proc VLDB Endow</source>
          <year>2017</year>
          <month>08</month>
          <day>1</day>
          <volume>10</volume>
          <issue>12</issue>
          <fpage>1937</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.14778/3137765.3137813</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref119">
        <label>119</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caballero</surname>
              <given-names>GC</given-names>
            </name>
          </person-group>
          <article-title>Visual Analytics for Evaluating Clinical Pathways</article-title>
          <source>Workshop on Visual Analytics in Healthcare</source>
          <year>2017</year>
          <conf-name>VAHC'17</conf-name>
          <conf-date>October 1, 2017</conf-date>
          <conf-loc>Phoenix, AZ, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/vahc.2017.8387499</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref120">
        <label>120</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Widanagamaachchi</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Livnat</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bremer</surname>
              <given-names>PT</given-names>
            </name>
            <name name-style="western">
              <surname>Duvall</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pascucci</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Interactive visualization and exploration of patient progression in a hospital setting</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>1773</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="medline">29854248</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977592</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref121">
        <label>121</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>GQ</given-names>
            </name>
          </person-group>
          <article-title>SpindleSphere: a web-based platform for large-scale sleep spindle analysis and visualization</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>1159</fpage>
          <lpage>68</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854184"/>
          </comment>
          <pub-id pub-id-type="medline">29854184</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977590</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref122">
        <label>122</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mortensen</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Musen</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Noy</surname>
              <given-names>NF</given-names>
            </name>
          </person-group>
          <article-title>An empirically derived taxonomy of errors in SNOMED CT</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>899</fpage>
          <lpage>906</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954397"/>
          </comment>
          <pub-id pub-id-type="medline">25954397</pub-id>
          <pub-id pub-id-type="pmcid">PMC4419962</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref123">
        <label>123</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Wasserman</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenau</surname>
              <given-names>PT</given-names>
            </name>
            <name name-style="western">
              <surname>Howard</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Sarkar</surname>
              <given-names>IN</given-names>
            </name>
          </person-group>
          <article-title>Mining and visualizing family history associations in the electronic health record: a case study for Pediatric Asthma</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2015</year>
          <volume>2015</volume>
          <fpage>396</fpage>
          <lpage>405</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26958171"/>
          </comment>
          <pub-id pub-id-type="medline">26958171</pub-id>
          <pub-id pub-id-type="pmcid">PMC4765567</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref124">
        <label>124</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sockolow</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bass</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bowles</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Holmberg</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sheryl</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Data visualization of home care admission nurses' decision-making</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>1597</fpage>
          <lpage>606</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854230"/>
          </comment>
          <pub-id pub-id-type="medline">29854230</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977644</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref125">
        <label>125</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kummerfeld</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Anker</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Rix</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kushner</surname>
              <given-names>MG</given-names>
            </name>
          </person-group>
          <article-title>Methodological advances in the study of hidden variables: a demonstration on clinical alcohol use disorder data</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>710</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30815113"/>
          </comment>
          <pub-id pub-id-type="medline">30815113</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371371</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref126">
        <label>126</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarawagi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Megiddo</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Discovery-driven Exploration of OLAP Data Cubes</article-title>
          <source>International Conference on Extending Database Technology</source>
          <year>1998</year>
          <conf-name>EDBT'98</conf-name>
          <conf-date>March 23-27, 1998</conf-date>
          <conf-loc>Valencia, Spain</conf-loc>
          <pub-id pub-id-type="doi">10.1007/bfb0100984</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref127">
        <label>127</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sordo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tokachichu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Vitale</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Maviglia</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Rocha</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Modeling contextual knowledge for clinical decision support</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>1617</fpage>
          <lpage>1624</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854232"/>
          </comment>
          <pub-id pub-id-type="medline">29854232</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977672</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref128">
        <label>128</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gangadhar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Pesuit</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Bogdanov</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Kallenbach</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ken</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vasey</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Loomis</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Effectiveness of a cloud-based EHR clinical decision support program for body mass index (BMI) screening and follow-up</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>742</fpage>
          <lpage>749</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854140"/>
          </comment>
          <pub-id pub-id-type="medline">29854140</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977575</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref129">
        <label>129</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Souissi</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Abed</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elhiki</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fortemps</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pirlot</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Reducing the toxicity risk in antibiotic prescriptions by combining ontologies with a multiple criteria decision model</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>1625</fpage>
          <lpage>1634</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854233"/>
          </comment>
          <pub-id pub-id-type="medline">29854233</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977731</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref130">
        <label>130</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cardoso</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Chantal</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Da Silveira</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pruski</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Combining rules, background knowledge and change patterns to maintain semantic annotations</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>505</fpage>
          <lpage>514</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854115"/>
          </comment>
          <pub-id pub-id-type="medline">29854115</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977713</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref131">
        <label>131</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hedda</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Malin</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fabbri</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the effectiveness of auditing rules for electronic health record systems</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>866</fpage>
          <lpage>875</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854153"/>
          </comment>
          <pub-id pub-id-type="medline">29854153</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref132">
        <label>132</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caruana</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gehrke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koch</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sturm</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Intelligible Models for HealthCare: Predicting Pneumonia Risk and Hospital 30-day Readmission</article-title>
          <source>Proceedings of the 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
          <year>2015</year>
          <conf-name>KDD'15</conf-name>
          <conf-date>August 10-13, 2015</conf-date>
          <conf-loc>Sydney, Australia</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2783258.2788613</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref133">
        <label>133</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Che</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>St Sauver</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Deep learning solutions for classifying patients on opioid use</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>525</fpage>
          <lpage>34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854117"/>
          </comment>
          <pub-id pub-id-type="medline">29854117</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977635</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref134">
        <label>134</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Huh</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>YR</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Turchin</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>An interpretable ICU mortality prediction model based on logistic regression and recurrent neural networks with LSTM units</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>460</fpage>
          <lpage>469</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30815086"/>
          </comment>
          <pub-id pub-id-type="medline">30815086</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref135">
        <label>135</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Speier</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>El-Saden</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Arnold</surname>
              <given-names>CW</given-names>
            </name>
          </person-group>
          <article-title>Classifying acute ischemic stroke onset time using deep imaging features</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>892</fpage>
          <lpage>901</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854156"/>
          </comment>
          <pub-id pub-id-type="medline">29854156</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977679</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref136">
        <label>136</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ming</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bertini</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>RuleMatrix: visualizing and understanding classifiers with rules</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2019</year>
          <month>01</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>342</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2018.2864812</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref137">
        <label>137</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Evaluating interactive data systems</article-title>
          <source>VLDB J</source>
          <year>2019</year>
          <month>11</month>
          <day>13</day>
          <volume>29</volume>
          <issue>1</issue>
          <fpage>119</fpage>
          <lpage>46</lpage>
          <pub-id pub-id-type="doi">10.1007/s00778-019-00589-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref138">
        <label>138</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Domingos</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Halevy</surname>
              <given-names>AY</given-names>
            </name>
          </person-group>
          <article-title>Reconciling schemas of disparate data sources</article-title>
          <source>SIGMOD Rec</source>
          <year>2001</year>
          <month>06</month>
          <volume>30</volume>
          <issue>2</issue>
          <fpage>509</fpage>
          <lpage>20</lpage>
          <pub-id pub-id-type="doi">10.1145/376284.375731</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref139">
        <label>139</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Do</surname>
              <given-names>HH</given-names>
            </name>
            <name name-style="western">
              <surname>Rahm</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>COMA - a system for flexible combination of schema matching approaches</article-title>
          <source>Proceedings of 28th International Conference on Very Large Data Bases</source>
          <year>2002</year>
          <conf-name>28th International Conference on Very Large Data Bases</conf-name>
          <conf-date>August 20-23, 2002</conf-date>
          <conf-loc>Hong Kong, China</conf-loc>
          <pub-id pub-id-type="doi">10.1016/b978-155860869-6/50060-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref140">
        <label>140</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kannan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Madhavan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Halevy</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Exploring schema repositories with schemr</article-title>
          <source>SIGMOD Rec</source>
          <year>2011</year>
          <month>07</month>
          <day>18</day>
          <volume>40</volume>
          <issue>1</issue>
          <fpage>11</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1145/2007206.2007210</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref141">
        <label>141</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahm</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>A survey of approaches to automatic schema matching</article-title>
          <source>VLDB J . 334?</source>
          <year>2001</year>
          <volume>10</volume>
          <issue>4</issue>
          <fpage>350</fpage>
          <pub-id pub-id-type="doi">10.1007/s007780100057</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref142">
        <label>142</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>HAMSTER: using search clicklogs for schema and taxonomy matching</article-title>
          <source>Proc VLDB Endow</source>
          <year>2009</year>
          <month>08</month>
          <day>1</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>181</fpage>
          <lpage>92</lpage>
          <pub-id pub-id-type="doi">10.14778/1687627.1687649</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref143">
        <label>143</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Synthesizing Mapping Relationships Using Table Corpus</article-title>
          <source>Proceedings of the 2017 ACM International Conference on Management of Data</source>
          <year>2017</year>
          <conf-name>SIGMOD'17</conf-name>
          <conf-date>May 14-17, 2017</conf-date>
          <conf-loc>Chicago, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3035918.3064010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref144">
        <label>144</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ives</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Knoblock</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Minton</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jacob</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Talukdar</surname>
              <given-names>PP</given-names>
            </name>
            <name name-style="western">
              <surname>Tuchinda</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ambite</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Muslea</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gazen</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <source>arXiv</source>
          <year>2009</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://talukdar.net/papers/cidr.pdf">http://talukdar.net/papers/cidr.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref145">
        <label>145</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kraska</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Franklin</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>CrowdER: crowdsourcing entity resolution</article-title>
          <source>Proc VLDB Endow</source>
          <year>2012</year>
          <month>07</month>
          <volume>5</volume>
          <issue>11</issue>
          <fpage>1483</fpage>
          <lpage>94</lpage>
          <pub-id pub-id-type="doi">10.14778/2350229.2350263</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref146">
        <label>146</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cafarella</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Halevy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Madhavan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>DZ</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Ten years of webtables</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>08</month>
          <day>1</day>
          <volume>11</volume>
          <issue>12</issue>
          <fpage>2140</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.14778/3229863.3240492</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref147">
        <label>147</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>XL</given-names>
            </name>
            <name name-style="western">
              <surname>Halevy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Data integration with uncertainty</article-title>
          <source>VLDB J</source>
          <year>2008</year>
          <month>11</month>
          <day>14</day>
          <volume>18</volume>
          <issue>2</issue>
          <fpage>469</fpage>
          <lpage>500</lpage>
          <pub-id pub-id-type="doi">10.1007/s00778-008-0119-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref148">
        <label>148</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jagadish</surname>
              <given-names>HV</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Reducing uncertainty of schema matching via crowdsourcing with accuracy rates</article-title>
          <source>IEEE Trans. Knowl Data Eng</source>
          <year>2020</year>
          <month>01</month>
          <day>1</day>
          <volume>32</volume>
          <issue>1</issue>
          <fpage>135</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="doi">10.1109/tkde.2018.2881185</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref149">
        <label>149</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cafarella</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Halevy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Khoussainova</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Data integration for the relational web</article-title>
          <source>Proc VLDB Endow</source>
          <year>2009</year>
          <month>08</month>
          <day>1</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>1090</fpage>
          <lpage>101</lpage>
          <pub-id pub-id-type="doi">10.14778/1687627.1687750</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref150">
        <label>150</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Madhavan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jeffery</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ko</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Halevy</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Web-scale Data Integration: You can only afford to Pay As You Go</article-title>
          <source>MIT</source>
          <year>2007</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://web.mit.edu/tibbetts/Public/CIDR_2007_Proceedings/papers/cidr07p40.pdf">http://web.mit.edu/tibbetts/Public/CIDR_2007_Proceedings/papers/cidr07p40.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref151">
        <label>151</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Limaye</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sarawagi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chakrabarti</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Annotating and searching web tables using entities, types and relationships</article-title>
          <source>Proc VLDB Endow</source>
          <year>2010</year>
          <month>09</month>
          <volume>3</volume>
          <issue>1-2</issue>
          <fpage>1338</fpage>
          <lpage>47</lpage>
          <pub-id pub-id-type="doi">10.14778/1920841.1921005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref152">
        <label>152</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>Open data integration</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>08</month>
          <day>1</day>
          <volume>11</volume>
          <issue>12</issue>
          <fpage>2130</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.14778/3229863.3240491</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref153">
        <label>153</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fernandez</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Mansour</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Qahtan</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Elmagarmid</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ilyas</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Madden</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ouzzani</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Seeping semantics: Linking datasets using word embeddings for data discovery</article-title>
          <year>2018</year>
          <conf-name>IEEE 34th International Conference on Data Engineering</conf-name>
          <conf-date>October 25, 2018</conf-date>
          <conf-loc>Paris, France</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icde.2018.00093</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref154">
        <label>154</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Veltri</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Santoro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mecca</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Papotti</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Interactive and Deterministic Data Cleaning</article-title>
          <source>Proceedings of the  International Conference on Management of Data</source>
          <year>2016</year>
          <conf-name>SIGMOD '16</conf-name>
          <conf-date>June 2016</conf-date>
          <conf-loc>New York</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2882903.2915242</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref155">
        <label>155</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bergman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Milo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Novgorodov</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>WC</given-names>
            </name>
          </person-group>
          <article-title>Query-oriented data cleaning with oracles</article-title>
          <source>Proceedings of the 2015 ACM SIGMOD International Conference on Management of Data</source>
          <year>2015</year>
          <conf-name>SIGMOD '15</conf-name>
          <conf-date>May, 2015</conf-date>
          <conf-loc>New York</conf-loc>
          <fpage>1199</fpage>
          <lpage>1214</lpage>
          <pub-id pub-id-type="doi">10.1145/2723372.2737786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref156">
        <label>156</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Assadi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Milo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Novgorodov</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Cleaning Data with Constraints and Experts</article-title>
          <source>Proceedings of the 21st International Workshop on the Web and Databases</source>
          <year>2018</year>
          <conf-name>WebDB'18</conf-name>
          <conf-date>June 10, 2018</conf-date>
          <conf-loc>Houston, TX, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3201463.3201464</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref157">
        <label>157</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Geerts</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lakshmanan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xiong</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Discovering conditional functional dependencies</article-title>
          <source>Proceedings of the 25th International Conference on Data Engineering</source>
          <year>2011</year>
          <conf-name>International Conference on Data Engineering</conf-name>
          <conf-date>March 29, 2009 - April 2, 2009</conf-date>
          <conf-loc>Shanghai, China</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icde.2009.208</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref158">
        <label>158</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chiang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>Discovering data quality rules</article-title>
          <source>Proc VLDB Endow</source>
          <year>2008</year>
          <month>08</month>
          <day>1</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>1166</fpage>
          <lpage>77</lpage>
          <pub-id pub-id-type="doi">10.14778/1453856.1453980</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref159">
        <label>159</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Golab</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Karloff</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Korn</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Srivastava</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>On generating near-optimal tableaux for conditional functional dependencies</article-title>
          <source>Proc VLDB Endow</source>
          <year>2008</year>
          <month>08</month>
          <day>1</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>376</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.14778/1453856.1453900</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref160">
        <label>160</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cong</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Geerts</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jia</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Improving data quality: consistency and accuracy</article-title>
          <source>VLDB J</source>
          <year>2007</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://homepages.inf.ed.ac.uk/wenfei/papers/vldb07-b.pdf">http://homepages.inf.ed.ac.uk/wenfei/papers/vldb07-b.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref161">
        <label>161</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Geerts</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Foundations of data quality management</article-title>
          <source>Synth Lect Data Manag</source>
          <year>2012</year>
          <month>07</month>
          <day>31</day>
          <volume>4</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <lpage>217</lpage>
          <pub-id pub-id-type="doi">10.2200/s00439ed1v01y201207dtm030</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref162">
        <label>162</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>DZ</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>XL</given-names>
            </name>
            <name name-style="western">
              <surname>Sarma</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Franklin</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Functional dependency generation and applications in pay-as-you-go data integration systems</article-title>
          <year>2009</year>
          <conf-name>12th International Workshop on the Web and Databases</conf-name>
          <conf-date>June 28, 2009</conf-date>
          <conf-loc>Providence, Rhode Island, USA</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref163">
        <label>163</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rammelaere</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Geerts</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Explaining repaired data with CFDs</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>07</month>
          <day>1</day>
          <volume>11</volume>
          <issue>11</issue>
          <fpage>1387</fpage>
          <lpage>99</lpage>
          <pub-id pub-id-type="doi">10.14778/3236187.3236193</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref164">
        <label>164</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ilyas</surname>
              <given-names>IF</given-names>
            </name>
            <name name-style="western">
              <surname>Markl</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Haas</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Aboulnaga</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>CORDS: Automatic Discovery of Correlations and Soft Functional Dependencies</article-title>
          <source>Proceedings of the 2004 ACM SIGMOD international conference on Management of data</source>
          <year>2004</year>
          <conf-name>SIGMOD'14</conf-name>
          <conf-date>June 13-18, 2004</conf-date>
          <conf-loc>Paris</conf-loc>
          <pub-id pub-id-type="doi">10.1145/1007568.1007641</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref165">
        <label>165</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Asghar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ghenai</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Automatic discovery of functional dependencies and conditional functional dependencies: a comparative study</article-title>
          <source>University of Waterloo</source>
          <year>2015</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cs.uwaterloo.ca/~nasghar/848.pdf">https://cs.uwaterloo.ca/~nasghar/848.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref166">
        <label>166</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>De Sa</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ratner</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ré</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>DeepDive: declarative knowledge base construction</article-title>
          <source>SIGMOD Rec</source>
          <year>2016</year>
          <month>06</month>
          <day>2</day>
          <volume>45</volume>
          <issue>1</issue>
          <fpage>60</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1145/2949741.2949756</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref167">
        <label>167</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Varma</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ré</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Snuba: automating weak supervision to label training data</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>11</month>
          <day>1</day>
          <volume>12</volume>
          <issue>3</issue>
          <fpage>223</fpage>
          <lpage>36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31777681"/>
          </comment>
          <pub-id pub-id-type="doi">10.14778/3291264.3291268</pub-id>
          <pub-id pub-id-type="medline">31777681</pub-id>
          <pub-id pub-id-type="pmcid">PMC6879381</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref168">
        <label>168</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Felix</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dasgupta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bertini</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The Exploratory Labeling Assistant: Mixed-Initiative Label Curation with Large Document Collections Share on</article-title>
          <source>Proceedings of the 31st Annual ACM Symposium on User Interface Software and Technology</source>
          <year>2018</year>
          <conf-name>UIST'18</conf-name>
          <conf-date>June 1-5, 2018</conf-date>
          <conf-loc>New York, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3242587.3242596</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref169">
        <label>169</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Kao</surname>
              <given-names>HY</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>PubTator: a web-based text mining tool for assisting biocuration</article-title>
          <source>Nucleic Acids Res</source>
          <year>2013</year>
          <month>07</month>
          <volume>41</volume>
          <issue>Web Server issue</issue>
          <fpage>W518</fpage>
          <lpage>22</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23703206"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkt441</pub-id>
          <pub-id pub-id-type="medline">23703206</pub-id>
          <pub-id pub-id-type="pii">gkt441</pub-id>
          <pub-id pub-id-type="pmcid">PMC3692066</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref170">
        <label>170</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Leaman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>ezTag: tagging biomedical concepts via interactive learning</article-title>
          <source>Nucleic Acids Res</source>
          <year>2018</year>
          <month>07</month>
          <day>2</day>
          <volume>46</volume>
          <issue>W1</issue>
          <fpage>W523</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29788413"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gky428</pub-id>
          <pub-id pub-id-type="medline">29788413</pub-id>
          <pub-id pub-id-type="pii">4999245</pub-id>
          <pub-id pub-id-type="pmcid">PMC6030907</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref171">
        <label>171</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nazi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Narasayya</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhuri</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Efficient estimation of inclusion coefficient using hyperloglog sketches</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>06</month>
          <day>1</day>
          <volume>11</volume>
          <issue>10</issue>
          <fpage>1097</fpage>
          <lpage>109</lpage>
          <pub-id pub-id-type="doi">10.14778/3231751.3231759</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref172">
        <label>172</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Efficient Foreign Key Discovery Based on Nearest Neighbor Search</article-title>
          <source>International Conference on Web-Age Information Management</source>
          <year>2015</year>
          <conf-name>WAIM'15</conf-name>
          <conf-date>June 8-10, 2015</conf-date>
          <conf-loc>Qingdao, China</conf-loc>
          <pub-id pub-id-type="doi">10.1007/978-3-319-21042-1_37</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref173">
        <label>173</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Motl</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kordik</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Foreign key constraint identification in relational databases</article-title>
          <source>Czech Technical University in Prague</source>
          <year>2017</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://ceur-ws.org/Vol-1885/106.pdf">http://ceur-ws.org/Vol-1885/106.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref174">
        <label>174</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Koehler</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Link</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Inclusion Dependencies Reloaded</article-title>
          <source>Proceedings of the 24th ACM International on Conference on Information and Knowledge Management</source>
          <year>2015</year>
          <conf-name>CIKM '15</conf-name>
          <conf-date>October, 2015</conf-date>
          <conf-loc>Melbourne Australia</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref175">
        <label>175</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Narasayya</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhuri</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Fast foreign-key detection in Microsoft SQL server PowerPivot for Excel</article-title>
          <source>Proc VLDB Endow</source>
          <year>2014</year>
          <month>08</month>
          <volume>7</volume>
          <issue>13</issue>
          <fpage>1417</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.14778/2733004.2733014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref176">
        <label>176</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moritz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Howe</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Falcon: Balancing interactive latency and resolution sensitivity for scalable linked visualizations,?</article-title>
          <source>University of Washington</source>
          <year>2019</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://idl.cs.washington.edu/files/2019-Falcon-CHI.pdf">https://idl.cs.washington.edu/files/2019-Falcon-CHI.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref177">
        <label>177</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kamat</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jayachandran</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tunga</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Distributed and Interactive Cube Exploration</article-title>
          <source>30th International Conference on Data Engineering</source>
          <year>2014</year>
          <conf-name>ICDE'14</conf-name>
          <conf-date>March 31-April 4, 2014</conf-date>
          <conf-loc>Chicago, IL, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icde.2014.6816674</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref178">
        <label>178</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lins</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Klosowski</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Scheidegger</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Nanocubes for real-time exploration of spatiotemporal datasets</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2013</year>
          <month>12</month>
          <volume>19</volume>
          <issue>12</issue>
          <fpage>2456</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2013.179</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref179">
        <label>179</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pahins</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Stephens</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Scheidegger</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Comba</surname>
              <given-names>JL</given-names>
            </name>
          </person-group>
          <article-title>Hashedcubes: simple, low memory, real-time visual exploration of big data</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2017</year>
          <month>01</month>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>671</fpage>
          <lpage>80</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2016.2598624</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref180">
        <label>180</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Joglekar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia-Molina</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Parameswaran</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Interactive Data Exploration With Smart Drill-down</article-title>
          <source>32nd International Conference on Data Engineering</source>
          <year>2016</year>
          <conf-name>ICDE'16</conf-name>
          <conf-date>May 16-20, 2016</conf-date>
          <conf-loc>Helsinki, Finland</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icde.2016.7498300</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref181">
        <label>181</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dimitriadou</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Papaemmanouil</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Diao</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>AIDE: an active learning-based approach for interactive data exploration</article-title>
          <source>IEEE Trans Knowl Data Eng</source>
          <year>2016</year>
          <month>11</month>
          <day>1</day>
          <volume>28</volume>
          <issue>11</issue>
          <fpage>2842</fpage>
          <lpage>56</lpage>
          <pub-id pub-id-type="doi">10.1109/tkde.2016.2599168</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref182">
        <label>182</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Psallidas</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Smoke</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>02</month>
          <day>1</day>
          <volume>11</volume>
          <issue>6</issue>
          <fpage>719</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.14778/3199517.3199522</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref183">
        <label>183</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Madden</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Scorpion</article-title>
          <source>Proc VLDB Endow</source>
          <year>2013</year>
          <month>06</month>
          <volume>6</volume>
          <issue>8</issue>
          <fpage>553</fpage>
          <lpage>64</lpage>
          <pub-id pub-id-type="doi">10.14778/2536354.2536356</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref184">
        <label>184</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kandel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Parikh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Paepcke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hellerstein</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Profiler: Integrated Statistical Analysis and Visualization for Data Quality Assessment</article-title>
          <source>Stanford Univeristy</source>
          <year>2012</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://vis.stanford.edu/papers/profiler">http://vis.stanford.edu/papers/profiler</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref185">
        <label>185</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Correll</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kindlmann</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Scheidegger</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Looks good to me: visualizations as sanity checks</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2019</year>
          <month>01</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>830</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2018.2864907</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref186">
        <label>186</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wongsuphasawat</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Moritz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Qu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ouk</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Anand</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mackinlay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Howe</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Voyager 2: Augmenting Visual Analysis with Partial View Specifications</article-title>
          <source>University of Washington</source>
          <year>2017</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://idl.cs.washington.edu/files/2017-Voyager2-CHI.pdf">https://idl.cs.washington.edu/files/2017-Voyager2-CHI.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref187">
        <label>187</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Willett</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawala</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Scented widgets: improving navigation cues with embedded visualizations</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2007</year>
          <month>11</month>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>1129</fpage>
          <lpage>36</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2007.70589</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref188">
        <label>188</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Preim</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lawonn</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A survey of visual analytics for public health</article-title>
          <source>Computer Graphics Forum</source>
          <year>2019</year>
          <month>11</month>
          <day>28</day>
          <volume>39</volume>
          <issue>1</issue>
          <fpage>543</fpage>
          <lpage>80</lpage>
          <pub-id pub-id-type="doi">10.1111/cgf.13891</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref189">
        <label>189</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Holzinger</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Biemann</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pattichis</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Kell</surname>
              <given-names>DB</given-names>
            </name>
          </person-group>
          <article-title>What do we need to build explainable AI systems for the medical domain?</article-title>
          <source>arXiv</source>
          <year>2017</year>
          <fpage>9923</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref190">
        <label>190</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Montavon</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Samek</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Methods for interpreting and understanding deep neural networks</article-title>
          <source>Digi Signal Process</source>
          <year>2018</year>
          <month>02</month>
          <volume>73</volume>
          <fpage>1</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1016/j.dsp.2017.10.011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref191">
        <label>191</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alspaugh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zokaei</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hearst</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Futzing and moseying: interviews with professional data analysts on exploration practices</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2019</year>
          <month>01</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>22</fpage>
          <lpage>31</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2018.2865040</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref192">
        <label>192</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stoyanovich</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Howe</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jagadish</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Miklau</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Panel: a debate on data and algorithmic ethics</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>08</month>
          <day>1</day>
          <volume>11</volume>
          <issue>12</issue>
          <fpage>2165</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.14778/3229863.3240494</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref193">
        <label>193</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jongejaan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Holbrook</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The effects of example-based explanations in a machine learning interface</article-title>
          <source>Proceedings of the 24th International Conference on Intelligent User Interfaces</source>
          <year>2019</year>
          <conf-name>IUI '19</conf-name>
          <conf-date>March, 2019</conf-date>
          <conf-loc>New York</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref194">
        <label>194</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Tpflow: progressive partition and multidimensional pattern extraction for large-scale spatio-temporal data analysis</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2019</year>
          <month>01</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2018.2865018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref195">
        <label>195</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hellerstein</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Data tweening: incremental visualization of data transforms</article-title>
          <source>Proc VLDB Endow</source>
          <year>2017</year>
          <month>02</month>
          <day>1</day>
          <volume>10</volume>
          <issue>6</issue>
          <fpage>661</fpage>
          <lpage>72</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref196">
        <label>196</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Acree</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Patros</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Suseno</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Grant</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fleming</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hadsell</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Semel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hebert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A novel inpatient Antibiotic Stewardship Assistance Program (ASAP) using real-time electronic health record data, prediction modeling and epidemiologic data to provide personalized empiric antibiotic recommendations</article-title>
          <source>Open Forum Infect Dis</source>
          <year>2018</year>
          <month>11</month>
          <volume>5</volume>
          <issue>Suppl 1</issue>
          <pub-id pub-id-type="doi">10.1093/ofid/ofy210.201</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref197">
        <label>197</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kamat</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A session-based approach to fast-but-approximate interactive data cube exploration</article-title>
          <source>ACM Trans Knowl Discov Data</source>
          <year>2018</year>
          <month>02</month>
          <day>23</day>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1145/3070648</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref198">
        <label>198</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Battle</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Stonebraker</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Dynamic prefetching of data tiles for interactive visualization</article-title>
          <source>Proceedings of the  International Conference on Management of Data</source>
          <year>2016</year>
          <conf-name>SIGMOD '16</conf-name>
          <conf-date>June, 2016</conf-date>
          <conf-loc>New York</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref199">
        <label>199</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Takayama</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kandogan</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Trust as an underlying factor of system administrator interface choice</article-title>
          <source>Extended Abstracts on Human Factors in Computing Systems</source>
          <year>2006</year>
          <conf-name>CHI EA '06</conf-name>
          <conf-date>April, 2006</conf-date>
          <conf-loc>Montréal Québec Canada</conf-loc>
          <pub-id pub-id-type="doi">10.1145/1125451.1125708</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref200">
        <label>200</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Idreos</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liarou</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>dbTouch: Analytics at your Fingertips</article-title>
          <source>Stanford Univeristy</source>
          <year>2013</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www-cs-students.stanford.edu/~adityagp/courses/cs598-old/papers/dbtouch.pdf">http://www-cs-students.stanford.edu/~adityagp/courses/cs598-old/papers/dbtouch.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref201">
        <label>201</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bendre</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Parameswaran</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>DataSpread</article-title>
          <source>Proc VLDB Endow</source>
          <year>2015</year>
          <month>08</month>
          <volume>8</volume>
          <issue>12</issue>
          <fpage>2000</fpage>
          <lpage>3</lpage>
          <pub-id pub-id-type="doi">10.14778/2824032.2824121</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref202">
        <label>202</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ozcan</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Koutrika</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Expressive Query Construction through Direct Manipulation of Nested Relational Results</article-title>
          <source>Proceedings of the 2016 International Conference on Management of Data</source>
          <year>2016</year>
          <conf-name>SIGMOD '16</conf-name>
          <conf-date>June 2016</conf-date>
          <conf-loc>San Francisco, California</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref203">
        <label>203</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schaffer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>O'Donovan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Michaelis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Raglin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Höllerer</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>I can do better than your AI: expertise and explanations</article-title>
          <source>Proceedings of the 24th International Conference on Intelligent User Interfaces</source>
          <year>2019</year>
          <conf-name>IUI '19</conf-name>
          <conf-date>March 2019</conf-date>
          <conf-loc>Marina del Ray, California</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3301275.3302308</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref204">
        <label>204</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arnold</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Collier</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Leech</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Sutton</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The differential use and effect of knowledge-based system explanations in novice and expert judgment decisions</article-title>
          <source>MIS Q</source>
          <year>2006</year>
          <volume>30</volume>
          <issue>1</issue>
          <fpage>79</fpage>
          <pub-id pub-id-type="doi">10.2307/25148718</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref205">
        <label>205</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dror</surname>
              <given-names>IE</given-names>
            </name>
          </person-group>
          <article-title>A hierarchy of expert performance</article-title>
          <source>J Appl Res Memory Cogn</source>
          <year>2016</year>
          <month>06</month>
          <volume>5</volume>
          <issue>2</issue>
          <fpage>121</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jarmac.2016.03.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref206">
        <label>206</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mason</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Suri</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Conducting behavioral research on Amazon's Mechanical Turk</article-title>
          <source>Behav Res Methods</source>
          <year>2012</year>
          <month>03</month>
          <volume>44</volume>
          <issue>1</issue>
          <fpage>23</fpage>
          <pub-id pub-id-type="doi">10.3758/s13428-011-0124-6</pub-id>
          <pub-id pub-id-type="medline">21717266</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref207">
        <label>207</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Czerwinski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lund</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Crowdsourcing user studies with Mechanical Turk</article-title>
          <source>Proceedings of the SIGCHI Conference on Human Factors in Computing Systems</source>
          <year>2008</year>
          <conf-name>CHI '08</conf-name>
          <conf-date>April, 2008</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref208">
        <label>208</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarma</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Parameswaran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Widom</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Towards Globally Optimal Crowdsourcing Quality Management: The Uniform Worker Setting</article-title>
          <source>Proceedings of the 2016 International Conference on Management of Data</source>
          <year>2016</year>
          <conf-name>SIGMOD '16</conf-name>
          <conf-date>June, 2016</conf-date>
          <conf-loc>San Francisco, California</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref209">
        <label>209</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kandogan</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Roth</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shwarz</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hui</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Terizzano</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Christodoulakis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>LabBook: Metadata-driven social collaborative data analysis</article-title>
          <year>2015</year>
          <conf-name>2015 IEEE International Conference on Big Data (Big Data)</conf-name>
          <conf-date>2015</conf-date>
          <conf-loc>Santa Clara, California</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref210">
        <label>210</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hellerstein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sreekanti</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Dalton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nag</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ramachandran</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Arora</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bhattacharyya</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Ground: A Data Context Service</article-title>
          <source>Conference on Innovative Data Systems Research</source>
          <year>2017</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://cidrdb.org/cidr2017/papers/p111-hellerstein-cidr17.pdf">http://cidrdb.org/cidr2017/papers/p111-hellerstein-cidr17.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref211">
        <label>211</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kandel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Paepcke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hellerstein</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Enterprise data analysis and visualization: an interview study</article-title>
          <source>IEEE Trans Visual Comput Graphics</source>
          <year>2012</year>
          <month>12</month>
          <volume>18</volume>
          <issue>12</issue>
          <fpage>2917</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1109/tvcg.2012.219</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref212">
        <label>212</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kandogan</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Balakrishnan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haber</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Pierce</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>From data to insight: work practices of analysts in the enterprise</article-title>
          <source>IEEE Comput Grap Appl</source>
          <year>2014</year>
          <month>09</month>
          <volume>34</volume>
          <issue>5</issue>
          <fpage>42</fpage>
          <lpage>50</lpage>
          <pub-id pub-id-type="doi">10.1109/mcg.2014.62</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref213">
        <label>213</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jagdish</surname>
              <given-names>HV</given-names>
            </name>
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>Li</given-names>
            </name>
          </person-group>
          <article-title>Organic databases</article-title>
          <source>Databases in Networked Information Systems</source>
          <year>2011</year>
          <publisher-loc>Berlin, Heidelberg</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>49</fpage>
          <lpage>63</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref214">
        <label>214</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Embi</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Yackel</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Logan</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Bowen</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Cooney</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>Gorman</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>Impacts of computerized physician documentation in a teaching hospital: perceptions of faculty and resident physicians</article-title>
          <source>J Am Med Inf Assoc</source>
          <year>2004</year>
          <month>04</month>
          <day>2</day>
          <volume>11</volume>
          <issue>4</issue>
          <fpage>300</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1197/jamia.m1525</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref215">
        <label>215</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Transformer: a database-driven approach to generating forms for constrained interaction</article-title>
          <source>Proceedings of the 24th International Conference on Intelligent User Interfaces</source>
          <year>2019</year>
          <conf-name>IUI '19</conf-name>
          <conf-date>2019</conf-date>
          <conf-loc>Marina del Ray, California</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref216">
        <label>216</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hellerstein</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Parikh</surname>
              <given-names>TS</given-names>
            </name>
          </person-group>
          <article-title>Usher: improving data quality with dynamic forms</article-title>
          <source>IEEE Trans Knowl Data Eng</source>
          <year>2011</year>
          <month>08</month>
          <volume>23</volume>
          <issue>8</issue>
          <fpage>1138</fpage>
          <lpage>53</lpage>
          <pub-id pub-id-type="doi">10.1109/tkde.2011.31</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref217">
        <label>217</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gajos</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Weld</surname>
              <given-names>DS</given-names>
            </name>
          </person-group>
          <article-title>SUPPLE: Automatically Generating User Interfaces</article-title>
          <source>Harvard University</source>
          <year>2004</year>
          <access-date>2020-10-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.eecs.harvard.edu/~kgajos/papers/2004/supple-iui04.pdf">https://www.eecs.harvard.edu/~kgajos/papers/2004/supple-iui04.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref218">
        <label>218</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jayapandian</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jagadish</surname>
              <given-names>HV</given-names>
            </name>
          </person-group>
          <article-title>Automated creation of a forms-based database query interface</article-title>
          <source>Proceedings VLDB Endowment</source>
          <year>2008</year>
          <month>08</month>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>695</fpage>
          <lpage>709</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref219">
        <label>219</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hebert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Dewart</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lustberg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pancholi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Stevenson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Hade</surname>
              <given-names>EM</given-names>
            </name>
          </person-group>
          <article-title>Prediction of antibiotic susceptibility for urinary tract infection in a hospital setting</article-title>
          <source>Antimicrob Agents Chemother</source>
          <year>2020</year>
          <month>06</month>
          <day>23</day>
          <volume>64</volume>
          <issue>7</issue>
          <fpage>02236-19</fpage>
          <pub-id pub-id-type="doi">10.1128/aac.02236-19</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
