<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="review-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMI</journal-id>
            <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
            <journal-title>JMIR Medical Informatics</journal-title>
            <issn pub-type="epub">2291-9694</issn>
            <publisher>
                <publisher-name>Gunther Eysenbach</publisher-name>
                <publisher-loc>JMIR Publications Inc., Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v2i1e1</article-id>
            <article-id pub-id-type="pmid">25600256</article-id>
            <article-id pub-id-type="doi">10.2196/medinform.2913</article-id>
            <article-categories>
                <subj-group subj-group-type="article-type">
                    <subject>Review</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Big Data and Clinicians: A Review on the State of the Science</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Toldo</surname>
                        <given-names>Luca</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Gao</surname>
                        <given-names>Junfeng</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1">
                    <name name-style="western">
                        <surname>Wang</surname>
                        <given-names>Weiqi</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-4936-0977</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib2" corresp="yes">
                    <name name-style="western">
                        <surname>Krishnan</surname>
                        <given-names>Eswar</given-names>
                    </name>
                    <degrees>MD, MPH</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                    <address>
                        <institution>School of Medicine</institution>
                        <institution>Stanford University</institution>
                        <addr-line>1000 Welch Road, Suite 203</addr-line>
                        <addr-line>Palo Alto, CA, 94304</addr-line>
                        <country>United States</country>
                        <phone>1 650 725 8004</phone>
                        <fax>1 650 723 9656</fax>
                        <email>e.krishnan@stanford.edu</email>
                    </address>
                </contrib>
            </contrib-group>
            <aff id="aff1" rid="aff1">
                <sup>1</sup>
                <institution>School of Medicine</institution>
                <institution>Stanford University</institution>
                <addr-line>Palo Alto, CA</addr-line>
                <country>United States</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: Eswar Krishnan <email>e.krishnan@stanford.edu</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <season>Jan-Jun</season>
                <year>2014</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>17</day>
                <month>01</month>
                <year>2014</year>
            </pub-date>
            <volume>2</volume>
            <issue>1</issue>
            <elocation-id>e1</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>27</day>
                    <month>08</month>
                    <year>2013</year>
                </date>
                <date date-type="rev-request">
                    <day>27</day>
                    <month>10</month>
                    <year>2013</year>
                </date>
                <date date-type="rev-recd">
                    <day>25</day>
                    <month>11</month>
                    <year>2013</year>
                </date>
                <date date-type="accepted">
                    <day>08</day>
                    <month>12</month>
                    <year>2013</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Weiqi Wang, Eswar Krishnan. Originally published in JMIR Research Protocols (http://medinform.jmir.org), 17.01.2014. </copyright-statement>
            <copyright-year>2014</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.medinform.jmir.org/2014/1/e1/" xlink:type="simple" />
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p>In the past few decades, medically related data collection saw a huge increase, referred to as big data. These huge datasets bring challenges in storage, processing, and analysis. In clinical medicine, big data is expected to play an important role in identifying causality of patient symptoms, in predicting hazards of disease incidence or reoccurrence, and in improving primary-care quality.</p>
                </sec>
                <sec sec-type="objective">
                    <title>Objective</title>
                    <p>The objective of this review was to provide an overview of the features of clinical big data, describe a few commonly employed computational algorithms, statistical methods, and software toolkits for data manipulation and analysis, and discuss the challenges and limitations in this realm.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p>We conducted a literature review to identify studies on big data in medicine, especially clinical medicine. We used different
combinations of keywords to search PubMed, Science Direct, Web of Knowledge, and Google Scholar for literature of interest
from the past 10 years.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p>This paper reviewed studies that analyzed clinical big data and discussed issues related to storage and analysis of this type
of data.</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p>Big data is becoming a common feature of biological and clinical studies. Researchers who use clinical big data face multiple challenges, and the data itself has limitations. It is imperative that methodologies for data analysis keep pace with our ability to
collect and store data.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>big data</kwd>
                <kwd>database</kwd>
                <kwd>medical informatics</kwd>
                <kwd>clinical research</kwd>
                <kwd>medicine</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title> Introduction</title>
            <p>Big data refers to very large datasets with complex structures that are difficult to process using traditional methods and tools. The term process includes, capture, storage, formatting, extraction, curation, integration, analysis, and visualization [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. A popular definition of big data is the &#8220;3V&#8221; model proposed by Gartner [<xref ref-type="bibr" rid="ref10">10</xref>], which attributes three fundamental features to big data: high volume of data mass, high velocity of data flow, and high variety of data types. The notion of big data can be traced back to the 1970s [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>] when scientists realized that they lacked the tools to analyze datasets of large size. In those days, big data was merely several to hundreds of megabytes [<xref ref-type="bibr" rid="ref14">14</xref>]; now datasets of terabytes are common [<xref ref-type="bibr" rid="ref15">15</xref>, <xref ref-type="bibr" rid="ref16">16</xref>]. Therefore, the &#8220;big&#8221; in big data reflects the limits of data storage and computational power existing at a given point in time.</p>
            <p>
                <xref ref-type="table" rid="table1">Table 1</xref> shows the growth of global big data volume and computer science papers on big data since 2009. This table exemplifies that stored data will be in the tens of zettabytes range by 2020, and research on how to deal with big data will grow exponentially as well.</p>
            <p>Big data is gathered in many disciplines and is made possible by ubiquitous information-sensing devices and software [<xref ref-type="bibr" rid="ref19">19</xref>]. An example is web logs: websites such as Google or Facebook automatically record user information at each visit. Other examples come from the stock market [<xref ref-type="bibr" rid="ref20">20</xref>], earthquake surveillance [<xref ref-type="bibr" rid="ref21">21</xref>], political elections [<xref ref-type="bibr" rid="ref22">22</xref>], behavioral studies [<xref ref-type="bibr" rid="ref23">23</xref>], sports [<xref ref-type="bibr" rid="ref24">24</xref>], pharmaceutical reports [<xref ref-type="bibr" rid="ref25">25</xref>], health care [<xref ref-type="bibr" rid="ref26">26</xref>, <xref ref-type="bibr" rid="ref27">27</xref>], electronic medical records [<xref ref-type="bibr" rid="ref28">28</xref>], imaging data [<xref ref-type="bibr" rid="ref29">29</xref>], genome data [<xref ref-type="bibr" rid="ref30">30</xref>, <xref ref-type="bibr" rid="ref31">31</xref>], and entrepreneur transaction records [<xref ref-type="bibr" rid="ref32">32</xref>]. Data collection is sometimes interdisciplinary. As an example, a sudden increase in Google search terms such as &#8220;flu symptoms&#8221; and &#8220;flu treatments&#8221; can be used to predict an increase in flu patients presenting to hospital emergency rooms [<xref ref-type="bibr" rid="ref33">33</xref>]. This example also demonstrates that big data has promising predictive power and return on investment. Return on investment of big data has also been suggested for clinical big data [<xref ref-type="bibr" rid="ref34">34</xref>, <xref ref-type="bibr" rid="ref35">35</xref>].</p>
            <p>Although arguably valuable, big data is difficult to analyze due to the massive volume of the raw data and its diversity, as shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>. Therefore, instead of the raw big data, a large dataset is often extracted from the raw data to generate a secondary storage of data for analysis purposes. This data extraction is applied, for example, when a computer tomography scan is involved in clinical trials and only the physician diagnosis based on the scan is included in data analysis. Similarly, a large volume of descriptive data on various kinds of samplings, tests, or assays can be extracted with only the key parameters kept. As a consequence, the data analyzed in clinical medicine is usually from secondary datasets that contain only data of interest. The secondary datasets, although still large, are not terabytes in size. Additionally, due to the nature of clinical trials, a large dataset in clinical medicine usually does not have an overwhelming number of samples. Kjaergard et al [<xref ref-type="bibr" rid="ref36">36</xref>] defined clinical trials with 1000 or more participants as large, and the studies in clinical medicine titled big/large, data/dataset generally have thousands of attributes, but only hundreds of samples [<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref39">39</xref>].</p>
            <p>For this paper, we reviewed the literature to determine the features of clinical big data and determine the methods used for manipulation and analysis of these data. This paper is focused on clinical medicine rather than general health care issues; therefore, we mainly reviewed the studies that appeared relevant to clinicians. We examined the selected studies to extract information on research interests, goals, and achievements, and the implemented methodologies. Our intention was not to conduct an exhaustive systematic review, but instead to enable a literature-based discussion of how the big data issue has been addressed in clinical medicine. Based on our findings, we discuss the challenges and limitations of analysis of large clinical datasets.</p>
            <table-wrap position="float" id="table1">
                <label>Table 1</label>
                <caption>
                    <p>Global growth of big data and computer science papers on big data.</p>
                </caption>
                <table width="576" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                    <col width="38" />
                    <col width="141" />
                    <col width="185" />
                    <col width="154" />
                    <thead>
                        <tr valign="bottom">
                            <td>Year</td>
                            <td>Data volume, ZB<sup>a,c</sup>
                            </td>
                            <td>Conference papers, CS<sup>b,c</sup>
                            </td>
                            <td>Journal papers, CS<sup>c</sup>
                            </td>
                        </tr>
                    </thead>
                    <tbody>
                        <tr valign="top">
                            <td>2009</td>
                            <td>1.5</td>
                            <td>12</td>
                            <td>7</td>
                        </tr>
                        <tr valign="top">
                            <td>2010</td>
                            <td>2</td>
                            <td>26</td>
                            <td>7</td>
                        </tr>
                        <tr valign="top">
                            <td>2011</td>
                            <td>2.5</td>
                            <td>32</td>
                            <td>23</td>
                        </tr>
                        <tr valign="top">
                            <td>2012</td>
                            <td>3</td>
                            <td>78</td>
                            <td>47</td>
                        </tr>
                        <tr valign="top">
                            <td>2015</td>
                            <td>8</td>
                            <td>?</td>
                            <td>?</td>
                        </tr>
                        <tr valign="top">
                            <td>2020</td>
                            <td>44</td>
                            <td>??</td>
                            <td>??</td>
                        </tr>
                    </tbody>
                </table>
                <table-wrap-foot>
                    <fn id="table1fn1">
                        <p>
                            <sup>a</sup>Data from <italic>oracle</italic> [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
                    </fn>
                    <fn id="table1fn2">
                        <p>
                            <sup>b</sup>Data from <italic>Research Trends</italic> [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
                    </fn>
                    <fn id="table1fn3">
                        <p>
                            <sup>c</sup>CS, computer science; ZB, zettabytes (1 zettabyte = 1000 terabytes = 10<sup>6</sup> petabytes = 10<sup>18</sup> gigabytes, GB).</p>
                    </fn>
                </table-wrap-foot>
            </table-wrap>
            <fig id="figure1" position="float">
                <label>Figure 1</label>
                <caption>
                    <p>A schematic of the issues surrounding storage and use of big data. Clinical big data, as well as big data in other disciplines, have been surrounded by a number of issues and challenges, including (but not limited to): generation, storage, curation, extraction, integration, analysis, visualization, etc. ANN: artificial neuron network; EMR: electronic medical record; MPP: massively parallel-processing; PCA: principle component analysis; ROI: return of investment; SVM: support vector machine.</p>
                </caption>
                <graphic xlink:href="medinform_v2i1e2_fig1.gif" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
            </fig>
        </sec>
        <sec sec-type="methods">
            <title> Methods</title>
            <p>We conducted a literature review to identify studies on big data in medicine, especially clinical medicine. We used different combinations of keywords to search PubMed, Science Direct, Web of Knowledge, and Google Scholar for literature of interest, mainly from the last 10 years. The key words were: &#34;big data medicine&#34;, &#34;large dataset medicine&#34;, &#8220;clinical big data&#8221;, &#8220;clinical large dataset&#8221;, &#8220;clinical data warehouse&#8221;, &#8220;clinical database&#8221;, &#8220;clinical data mining&#8221;, &#8220;biomedical big data&#8221;, &#8220;biomedical database&#8221;, &#8220;biomedical data warehouse&#8221;, &#8220;healthcare big data&#8221;, &#8220;healthcare database&#8221;, and &#8220;healthcare data warehouse&#8221;.</p>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <sec>
                <title>Big Data in Clinical Medicine</title>
                <p>Big data plays an important role in medical and clinical research and has been leveraged in clinically relevant studies. Major research institute centers and funding agencies have made large investments in the arena. For example, the National Institutes of Health recently committed US $100 million for the big data to Knowledge (BD2K) initiative [<xref ref-type="bibr" rid="ref40">40</xref>]. The BD2K defines &#8220;biomedical&#8221; big data as large datasets generated by research groups or individual investigators and as large datasets generated by aggregation of smaller datasets. The most well-known examples of medical big data are databases maintained by the Medicare and Healthcare Cost and Utilization Project (with over 100 million observations). One of the differences between medical big data and large datasets from other disciplines is that clinical big data are often collected based on protocols (ie, fixed forms) and therefore are relatively structured, partially due to the extraction process that simplify raw data as mentioned above. This feature can be traced back to the Framingham Heart Study [<xref ref-type="bibr" rid="ref41">41</xref>], which has followed a cohort in the town of Framingham, Massachusetts since 1948. Vast amounts of data have been collected through the Framingham Heart Study, and the analysis has informed our understanding of heart diseases, including the effects of diet, exercise, medications, and obesity on risk [<xref ref-type="bibr" rid="ref42">42</xref>]. There are many other clinical databases with different scopes, including but not limited to, prevalence and trend studies, risk factor studies, and genotype-phenotype studies.</p>
            </sec>
            <sec>
                <title>Prevalence and Trend Studies</title>
                <p>One of the major uses for clinical big data is in analysis of the prevalence or trends of a disease or phenotype among different populations. An early big data study evaluated a cohort consisting of 890,394 US veterans with diabetes followed from 2002 through 2006 [<xref ref-type="bibr" rid="ref43">43</xref>]. Bermejo-Sanchez et al [<xref ref-type="bibr" rid="ref44">44</xref>] observed 326 of the birth defect Amelia among 23 million live births, stillbirths, and fetal anomalies from 23 countries and 4 continents, and found the trend of higher prevalence of Amelia among younger mothers. Histological features that differ between chronic idiopathic inflammatory bowel disease and normality and between Crohn&#8217;s disease and ulcerative colitis were identified in 809 large bowel endoscopic biopsies [<xref ref-type="bibr" rid="ref45">45</xref>]. Kelly et al [<xref ref-type="bibr" rid="ref46">46</xref>] studied the prevalence of hip abnormalities of 8192 subjects with hemophilia A and B. Siregar et al [<xref ref-type="bibr" rid="ref47">47</xref>] performed a population-based study on patients after cardiac surgery in all 16 cardiothoracic surgery centers in the Netherlands. Elshazly et al [<xref ref-type="bibr" rid="ref48">48</xref>] examined 1.3 million US adults for patient-level discordance of non-high-density lipoprotein cholesterol and low-density lipoprotein cholesterol. Chan and McGarey [<xref ref-type="bibr" rid="ref49">49</xref>] summarize how large datasets can be analyzed to achieve population-based conclusions, specifically for determination of secular trends, health disparities, geographic variation, and evaluation of specific diseases and treatments. This paper also summarized the strengths and limitations of large-sized datasets and addressed issues such as missing data and bias. These issues will also be discussed in brief below.</p>
            </sec>
            <sec>
                <title>Risk Factor Studies</title>
                <p>Clinical big data can also be used to determine causality, effect, or association between risk factors and the disease of interest. Ursum et al [<xref ref-type="bibr" rid="ref50">50</xref>] examined the relationships between seroconversion and patient age with inflammatory effects of autoantibodies in 18,658 rheumatoid arthritis patients and controls, and showed that citrullinated proteins and peptides were more reliable markers for rheumatoid arthritis than was Immunoglobulin M rheumatoid factor. Ajdacic-Gross et al [<xref ref-type="bibr" rid="ref51">51</xref>] examined the data on 11,905 Swiss conscripts from 2003 for stuttering and found that there was no single overwhelming risk factor for stuttering, although premature birth and parental alcohol abuse appeared influential. Data collected on 14,433 patients from the 155 Veterans Administration medical centers in all 50 US states, Puerto Rico, and the District of Columbia were used to identify the alcohol dependence of medications [<xref ref-type="bibr" rid="ref52">52</xref>]. By analysis of 53,177 cases of contrast administration in 35,922 patients from the Radiology and Cardiac Catheterization Laboratory databases, an increase in contrast nephropathy was associated with use of sodium bicarbonate [<xref ref-type="bibr" rid="ref53">53</xref>]. Echocardiography and electrocardiogram-gated single-photon emission computed tomography traces for the evaluation of left ventricular ejection fraction were compared in 534 patients [<xref ref-type="bibr" rid="ref54">54</xref>]. Zhang et al [<xref ref-type="bibr" rid="ref55">55</xref>] examined clinical data of 16,135 adult patients and elucidated the relationships between glycemic, blood glucose level, and intake of insulin with mortality. Mitchel et al [<xref ref-type="bibr" rid="ref56">56</xref>] studied the effect of 2 types of insulin on 7720 patients selected from 8 million in UK. Kobayashi et al [<xref ref-type="bibr" rid="ref57">57</xref>] analyzed 19,070 records on right hemicolectomy from 3500 Japanese hospitals and successfully developed a risk model. It should be noted that in these studies, the terms of &#8220;association&#8221; and &#8220;causality&#8221; must be rigorously distinguished; most of the studies claimed association, whereas causality was rarely asserted.</p>
            </sec>
            <sec>
                <title>Genotype&#8211;Phenotype Studies</title>
                <p>With the advancement of genotyping technology, an increasing amount of risk-factor studies have attempted to assess association on the genetic level through evaluation of gene expression and/or genomic data obtained from patients and controls. For example, clinical and genetic data from 5700 patients who had been treated with warfarin were used to create an algorithm to estimate the appropriate dose [<xref ref-type="bibr" rid="ref58">58</xref>]. Causality of autism spectrum disorders has been investigated by analysis of 31,516 clinical cases on copy number variation in patients versus 13,696 controls [<xref ref-type="bibr" rid="ref59">59</xref>]. Koefoed et al [<xref ref-type="bibr" rid="ref60">60</xref>] made efforts to assess the effects of signal transmission and calculated all combinations of three genotypes from 803 single-nucleotide polymorphism (SNP) genotypes (2.3 billion combinations) for 1355 controls and 607 patients with bipolar disorder. These studies are similar to risk-factor studies, yet often the big data is significantly larger in volume due in genetic analyses than in risk-factor studies.</p>
            </sec>
            <sec>
                <title>Method Development Studies</title>
                <p>A number of studies have taken advantage of clinical big data to establish new methods or techniques, or to develop new tools to enable analysis of data and decision making. In a typical example, Hill et al [<xref ref-type="bibr" rid="ref61">61</xref>] designed an interface to use clinical data to evaluate risk ratios for various diseases to aid in evaluation of treatment options. Liu et al [<xref ref-type="bibr" rid="ref62">62</xref>, <xref ref-type="bibr" rid="ref63">63</xref>] have used large-scale data analysis to optimize diagnosis of breast cancer from full-field digital mammography images. Lin et al [<xref ref-type="bibr" rid="ref64">64</xref>] made efforts to formalize the phenotype variable in the database Genotypes and Phenotypes. Stephen et al [<xref ref-type="bibr" rid="ref65">65</xref>] developed an algorithm to categorize pediatric patients presenting with respiratory distress into different subtypes using clinical variables from a clinical data warehouse. Clinical data warehouses or databases have been created from radiotherapy clinical trial data [<xref ref-type="bibr" rid="ref66">66</xref>], gene mutations [<xref ref-type="bibr" rid="ref67">67</xref>], cancer patient data [<xref ref-type="bibr" rid="ref68">68</xref>, <xref ref-type="bibr" rid="ref69">69</xref>], kidney disease patient data [<xref ref-type="bibr" rid="ref70">70</xref>], and gastrointestinal surgery patient data [<xref ref-type="bibr" rid="ref71">71</xref>]. Additionally, studies have focused on personalized big data [<xref ref-type="bibr" rid="ref72">72</xref>], citizen-centric health care versus patient-centric health care [<xref ref-type="bibr" rid="ref72">72</xref>, <xref ref-type="bibr" rid="ref73">73</xref>], medication orders [<xref ref-type="bibr" rid="ref74">74</xref>, <xref ref-type="bibr" rid="ref75">75</xref>], and decision making and information management/retrieval in general [<xref ref-type="bibr" rid="ref75">75</xref>-<xref ref-type="bibr" rid="ref80">80</xref>]. The dramatic increase in the number of studies with large scope in the past few years indicates an increasing desire of researchers to manipulate clinical big data; &#8220;big data-assisted clinics&#8221; may be expected in the near future.</p>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>Diversity of Data in Clinical Medicine</title>
                <p>The huge body of medical research that has been performed using large datasets demonstrates the broad spectrum of data resources used and shows that the structure of the medical dataset depends on the research question. Data from different subareas of medical research have broad diversity in terms of numbers of entries, types of data stored (or levels), dimensionality, and sample size [<xref ref-type="bibr" rid="ref81">81</xref>]. Datasets obviously differ greatly in size: gene expression datasets derived from high-throughput microarray and next-generation sequencing technologies, such as those that analyze SNPs and copy number variations, tend to be massive, whereas clinical trial dataset are not as big. Phan et al [<xref ref-type="bibr" rid="ref82">82</xref>] suggested that data in medicine be divided into four different levels: the molecular level (eg, genome data), cellular and tissue level (eg, stem cell differentiation data), clinical and patient level (eg, clinical trial data), and biomedical knowledge base level (ie, a comprehensive data collection). Additionally, data tend to have different levels of dimensionality (ie, number of attributes or parameters, <italic>p</italic>) and sample sizes (ie, number of records/entries, n). Typical datasets fall into one of three categories, as summarized by Sinha et al [<xref ref-type="bibr" rid="ref83">83</xref>]: large n, small <italic>p</italic>; small n, large <italic>p</italic>; and large n, large <italic>p</italic>. Thanks to advancements in computational technology, most algorithms can handle low-dimensional data (ie, large n, small <italic>p</italic>) without encountering significant difficulty.</p>
                <p>Most clinical data, however, is high-dimensional (ie, small n, large <italic>p</italic> or large n, large <italic>p</italic>) due to a limited number of patients. One typical example comes from a study of 69 Broca&#8217;s aphasic patients (ie, n=69) who were tested with nearly 6000 stimulus sentences (ie, <italic>p</italic>~6000) [<xref ref-type="bibr" rid="ref84">84</xref>]. With similar dimensionality, Mitchell et al [<xref ref-type="bibr" rid="ref39">39</xref>] studied bipolar disorder where the sample consisted of only 217 patients. For high-dimensional data, each point, sample, or element is described by many attributes [<xref ref-type="bibr" rid="ref83">83</xref>] with the involvement of the &#8220;curse of dimensionality&#8221; [<xref ref-type="bibr" rid="ref85">85</xref>]. Because high-dimensional data are sparse in dimensions, most classification or clustering approaches do not work well because the increase in problem space reduces the overall density of data samples. To solve this problem, compression methods and significance testing are usually used to either reduce the dimensionality or select relevant features before data analysis by some sort of data preprocessing [<xref ref-type="bibr" rid="ref83">83</xref>].</p>
            </sec>
            <sec>
                <title>Methods for Manipulation of Clinical Big Data</title>
                <sec>
                    <title> Technologies for Data Storage and Handling</title>
                    <p>Due to the massiveness and complexity of big data, nonrelational and distributed databases such as Apache Hadoop [<xref ref-type="bibr" rid="ref86">86</xref>], Google BigTable [<xref ref-type="bibr" rid="ref87">87</xref>], NoSQL [<xref ref-type="bibr" rid="ref88">88</xref>], and massively parallel-processing databases are used rather than traditional relational databases to store data. A large number of biostatistics software packages have been used to handle large clinical datasets, some of which enabled the features of cloud-based or distributed computing. Popular software packages include, but are not limited to, SAS [<xref ref-type="bibr" rid="ref36">36</xref>, <xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref53">53</xref>], Mplus [<xref ref-type="bibr" rid="ref51">51</xref>], SPSS [<xref ref-type="bibr" rid="ref36">36</xref>, <xref ref-type="bibr" rid="ref39">39</xref>, <xref ref-type="bibr" rid="ref45">45</xref>], PP-VLAM [<xref ref-type="bibr" rid="ref89">89</xref>], Stata [<xref ref-type="bibr" rid="ref90">90</xref>], and R [<xref ref-type="bibr" rid="ref91">91</xref>]. These technologies and tools greatly facilitate the handling of big data.</p>
                </sec>
                <sec>
                    <title>Methodologies for Data Preprocessing</title>
                    <p>Clinical raw big data can be highly diverse and uninformative without preprocessing. Extraction of a diagnosis from raw computer tomography data is an example of one of the predominant manners in which clinical big data are preprocessed. This type of processes relies on a specialist&#8217;s personal expertise and can be a source of bias. Most early analyses of big data, including that collected by the Framingham Heart Study adopted some form of preprocessing; therefore, challenges exist in curation [<xref ref-type="bibr" rid="ref6">6</xref>]. As an alternative to expert preprocessing, computational algorithms or statistical approaches, including compression methods, significance testing, or normalization [<xref ref-type="bibr" rid="ref92">92</xref>] can be implemented to preprocess raw big data. This methodology may also introduce bias and can cause uncertainty problems during data integration.</p>
                    <p>In some scenarios, visualization can be a part of data preprocessing (as well as result exhibition). Typical examples in this regard include the use of heat maps [<xref ref-type="bibr" rid="ref93">93</xref>], gene alignments [<xref ref-type="bibr" rid="ref94">94</xref>], protein structure visualization [<xref ref-type="bibr" rid="ref95">95</xref>], scatterplot matrix, tree visualization, network visualization, parallel coordinates, stacked graphs, etc. When the big data of interest are scattered or stored at different resources, data integration [<xref ref-type="bibr" rid="ref96">96</xref>, <xref ref-type="bibr" rid="ref97">97</xref>] and federation [<xref ref-type="bibr" rid="ref98">98</xref>] is an important phase during data preprocessing. Approaches such as the Information Manifold [<xref ref-type="bibr" rid="ref97">97</xref>], which allows browsing and querying of multiple networked information sources, can provide solutions to uncertainty problems after data integration and mapping [<xref ref-type="bibr" rid="ref99">99</xref>].</p>
                </sec>
                <sec>
                    <title>Statistical Approaches to Data Analysis</title>
                    <p>A number of popular statistical methods have been implemented in clinical data analysis. The most common include linear regression and logistic regression [<xref ref-type="bibr" rid="ref30">30</xref>], latent class analysis [<xref ref-type="bibr" rid="ref100">100</xref>], principle component analysis [<xref ref-type="bibr" rid="ref101">101</xref>], and classification and regression trees [<xref ref-type="bibr" rid="ref100">100</xref>]. Additionally, logarithmic and square-root transformations [<xref ref-type="bibr" rid="ref58">58</xref>], naive Bayes methods [<xref ref-type="bibr" rid="ref102">102</xref>], decision trees [<xref ref-type="bibr" rid="ref103">103</xref>], neural networks [<xref ref-type="bibr" rid="ref104">104</xref>], support vector machines [<xref ref-type="bibr" rid="ref105">105</xref>], and hidden Markov models [<xref ref-type="bibr" rid="ref83">83</xref>] are also used to study problems in medical data.</p>
                    <p>When a dataset is not overly complicated, a single test (eg, a simple Student&#8217;s <italic>t</italic> test) should be powerful enough to reject a null hypothesis, and single hypothesis testing is the methodology to adopt [<xref ref-type="bibr" rid="ref106">106</xref>]. Sometimes one cannot establish the significance of a hypothesis until different statistical tests have been applied to the same dataset. Multiple testing is often used to identify correlations that deserve further investigation [<xref ref-type="bibr" rid="ref107">107</xref>]. Algorithms for false discovery rate [<xref ref-type="bibr" rid="ref108">108</xref>] and family-wise error rate [<xref ref-type="bibr" rid="ref109">109</xref>] calculation have been implemented for multiple testing in studies on gene expression data and datasets with similar levels of complexity.</p>
                </sec>
            </sec>
            <sec>
                <title>Challenges and Limitations of Use of Clinical Big Data</title>
                <sec>
                    <title>Overview</title>
                    <p>Big data itself has many limitations. These limitations include &#8220;adequacy, accuracy, completeness, nature of the reporting sources, and other measures of the quality of the data&#8221;, as summarized previously [<xref ref-type="bibr" rid="ref110">110</xref>]. The consequences of these limitations are succinctly summarized in the book titled &#8220;Models. Behaving. Badly.&#8221; [<xref ref-type="bibr" rid="ref111">111</xref>]. Modeling can often lead to a biased statistical correlation or inference, sometimes known as a &#8220;false discovery&#8221;. Clinical big data users face a large spectrum of challenges, including but not limited to sample size, selection bias, interpretation problem, missing values, dependence problems, and data handling methodologies.</p>
                </sec>
                <sec>
                    <title>Sample Size</title>
                    <p>One of the counterintuitive challenges in analysis of big data clinical datasets is that sometimes the sample size is not as big, compared with the number of attributes to allow statistically significant analysis. Population survey methods are sometimes adopted because these methods can provide larger datasets. However, the authenticity and accuracy of this type of data are arguably limited; hence, survey methods cannot be reliably used to produce an adequate description or prediction [<xref ref-type="bibr" rid="ref39">39</xref>].</p>
                </sec>
                <sec>
                    <title>Selection Bias</title>
                    <p>Any dataset is a selection of data rather than the whole data world; therefore, selection bias is a very real limitation [<xref ref-type="bibr" rid="ref112">112</xref>] even if the sample size is big. In that sense, all studies of clinical data have this limitation to some degree [<xref ref-type="bibr" rid="ref39">39</xref>].</p>
                </sec>
                <sec>
                    <title>Interpretation Problem</title>
                    <p>Gebregziabher et al [<xref ref-type="bibr" rid="ref43">43</xref>] stated that the datasets generated through many translational research projects to answer questions of public health interest are not self-explanatory due to complexity and inadequate description/documentation of the dataset's parameters and associated metadata. The methodologies for interpreting the data can therefore be subject to all sorts of philosophical debate. For example, the data may not be totally na&#239;ve or objective and interpretation may be biased by subjective assumptions and/or manipulations by individual analysts.</p>
                </sec>
                <sec>
                    <title>Missing Values</title>
                    <p>It is common problem that large datasets have missing values, and in many cases the problem can be significant [<xref ref-type="bibr" rid="ref44">44</xref>]. A typical example is the Framingham Heart Study where data on serum uric acid are largely missing. Additionally, the covariates (ie, attributes) may not fully capture the degree of risk for patients and may cause uncertainty in results [<xref ref-type="bibr" rid="ref53">53</xref>].</p>
                </sec>
                <sec>
                    <title>Dependence Problems</title>
                    <p>One issue that has been often neglected is the dependence of data. Dependence between either attributes or samples in datasets can cause the degrees of freedom to decrease and/or some statistical principles to no longer apply. Examples of this are found when the same patients are evaluated multiple times through follow-up and when correlations in gene expression are drawn based on samples from different patients treated with similar medications [<xref ref-type="bibr" rid="ref83">83</xref>]. As many statistical methods do not account for dependence, results from these tests may be unreliable if this issue is not properly addressed before the data analysis.</p>
                </sec>
                <sec>
                    <title> Data Handling Methodologies</title>
                    <p>Effective processing of big data has always been a challenge. One must consider all the aspects of the dataset, including collection, curation, extraction, integration, interpretation, imputation, and selection of appropriate statistical methods, during processing and analysis. It has been claimed that analyses of large datasets are often suboptimal due to the researcher&#8217;s lack of knowledge of the available tools and methodologies [<xref ref-type="bibr" rid="ref83">83</xref>]. On the other hand, algorithms to handle big data are also underdeveloped to some extent and deserve more attention [<xref ref-type="bibr" rid="ref113">113</xref>].</p>
                </sec>
            </sec>
            <sec>
                <title> Conclusions</title>
                <p>This paper reviewed studies that analyzed clinical big data and that discuss issues related to data storage and analysis. Big data is becoming a common feature of biological and clinical studies. Today, a single biophysical researcher can generate terabytes of data in hours. Over the last decade, clinical datasets have grown incredibly in size, mostly due to use of modern technologies for collection and recording of data. Researchers who use clinical big data face multiple challenges, and the data itself has limitations. It is imperative that methodologies for data analysis keep pace with our ability to collect and store data.</p>
            </sec>
        </sec>
    </body>
    <back>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">BD2K</term>
                    <def>
                        <p>Big Data to Knowledge</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb2">CS</term>
                    <def>
                        <p>computer science</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb3">SNP</term>
                    <def>
                        <p>single-nucleotide polymorphism</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb4">ZB</term>
                    <def>
                        <p>zettabytes</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <fn-group>
            <fn fn-type="con">
                <p>WW did the search and primary review of the literature cited in this article and wrote the manuscript. EK guided the research and critically revised the manuscript.</p>
            </fn>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wenkebach</surname>
                            <given-names>U</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pollwein</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Finsterer</surname>
                            <given-names>U</given-names>
                        </name>
                    </person-group>
                    <article-title>Visualization of large datasets in intensive care</article-title>
                    <source>Proc Annu Symp Comput Appl Med Care</source>
                    <year>1992</year>
                    <fpage>18</fpage>
                    <lpage>22</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/1482864" />
                    </comment>
                    <pub-id pub-id-type="medline">1482864</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2248022</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hua</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fu</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>A distributed big data storage and data mining framework for solar-generated electricity quantity forecasting</article-title>
                    <source>Proc. SPIE 8333, Photonics and Optoelectronics Meetings (POEM)</source>
                    <year>2011</year>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://proceedings.spiedigitallibrary.org/proceeding.aspx?articleid=1200314" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1117/12.919640</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>JZ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>YJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hua</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fu</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>A distributed big data storage and data mining framework for solar-generated electricity quantity forecasting</article-title>
                    <source>Proc. SPIE 8333, Photonics and Optoelectronics Meetings (POEM) 2011</source>
                    <year>2011</year>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://proceedings.spiedigitallibrary.org/proceeding.aspx?articleid=1200314" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1117/12.919640</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Fu</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>ZH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>JC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>He</surname>
                            <given-names>MQ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>JZ</given-names>
                        </name>
                    </person-group>
                    <article-title>Distributed storage system big data mining based on HPC application-A solar photovoltaic forecasting system practice</article-title>
                    <source>Information-Tokyo</source>
                    <year>2012</year>
                    <volume>15</volume>
                    <issue>9</issue>
                    <fpage>3749</fpage>
                    <lpage>3755</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Brinkmann</surname>
                            <given-names>BH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bower</surname>
                            <given-names>MR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Stengel</surname>
                            <given-names>KA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Worrell</surname>
                            <given-names>GA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Stead</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Large-scale electrophysiology: acquisition, compression, encryption, and storage of big data</article-title>
                    <source>J Neurosci Methods</source>
                    <year>2009</year>
                    <volume>180</volume>
                    <issue>1</issue>
                    <fpage>185</fpage>
                    <lpage>192</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19427545" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1016/j.jneumeth.2009.03.022</pub-id>
                    <pub-id pub-id-type="medline">19427545</pub-id>
                    <pub-id pub-id-type="pii">S0165-0270(09)00157-5</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2720128</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Howe</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Costanzo</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fey</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gojobori</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hannick</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hide</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hill</surname>
                            <given-names>DP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kania</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schaeffer</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>St Pierre</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Twigger</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>White</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rhee</surname>
                            <given-names>SY</given-names>
                        </name>
                    </person-group>
                    <article-title>Big data: The future of biocuration</article-title>
                    <source>Nature</source>
                    <year>2008</year>
                    <volume>455</volume>
                    <issue>7209</issue>
                    <fpage>47</fpage>
                    <lpage>50</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18769432" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1038/455047a</pub-id>
                    <pub-id pub-id-type="medline">18769432</pub-id>
                    <pub-id pub-id-type="pii">455047a</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2819144</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Calatroni</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Roggen</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Troster</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Collection and curation of a large reference dataset for activity recognition</article-title>
                    <source>Ieee Sys Man Cybern 2011</source>
                    <year>2011</year>
                    <fpage>30</fpage>
                    <lpage>35</lpage>
                    <pub-id pub-id-type="doi">10.1109/ICSMC.2011.6083638</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>O'Driscoll</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Daugelaite</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sleator</surname>
                            <given-names>RD</given-names>
                        </name>
                    </person-group>
                    <article-title>'Big data', Hadoop and cloud computing in genomics</article-title>
                    <source>J Biomed Inform</source>
                    <year>2013</year>
                    <volume>46</volume>
                    <issue>5</issue>
                    <fpage>774</fpage>
                    <lpage>781</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.jbi.2013.07.001</pub-id>
                    <pub-id pub-id-type="medline">23872175</pub-id>
                    <pub-id pub-id-type="pii">S1532-0464(13)00100-7</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lee</surname>
                            <given-names>KK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tang</surname>
                            <given-names>WC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Choi</surname>
                            <given-names>KS</given-names>
                        </name>
                    </person-group>
                    <article-title>Alternatives to relational database: comparison of NoSQL and XML approaches for clinical data storage</article-title>
                    <source>Comput Methods Programs Biomed</source>
                    <year>2013</year>
                    <volume>110</volume>
                    <issue>1</issue>
                    <fpage>99</fpage>
                    <lpage>109</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.cmpb.2012.10.018</pub-id>
                    <pub-id pub-id-type="medline">23177219</pub-id>
                    <pub-id pub-id-type="pii">S0169-2607(12)00280-5</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Beyer</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Douglas</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <source>The Importance of &#039;Big Data&#039;: A Definition</source>
                    <access-date>2013-08-25</access-date>
                    <comment>2012<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.gartner.com/it-glossary/big-data/">http://www.gartner.com/it-glossary/big-data/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6J7x1gswQ</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Olbers</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>M&#252;ller</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Willebrand</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Inverse technique analysis of a large data set</article-title>
                    <source>Physics of the Earth and Planetary Interiors</source>
                    <year>1976</year>
                    <volume>12</volume>
                    <issue>2-3</issue>
                    <fpage>248</fpage>
                    <lpage>252</lpage>
                    <pub-id pub-id-type="doi">10.1016/0031-9201(76)90054-6</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Byth</surname>
                            <given-names>DE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Eisemann</surname>
                            <given-names>RL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>de Lacy</surname>
                            <given-names>IH</given-names>
                        </name>
                    </person-group>
                    <article-title>Two-way pattern analysis of a large data set to evaluate genotypic adaptation</article-title>
                    <source>Heredity</source>
                    <year>1976</year>
                    <volume>37</volume>
                    <issue>2</issue>
                    <fpage>215</fpage>
                    <lpage>230</lpage>
                    <pub-id pub-id-type="doi">10.1038/Hdy.1976.84</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chaudron</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Assenlineau</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Renon</surname>
                            <given-names>H</given-names>
                        </name>
                    </person-group>
                    <article-title>A new modification of the Redlich&#8212;Kwong equation of state based on the analysis of a large set of pure component data</article-title>
                    <source>Chemical Engineering Science</source>
                    <year>1973</year>
                    <volume>28</volume>
                    <issue>3</issue>
                    <fpage>839</fpage>
                    <lpage>846</lpage>
                    <pub-id pub-id-type="doi">10.1016/0009-2509(77)80018-3</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Graefe</surname>
                            <given-names>JF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wood</surname>
                            <given-names>RW</given-names>
                        </name>
                    </person-group>
                    <article-title>Dealing with large data sets</article-title>
                    <source>Neurotoxicol Teratol</source>
                    <year>1990</year>
                    <volume>12</volume>
                    <issue>5</issue>
                    <fpage>449</fpage>
                    <lpage>454</lpage>
                    <pub-id pub-id-type="medline">2247031</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ackerman</surname>
                            <given-names>MJ</given-names>
                        </name>
                    </person-group>
                    <article-title>Big data</article-title>
                    <source>J Med Pract Manage</source>
                    <year>2012</year>
                    <volume>28</volume>
                    <issue>2</issue>
                    <fpage>153</fpage>
                    <lpage>154</lpage>
                    <pub-id pub-id-type="medline">23167038</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Trelles</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Prins</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Snir</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jansen</surname>
                            <given-names>RC</given-names>
                        </name>
                    </person-group>
                    <article-title>Big data, but are we ready?</article-title>
                    <source>Nat Rev Genet</source>
                    <year>2011</year>
                    <month>03</month>
                    <volume>12</volume>
                    <issue>3</issue>
                    <fpage>224</fpage>
                    <pub-id pub-id-type="doi">10.1038/nrg2857-c1</pub-id>
                    <pub-id pub-id-type="medline">21301471</pub-id>
                    <pub-id pub-id-type="pii">nrg2857-c1</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>analysis</surname>
                            <given-names>ATK</given-names>
                        </name>
                    </person-group>
                    <source>Big Data and the Creative Destruction of Today&#039;s Business Models</source>
                    <access-date>2013-11-25</access-date>
                    <comment>2013<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.atkearney.com/strategic-it/ideas-insights/article/-/asset_publisher/LCcgOeS4t85g/content/big-data-and-the-creative-destruction-of-today-s-business-models/10192">http://www.atkearney.com/strategic-it/ideas-insights/article/-/asset_publisher/LCcgOeS4t85g/content/big-data-and-the-creative-destruction-of-today-s-business-models/10192</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6LOmyDbvg</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Halevi</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Moed</surname>
                            <given-names>HF</given-names>
                        </name>
                    </person-group>
                    <source>The Evolution of Big Data as a Research and Scientific Topic: Overview of the Literature</source>
                    <access-date>2013-11-25</access-date>
                    <comment>2012<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.researchtrends.com/issue-30-september-2012/the-evolution-of-big-data-as-a-research-and-scientific-topic-overview-of-the-literature/">http://www.researchtrends.com/issue-30-september-2012/the-evolution-of-big-data-as-a-research-and-scientific-topic-overview-of-the-literature/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6LOn9qSGu</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hutchins</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ihler</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Smyth</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Probabilistic analysis of a large-scale urban traffic sensor data set</article-title>
                    <source>Knowledge Discovery from Sensor Data</source>
                    <year>2010</year>
                    <volume>5840</volume>
                    <fpage>94</fpage>
                    <lpage>114</lpage>
                    <pub-id pub-id-type="doi">10.1007/978-3-642-12519-5_6</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Sleutel</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>De Neve</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Beheydt</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hofman</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Regional simulation of long-term organic carbon stock changes in cropland soils using the DNDC model: 1. Large-scale model validation against a spatially explicit data set</article-title>
                    <source>Soil Use Manage</source>
                    <year>2006</year>
                    <volume>22</volume>
                    <issue>4</issue>
                    <fpage>342</fpage>
                    <lpage>351</lpage>
                    <pub-id pub-id-type="doi">10.1111/j.1475-2743.2006.00045.x</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cianchini</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>De Santis</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Balasis</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mandea</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Qamili</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Entropy based analysis of satellite magnetic data for searching possible electromagnetic signatures due to big earthquakes</article-title>
                    <source>Ma Comput Sci Eng</source>
                    <year>2009</year>
                    <fpage>29</fpage>
                    <lpage>35</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.earth-prints.org/handle/2122/5025" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Issenberg</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>How President Obama's campaign used big data to rally indicidual voters</article-title>
                    <source>Technol Rev</source>
                    <year>2013</year>
                    <volume>116</volume>
                    <issue>1</issue>
                    <fpage>38</fpage>
                    <lpage>49</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://web.ebscohost.com.ezproxy.stanford.edu/ehost/detail?sid=d0465494-31c7-46fc-9d50-c1a8a0afa1d3%40sessionmgr4005&#38;vid=1&#38;hid=4114&#38;bdata=JnNpdGU9ZWhvc3QtbGl2ZSZzY29wZT1zaXRl#db=bth&#38;AN=89156687" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kessler</surname>
                            <given-names>RC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brown</surname>
                            <given-names>RL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Broman</surname>
                            <given-names>CL</given-names>
                        </name>
                    </person-group>
                    <article-title>Sex differences in psychiatric help-seeking: evidence from four large-scale surveys</article-title>
                    <source>J Health Soc Behav</source>
                    <year>1981</year>
                    <month>03</month>
                    <volume>22</volume>
                    <issue>1</issue>
                    <fpage>49</fpage>
                    <lpage>64</lpage>
                    <pub-id pub-id-type="medline">7240706</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lewis</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Moneyball: The Art of Winning an Unfair Game: W</article-title>
                    <source>Moneyball: The Art of Winning an Unfair Game</source>
                    <year>2003</year>
                    <publisher-loc>New York, New York</publisher-loc>
                    <publisher-name>W. W. Norton &#38; Company</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ekins</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Williams</surname>
                            <given-names>AJ</given-names>
                        </name>
                    </person-group>
                    <article-title>When pharmaceutical companies publish large datasets: an abundance of riches or fool's gold?</article-title>
                    <source>Drug Discov Today</source>
                    <year>2010</year>
                    <volume>15</volume>
                    <issue>19-20</issue>
                    <fpage>812</fpage>
                    <lpage>815</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.drudis.2010.08.010</pub-id>
                    <pub-id pub-id-type="medline">20732447</pub-id>
                    <pub-id pub-id-type="pii">S1359-6446(10)00270-9</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Grimley Evans</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tallis</surname>
                            <given-names>RC</given-names>
                        </name>
                    </person-group>
                    <article-title>A new beginning for care for elderly people?</article-title>
                    <source>BMJ</source>
                    <year>2001</year>
                    <volume>322</volume>
                    <issue>7290</issue>
                    <fpage>807</fpage>
                    <lpage>808</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/11290619" />
                    </comment>
                    <pub-id pub-id-type="medline">11290619</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1119992</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Jee</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kim</surname>
                            <given-names>GH</given-names>
                        </name>
                    </person-group>
                    <article-title>Potentiality of big data in the medical sector: focus on how to reshape the healthcare system</article-title>
                    <source>Healthc Inform Res</source>
                    <year>2013</year>
                    <volume>19</volume>
                    <issue>2</issue>
                    <fpage>79</fpage>
                    <lpage>85</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.e-hir.org/journal/viewJournal.html?year=2013&#38;vol=019&#38;num=02&#38;page=79" />
                    </comment>
                    <pub-id pub-id-type="doi">10.4258/hir.2013.19.2.79</pub-id>
                    <pub-id pub-id-type="medline">23882412</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3717441</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Murdoch</surname>
                            <given-names>TB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Detsky</surname>
                            <given-names>AS</given-names>
                        </name>
                    </person-group>
                    <article-title>The inevitable application of big data to health care</article-title>
                    <source>JAMA</source>
                    <year>2013</year>
                    <volume>309</volume>
                    <issue>13</issue>
                    <fpage>1351</fpage>
                    <lpage>1352</lpage>
                    <pub-id pub-id-type="doi">10.1001/jama.2013.393</pub-id>
                    <pub-id pub-id-type="medline">23549579</pub-id>
                    <pub-id pub-id-type="pii">1674245</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Toga</surname>
                            <given-names>AW</given-names>
                        </name>
                    </person-group>
                    <article-title>The clinical value of large neuroimaging data sets in Alzheimer's disease</article-title>
                    <source>Neuroimaging Clin N Am</source>
                    <year>2012</year>
                    <volume>22</volume>
                    <issue>1</issue>
                    <fpage>107</fpage>
                    <lpage>118, ix</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22284737" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1016/j.nic.2011.11.008</pub-id>
                    <pub-id pub-id-type="medline">22284737</pub-id>
                    <pub-id pub-id-type="pii">S1052-5149(11)00178-X</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3555557</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bakke</surname>
                            <given-names>PS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhu</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gulsvik</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kong</surname>
                            <given-names>X</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Agusti</surname>
                            <given-names>AG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Calverley</surname>
                            <given-names>PM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Donner</surname>
                            <given-names>CF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Levy</surname>
                            <given-names>RD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Make</surname>
                            <given-names>BJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Par&#233;</surname>
                            <given-names>PD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rennard</surname>
                            <given-names>SI</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Vestbo</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wouters</surname>
                            <given-names>EF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Anderson</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lomas</surname>
                            <given-names>DA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Silverman</surname>
                            <given-names>EK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pillai</surname>
                            <given-names>SG</given-names>
                        </name>
                    </person-group>
                    <article-title>Candidate genes for COPD in two large data sets</article-title>
                    <source>Eur Respir J</source>
                    <year>2011</year>
                    <volume>37</volume>
                    <issue>2</issue>
                    <fpage>255</fpage>
                    <lpage>263</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://erj.ersjournals.com/cgi/pmidlookup?view=long&#38;pmid=20562129" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1183/09031936.00091709</pub-id>
                    <pub-id pub-id-type="medline">20562129</pub-id>
                    <pub-id pub-id-type="pii">09031936.00091709</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Solomon</surname>
                            <given-names>BD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nguyen</surname>
                            <given-names>AD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bear</surname>
                            <given-names>KA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wolfsberg</surname>
                            <given-names>TG</given-names>
                        </name>
                    </person-group>
                    <article-title>Clinical genomic database</article-title>
                    <source>Proc Natl Acad Sci U S A</source>
                    <year>2013</year>
                    <volume>110</volume>
                    <issue>24</issue>
                    <fpage>9851</fpage>
                    <lpage>9855</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&#38;pmid=23696674" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1073/pnas.1302575110</pub-id>
                    <pub-id pub-id-type="medline">23696674</pub-id>
                    <pub-id pub-id-type="pii">1302575110</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3683745</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Liu</surname>
                            <given-names>XL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Du</surname>
                            <given-names>JP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>WZ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zuo</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Han</surname>
                            <given-names>ZM</given-names>
                        </name>
                    </person-group>
                    <article-title>Data warehousing for data mining based on Olap technology</article-title>
                    <source>Ciict 2008: Proceedings of China-Ireland International Conference on Information and Communications Technologies</source>
                    <year>2008</year>
                    <conf-name>China-Ireland International Conference on Information and Communications Technologies</conf-name>
                    <conf-date>26-28 Sept. 2008</conf-date>
                    <conf-loc>Beijing, China</conf-loc>
                    <fpage>176</fpage>
                    <lpage>79</lpage>
                    <pub-id pub-id-type="doi">10.1049/cp:20080786</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lohr</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <source>The New York Times</source>
                    <year>2012</year>
                    <comment>The Age of Big Data<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.nytimes.com/2012/02/12/sunday-review/big-datas-impact-in-the-world.html?pagewanted=1&#38;_r=0">http://www.nytimes.com/2012/02/12/sunday-review/big-datas-impact-in-the-world.html?pagewanted=1&#38;_r=0</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6J7xJAwId</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref34">
                <label>34</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>McCann</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <source>EHR Boosts ROI</source>
                    <access-date>2013-11-25</access-date>
                    <comment>2013<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.healthcareitnews.com/news/ehr-boost-roi-revenue-medical-group">http://www.healthcareitnews.com/news/ehr-boost-roi-revenue-medical-group</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6LOnNYQHV</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref35">
                <label>35</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>group</surname>
                            <given-names>CIW</given-names>
                        </name>
                    </person-group>
                    <source>EMR Benefits and Return on Investment Categories</source>
                    <access-date>2013-11-25</access-date>
                    <comment>2008<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.informatics-review.com/wiki/index.php/EMR_Benefits_and_Return_on_Investment_Categories">http://www.informatics-review.com/wiki/index.php/EMR_Benefits_and_Return_on_Investment_Categories</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6LOndM19u</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref36">
                <label>36</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kjaergard</surname>
                            <given-names>LL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Villumsen</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gluud</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>Reported methodologic quality and discrepancies between large and small randomized trials in meta-analyses</article-title>
                    <source>Ann Intern Med</source>
                    <year>2001</year>
                    <month>12</month>
                    <day>4</day>
                    <volume>135</volume>
                    <issue>11</issue>
                    <fpage>982</fpage>
                    <lpage>989</lpage>
                    <pub-id pub-id-type="medline">11730399</pub-id>
                    <pub-id pub-id-type="pii">200112040-00010</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref37">
                <label>37</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mancia</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Omboni</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ravogli</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Parati</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zanchetti</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Ambulatory blood pressure monitoring in the evaluation of antihypertensive treatment: additional information from a large data base</article-title>
                    <source>Blood Press</source>
                    <year>1995</year>
                    <volume>4</volume>
                    <issue>3</issue>
                    <fpage>148</fpage>
                    <lpage>156</lpage>
                    <pub-id pub-id-type="medline">7670648</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref38">
                <label>38</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Reichelt</surname>
                            <given-names>JG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Heimdal</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>M&#248;ller</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dahl</surname>
                            <given-names>AA</given-names>
                        </name>
                    </person-group>
                    <article-title>BRCA1 testing with definitive results: a prospective study of psychological distress in a large clinic-based sample</article-title>
                    <source>Familial Cancer</source>
                    <year>2002</year>
                    <volume>3</volume>
                    <issue>1</issue>
                    <fpage>21</fpage>
                    <lpage>28</lpage>
                    <pub-id pub-id-type="doi">10.1023/B:FAME.0000026820.32469.4a</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref39">
                <label>39</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mitchell</surname>
                            <given-names>PB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Johnston</surname>
                            <given-names>AK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Corry</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ball</surname>
                            <given-names>JR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Malhi</surname>
                            <given-names>GS</given-names>
                        </name>
                    </person-group>
                    <article-title>Characteristics of bipolar disorder in an Australian specialist outpatient clinic: comparison across large datasets</article-title>
                    <source>Aust N Z J Psychiatry</source>
                    <year>2009</year>
                    <volume>43</volume>
                    <issue>2</issue>
                    <fpage>109</fpage>
                    <lpage>117</lpage>
                    <pub-id pub-id-type="doi">10.1080/00048670802607220</pub-id>
                    <pub-id pub-id-type="medline">19153918</pub-id>
                    <pub-id pub-id-type="pii">907921875</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref40">
                <label>40</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>NHGRI</collab>
                    </person-group>
                    <source>Request for Information (RFI): Input on Development of Analysis MethodsSoftware for Big Data</source>
                    <access-date>2013-08-27</access-date>
                    <comment>2013<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://grants.nih.gov/grants/guide/notice-files/NOT-HG-13-014.html">http://grants.nih.gov/grants/guide/notice-files/NOT-HG-13-014.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6JB6Y33gd</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref41">
                <label>41</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wolf</surname>
                            <given-names>PA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Abbott</surname>
                            <given-names>RD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kannel</surname>
                            <given-names>WB</given-names>
                        </name>
                    </person-group>
                    <article-title>Atrial fibrillation as an independent risk factor for stroke: the Framingham Study</article-title>
                    <source>Stroke</source>
                    <year>1991</year>
                    <volume>22</volume>
                    <issue>8</issue>
                    <fpage>983</fpage>
                    <lpage>988</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://stroke.ahajournals.org/cgi/pmidlookup?view=long&#38;pmid=1866765" />
                    </comment>
                    <pub-id pub-id-type="medline">1866765</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref42">
                <label>42</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hubert</surname>
                            <given-names>HB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Feinleib</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McNamara</surname>
                            <given-names>PM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Castelli</surname>
                            <given-names>WP</given-names>
                        </name>
                    </person-group>
                    <article-title>Obesity as an independent risk factor for cardiovascular disease: a 26-year follow-up of participants in the Framingham Heart Study</article-title>
                    <source>Circulation</source>
                    <year>1983</year>
                    <volume>67</volume>
                    <issue>5</issue>
                    <fpage>968</fpage>
                    <lpage>977</lpage>
                    <pub-id pub-id-type="medline">6219830</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref43">
                <label>43</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gebregziabher</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Egede</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gilbert</surname>
                            <given-names>GE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hunt</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nietert</surname>
                            <given-names>PJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mauldin</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Fitting parametric random effects models in very large data sets with application to VHA national data</article-title>
                    <source>BMC Med Res Methodol</source>
                    <year>2012</year>
                    <volume>12</volume>
                    <fpage>163</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.biomedcentral.com/1471-2288/12/163" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/1471-2288-12-163</pub-id>
                    <pub-id pub-id-type="medline">23095325</pub-id>
                    <pub-id pub-id-type="pii">1471-2288-12-163</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3542162</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref44">
                <label>44</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bermejo-S&#225;nchez</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cuevas</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Amar</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bakker</surname>
                            <given-names>MK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bianca</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bianchi</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Canfield</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Castilla</surname>
                            <given-names>EE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Clementi</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cocchi</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Feldkamp</surname>
                            <given-names>ML</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Landau</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leoncini</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>Z</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lowry</surname>
                            <given-names>RB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mastroiacovo</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mutchinick</surname>
                            <given-names>OM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rissmann</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ritvanen</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Scarano</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Siffel</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Szabova</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mart&#237;nez-Fr&#237;as</surname>
                            <given-names>ML</given-names>
                        </name>
                    </person-group>
                    <article-title>Amelia: a multi-center descriptive epidemiologic study in a large dataset from the International Clearinghouse for Birth Defects Surveillance and Research, and overview of the literature</article-title>
                    <source>Am J Med Genet C Semin Med Genet</source>
                    <year>2011</year>
                    <volume>157C</volume>
                    <issue>4</issue>
                    <fpage>288</fpage>
                    <lpage>304</lpage>
                    <pub-id pub-id-type="doi">10.1002/ajmg.c.30319</pub-id>
                    <pub-id pub-id-type="medline">22002956</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref45">
                <label>45</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cross</surname>
                            <given-names>SS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Harrison</surname>
                            <given-names>RF</given-names>
                        </name>
                    </person-group>
                    <article-title>Discriminant histological features in the diagnosis of chronic idiopathic inflammatory bowel disease: analysis of a large dataset by a novel data visualisation technique</article-title>
                    <source>J Clin Pathol</source>
                    <year>2002</year>
                    <volume>55</volume>
                    <issue>1</issue>
                    <fpage>51</fpage>
                    <lpage>57</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jcp.bmj.com/cgi/pmidlookup?view=long&#38;pmid=11825925" />
                    </comment>
                    <pub-id pub-id-type="medline">11825925</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1769566</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref46">
                <label>46</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kelly</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>C Zhang</surname>
                            <given-names>Q</given-names>
                        </name>
                        <name name-style="western">
                            <surname>M Soucie</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Manco-Johnson</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dimichele</surname>
                            <given-names>D</given-names>
                        </name>
                        <collab>Joint Outcome Subcommittee of the Coordinating Committee for the Universal Data Collection Databasethe Hemophilia Treatment Center Network Investigators</collab>
                    </person-group>
                    <article-title>Prevalence of clinical hip abnormalities in haemophilia A and B: an analysis of the UDC database</article-title>
                    <source>Haemophilia</source>
                    <year>2013</year>
                    <volume>19</volume>
                    <issue>3</issue>
                    <fpage>426</fpage>
                    <lpage>431</lpage>
                    <pub-id pub-id-type="doi">10.1111/hae.12073</pub-id>
                    <pub-id pub-id-type="medline">23252621</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref47">
                <label>47</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Siregar</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Roes</surname>
                            <given-names>KC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>van Straten</surname>
                            <given-names>AH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bots</surname>
                            <given-names>ML</given-names>
                        </name>
                        <name name-style="western">
                            <surname>van der Graaf</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>van Herwerden</surname>
                            <given-names>LA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Groenwold</surname>
                            <given-names>RH</given-names>
                        </name>
                    </person-group>
                    <article-title>Statistical methods to monitor risk factors in a clinical database: example of a national cardiac surgery registry</article-title>
                    <source>Circ Cardiovasc Qual Outcomes</source>
                    <year>2013</year>
                    <volume>6</volume>
                    <issue>1</issue>
                    <fpage>110</fpage>
                    <lpage>118</lpage>
                    <pub-id pub-id-type="doi">10.1161/CIRCOUTCOMES.112.968800</pub-id>
                    <pub-id pub-id-type="medline">23322806</pub-id>
                    <pub-id pub-id-type="pii">6/1/110</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref48">
                <label>48</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Elshazly</surname>
                            <given-names>MB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Martin</surname>
                            <given-names>SS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Blaha</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Joshi</surname>
                            <given-names>PH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Toth</surname>
                            <given-names>PP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McEvoy</surname>
                            <given-names>JW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Al-Hijji</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kulkarni</surname>
                            <given-names>KR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kwiterovich</surname>
                            <given-names>PO</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Blumenthal</surname>
                            <given-names>RS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jones</surname>
                            <given-names>SR</given-names>
                        </name>
                    </person-group>
                    <article-title>Non-high-density lipoprotein cholesterol, guideline targets, and population percentiles for secondary prevention in 1.3 million adults: the VLDL-2 Study (very large database of lipids)</article-title>
                    <source>J Am Coll Cardiol</source>
                    <year>2013</year>
                    <month>11</month>
                    <day>19</day>
                    <volume>62</volume>
                    <issue>21</issue>
                    <fpage>1960</fpage>
                    <lpage>1965</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.jacc.2013.07.045</pub-id>
                    <pub-id pub-id-type="medline">23973689</pub-id>
                    <pub-id pub-id-type="pii">S0735-1097(13)03075-1</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref49">
                <label>49</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chan</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McGarey</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Using large datasets for population-based health research</article-title>
                    <source>Gallin JI, Ognibene FP.  eds. Principles and Practice of Clinical Research. 3rd ed</source>
                    <year>2012</year>
                    <publisher-loc>Maryland Heights, MO</publisher-loc>
                    <publisher-name>Elsevier, Inc</publisher-name>
                    <fpage>371</fpage>
                    <lpage>381</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref50">
                <label>50</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ursum</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bos</surname>
                            <given-names>WH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>van de Stadt</surname>
                            <given-names>RJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dijkmans</surname>
                            <given-names>BA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>van Schaardenburg</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>Different properties of ACPA and IgM-RF derived from a large dataset: further evidence of two distinct autoantibody systems</article-title>
                    <source>Arthritis Res Ther</source>
                    <year>2009</year>
                    <volume>11</volume>
                    <issue>3</issue>
                    <fpage>R75</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://arthritis-research.com/content/11/3/R75" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/ar2704</pub-id>
                    <pub-id pub-id-type="medline">19460147</pub-id>
                    <pub-id pub-id-type="pii">ar2704</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2714121</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref51">
                <label>51</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ajdacic-Gross</surname>
                            <given-names>V</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Vetter</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>M&#252;ller</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kawohl</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Frey</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lupi</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Blechschmidt</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Born</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Latal</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>R&#246;ssler</surname>
                            <given-names>W</given-names>
                        </name>
                    </person-group>
                    <article-title>Risk factors for stuttering: a secondary analysis of a large data base</article-title>
                    <source>Eur Arch Psychiatry Clin Neurosci</source>
                    <year>2010</year>
                    <volume>260</volume>
                    <issue>4</issue>
                    <fpage>279</fpage>
                    <lpage>286</lpage>
                    <pub-id pub-id-type="doi">10.1007/s00406-009-0075-4</pub-id>
                    <pub-id pub-id-type="medline">19826856</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref52">
                <label>52</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Monnelly</surname>
                            <given-names>EP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Locastro</surname>
                            <given-names>JS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gagnon</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Young</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fiore</surname>
                            <given-names>LD</given-names>
                        </name>
                    </person-group>
                    <article-title>Quetiapine versus trazodone in reducing rehospitalization for alcohol dependence: a large data-base study</article-title>
                    <source>J Addict Med</source>
                    <year>2008</year>
                    <volume>2</volume>
                    <issue>3</issue>
                    <fpage>128</fpage>
                    <lpage>134</lpage>
                    <pub-id pub-id-type="doi">10.1097/ADM.0b013e318165cb56</pub-id>
                    <pub-id pub-id-type="medline">21768982</pub-id>
                    <pub-id pub-id-type="pii">01271255-200809000-00003</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref53">
                <label>53</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>From</surname>
                            <given-names>AM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bartholmai</surname>
                            <given-names>BJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Williams</surname>
                            <given-names>AW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cha</surname>
                            <given-names>SS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pflueger</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McDonald</surname>
                            <given-names>FS</given-names>
                        </name>
                    </person-group>
                    <article-title>Sodium bicarbonate is associated with an increased incidence of contrast nephropathy: a retrospective cohort study of 7977 patients at mayo clinic</article-title>
                    <source>Clin J Am Soc Nephrol</source>
                    <year>2008</year>
                    <volume>3</volume>
                    <issue>1</issue>
                    <fpage>10</fpage>
                    <lpage>18</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://cjasn.asnjournals.org/cgi/pmidlookup?view=long&#38;pmid=18057306" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2215/CJN.03100707</pub-id>
                    <pub-id pub-id-type="medline">18057306</pub-id>
                    <pub-id pub-id-type="pii">CJN.03100707</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2390990</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref54">
                <label>54</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Habash-Bseiso</surname>
                            <given-names>DE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rokey</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Berger</surname>
                            <given-names>CJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Weier</surname>
                            <given-names>AW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chyou</surname>
                            <given-names>PH</given-names>
                        </name>
                    </person-group>
                    <article-title>Accuracy of noninvasive ejection fraction measurement in a large community-based clinic</article-title>
                    <source>Clin Med Res</source>
                    <year>2005</year>
                    <volume>3</volume>
                    <issue>2</issue>
                    <fpage>75</fpage>
                    <lpage>82</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.clinmedres.org/cgi/pmidlookup?view=long&#38;pmid=16012124" />
                    </comment>
                    <pub-id pub-id-type="medline">16012124</pub-id>
                    <pub-id pub-id-type="pii">3/2/75</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1183436</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref55">
                <label>55</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hemond</surname>
                            <given-names>MS</given-names>
                        </name>
                    </person-group>
                    <article-title>Uncovering the predictive value of minimum blood glucose through statistical analysis of a large clinical dataset</article-title>
                    <source>AMIA Annu Symp Proc</source>
                    <year>2009</year>
                    <volume>2009</volume>
                    <fpage>725</fpage>
                    <lpage>729</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20351948" />
                    </comment>
                    <pub-id pub-id-type="medline">20351948</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2815380</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref56">
                <label>56</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Morgan</surname>
                            <given-names>CL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Evans</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Toft</surname>
                            <given-names>AD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jenkins-Jones</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Poole</surname>
                            <given-names>CD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Currie</surname>
                            <given-names>CJ</given-names>
                        </name>
                    </person-group>
                    <article-title>Clinical effectiveness of biphasic insulin aspart 30:70 versus biphasic human insulin 30 in UK general clinical practice: a retrospective database study</article-title>
                    <source>Clin Ther</source>
                    <year>2011</year>
                    <volume>33</volume>
                    <issue>1</issue>
                    <fpage>27</fpage>
                    <lpage>35</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.clinthera.2011.01.023</pub-id>
                    <pub-id pub-id-type="medline">21397771</pub-id>
                    <pub-id pub-id-type="pii">S0149-2918(11)00070-1</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref57">
                <label>57</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kobayashi</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Miyata</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gotoh</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Baba</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kimura</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kitagawa</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nakagoe</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shimada</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tomita</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sugihara</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mori</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Risk model for right hemicolectomy based on 19,070 Japanese patients in the National Clinical Database</article-title>
                    <source>J Gastroenterol</source>
                    <year>2013</year>
                    <month>07</month>
                    <day>27</day>
                    <pub-id pub-id-type="doi">10.1007/s00535-013-0860-8</pub-id>
                    <pub-id pub-id-type="medline">23892987</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref58">
                <label>58</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <collab>International Warfarin Pharmacogenetics Consortium</collab>
                        <name name-style="western">
                            <surname>Klein</surname>
                            <given-names>TE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Altman</surname>
                            <given-names>RB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Eriksson</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gage</surname>
                            <given-names>BF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kimmel</surname>
                            <given-names>SE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lee</surname>
                            <given-names>MT</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Limdi</surname>
                            <given-names>NA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Page</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Roden</surname>
                            <given-names>DM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wagner</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Caldwell</surname>
                            <given-names>MD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Johnson</surname>
                            <given-names>JA</given-names>
                        </name>
                    </person-group>
                    <article-title>Estimation of the warfarin dose with clinical and pharmacogenetic data</article-title>
                    <source>N Engl J Med</source>
                    <year>2009</year>
                    <volume>360</volume>
                    <issue>8</issue>
                    <fpage>753</fpage>
                    <lpage>764</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19228618" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1056/NEJMoa0809329</pub-id>
                    <pub-id pub-id-type="medline">19228618</pub-id>
                    <pub-id pub-id-type="pii">360/8/753</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2722908</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref59">
                <label>59</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Moreno-De-Luca</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sanders</surname>
                            <given-names>SJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Willsey</surname>
                            <given-names>AJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mulle</surname>
                            <given-names>JG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lowe</surname>
                            <given-names>JK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Geschwind</surname>
                            <given-names>DH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>State</surname>
                            <given-names>MW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Martin</surname>
                            <given-names>CL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ledbetter</surname>
                            <given-names>DH</given-names>
                        </name>
                    </person-group>
                    <article-title>Using large clinical data sets to infer pathogenicity for rare copy number variants in autism cohorts</article-title>
                    <source>Mol Psychiatry</source>
                    <year>2013</year>
                    <volume>18</volume>
                    <issue>10</issue>
                    <fpage>1090</fpage>
                    <lpage>1095</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23044707" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1038/mp.2012.138</pub-id>
                    <pub-id pub-id-type="medline">23044707</pub-id>
                    <pub-id pub-id-type="pii">mp2012138</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3720840</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref60">
                <label>60</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Koefoed</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Andreassen</surname>
                            <given-names>OA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bennike</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dam</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Djurovic</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hansen</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jorgensen</surname>
                            <given-names>MB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kessing</surname>
                            <given-names>LV</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Melle</surname>
                            <given-names>I</given-names>
                        </name>
                        <name name-style="western">
                            <surname>M&#248;ller</surname>
                            <given-names>GL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mors</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Werge</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mellerup</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Combinations of SNPs related to signal transduction in bipolar disorder</article-title>
                    <source>PLoS One</source>
                    <year>2011</year>
                    <volume>6</volume>
                    <issue>8</issue>
                    <fpage>e23812</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0023812" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0023812</pub-id>
                    <pub-id pub-id-type="medline">21897858</pub-id>
                    <pub-id pub-id-type="pii">10-PONE-RA-20023</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3163586</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref61">
                <label>61</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hill</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Proulx</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zeng-Treitler</surname>
                            <given-names>Q</given-names>
                        </name>
                    </person-group>
                    <article-title>Exploring the use of large clinical data to inform patients for shared decision making</article-title>
                    <source>Stud Health Technol Inform</source>
                    <year>2013</year>
                    <volume>192</volume>
                    <fpage>851</fpage>
                    <lpage>855</lpage>
                    <pub-id pub-id-type="medline">23920678</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref62">
                <label>62</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Giger</surname>
                            <given-names>ML</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yuan</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Horsch</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lan</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jamieson</surname>
                            <given-names>AR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sennett</surname>
                            <given-names>CA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jansen</surname>
                            <given-names>SA</given-names>
                        </name>
                    </person-group>
                    <article-title>Evaluation of computer-aided diagnosis on a large clinical full-field digital mammographic dataset</article-title>
                    <source>Acad Radiol</source>
                    <year>2008</year>
                    <volume>15</volume>
                    <issue>11</issue>
                    <fpage>1437</fpage>
                    <lpage>1445</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18995194" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1016/j.acra.2008.05.004</pub-id>
                    <pub-id pub-id-type="medline">18995194</pub-id>
                    <pub-id pub-id-type="pii">S1076-6332(08)00280-8</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2597106</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref63">
                <label>63</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Giger</surname>
                            <given-names>ML</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lan</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bancroft Brown</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>MacMahon</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mussman</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Olopade</surname>
                            <given-names>OI</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sennett</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>Computerized analysis of mammographic parenchymal patterns on a large clinical dataset of full-field digital mammograms: robustness study with two high-risk datasets</article-title>
                    <source>J Digit Imaging</source>
                    <year>2012</year>
                    <volume>25</volume>
                    <issue>5</issue>
                    <fpage>591</fpage>
                    <lpage>598</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22246204" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1007/s10278-012-9452-z</pub-id>
                    <pub-id pub-id-type="medline">22246204</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3447101</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref64">
                <label>64</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lin</surname>
                            <given-names>KW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tharp</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Conway</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hsieh</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ross</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kim</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kim</surname>
                            <given-names>HE</given-names>
                        </name>
                    </person-group>
                    <article-title>Feasibility of using Clinical Element Models (CEM) to standardize phenotype variables in the database of genotypes and phenotypes (dbGaP)</article-title>
                    <source>PLoS One</source>
                    <year>2013</year>
                    <volume>8</volume>
                    <issue>9</issue>
                    <fpage>e76384</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0076384" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0076384</pub-id>
                    <pub-id pub-id-type="medline">24058713</pub-id>
                    <pub-id pub-id-type="pii">PONE-D-13-01003</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3776754</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref65">
                <label>65</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Stephen</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Boxwala</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gertman</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Feasibility of using a large Clinical Data Warehouse to automate the selection of diagnostic cohorts</article-title>
                    <source>AMIA Annu Symp Proc</source>
                    <year>2003</year>
                    <fpage>1019</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/14728522" />
                    </comment>
                    <pub-id pub-id-type="medline">14728522</pub-id>
                    <pub-id pub-id-type="pii">D030003072</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1480068</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref66">
                <label>66</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Roelofs</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Persoon</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nijsten</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wiessler</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dekker</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lambin</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Benefits of a clinical data warehouse with data mining tools to collect data for a radiotherapy trial</article-title>
                    <source>Radiother Oncol</source>
                    <year>2013</year>
                    <volume>108</volume>
                    <issue>1</issue>
                    <fpage>174</fpage>
                    <lpage>179</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.radonc.2012.09.019</pub-id>
                    <pub-id pub-id-type="medline">23394741</pub-id>
                    <pub-id pub-id-type="pii">S0167-8140(12)00444-6</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref67">
                <label>67</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Stenson</surname>
                            <given-names>PD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mort</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ball</surname>
                            <given-names>EV</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shaw</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Phillips</surname>
                            <given-names>AD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cooper</surname>
                            <given-names>DN</given-names>
                        </name>
                    </person-group>
                    <article-title>The Human Gene Mutation Database: building a comprehensive mutation repository for clinical and molecular genetics, diagnostic testing and personalized genomic medicine</article-title>
                    <source>Hum Genet</source>
                    <year>2013</year>
                    <month>09</month>
                    <day>28</day>
                    <pub-id pub-id-type="doi">10.1007/s00439-013-1358-4</pub-id>
                    <pub-id pub-id-type="medline">24077912</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref68">
                <label>68</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hu</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brzeski</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hutchins</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ramaraj</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Qu</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Xiong</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kalathil</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kato</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tenkillaya</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Carney</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Redd</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Arkalgudvenkata</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shahzad</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Scott</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cheng</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Meadow</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McMichael</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sheu</surname>
                            <given-names>SL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rosendale</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kvecher</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ahern</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yang</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jordan</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Somiari</surname>
                            <given-names>SB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hooke</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shriver</surname>
                            <given-names>CD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Somiari</surname>
                            <given-names>RI</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Liebman</surname>
                            <given-names>MN</given-names>
                        </name>
                    </person-group>
                    <article-title>Biomedical informatics: development of a comprehensive data warehouse for clinical and genomic breast cancer research</article-title>
                    <source>Pharmacogenomics</source>
                    <year>2004</year>
                    <volume>5</volume>
                    <issue>7</issue>
                    <fpage>933</fpage>
                    <lpage>941</lpage>
                    <pub-id pub-id-type="doi">10.1517/14622416.5.7.933</pub-id>
                    <pub-id pub-id-type="medline">15469411</pub-id>
                    <pub-id pub-id-type="pii">PGS050713</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref69">
                <label>69</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Savas</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>A curated database of genetic markers from the angiogenesis/VEGF pathway and their relation to clinical outcome in human cancers</article-title>
                    <source>Acta Oncol</source>
                    <year>2012</year>
                    <volume>51</volume>
                    <issue>2</issue>
                    <fpage>243</fpage>
                    <lpage>246</lpage>
                    <pub-id pub-id-type="doi">10.3109/0284186X.2011.636758</pub-id>
                    <pub-id pub-id-type="medline">22150118</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref70">
                <label>70</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Singh</surname>
                            <given-names>SK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Malik</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Firoz</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jha</surname>
                            <given-names>V</given-names>
                        </name>
                    </person-group>
                    <article-title>CDKD: a clinical database of kidney diseases</article-title>
                    <source>BMC Nephrol</source>
                    <year>2012</year>
                    <volume>13</volume>
                    <fpage>23</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.biomedcentral.com/1471-2369/13/23" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/1471-2369-13-23</pub-id>
                    <pub-id pub-id-type="medline">22540288</pub-id>
                    <pub-id pub-id-type="pii">1471-2369-13-23</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3520117</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref71">
                <label>71</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Suzuki</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gotoh</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sugihara</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kitagawa</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kimura</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kondo</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shimada</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tomita</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nakagoe</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hashimoto</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Baba</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Miyata</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Motomura</surname>
                            <given-names>N</given-names>
                        </name>
                    </person-group>
                    <article-title>Nationwide survey and establishment of a clinical database for gastrointestinal surgery in Japan: Targeting integration of a cancer registration system and improving the outcome of cancer treatment</article-title>
                    <source>Cancer Sci</source>
                    <year>2011</year>
                    <volume>102</volume>
                    <issue>1</issue>
                    <fpage>226</fpage>
                    <lpage>230</lpage>
                    <pub-id pub-id-type="doi">10.1111/j.1349-7006.2010.01749.x</pub-id>
                    <pub-id pub-id-type="medline">20961361</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref72">
                <label>72</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chawla</surname>
                            <given-names>NV</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Davis</surname>
                            <given-names>DA</given-names>
                        </name>
                    </person-group>
                    <article-title>Bringing big data to personalized healthcare: a patient-centered framework</article-title>
                    <source>J Gen Intern Med</source>
                    <year>2013</year>
                    <volume>28(suppl 3)</volume>
                    <fpage>S660</fpage>
                    <lpage>S665</lpage>
                    <pub-id pub-id-type="doi">10.1007/s11606-013-2455-8</pub-id>
                    <pub-id pub-id-type="medline">23797912</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref73">
                <label>73</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Han</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>It&#228;l&#228;</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>H&#228;m&#228;l&#228;inen</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Citizen Centric Architecture approach - taking e-health forward by integrating citizens and service providers</article-title>
                    <source>Stud Health Technol Inform</source>
                    <year>2010</year>
                    <volume>160</volume>
                    <issue>Pt 2</issue>
                    <fpage>907</fpage>
                    <lpage>911</lpage>
                    <pub-id pub-id-type="medline">20841816</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref74">
                <label>74</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Boussadi</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Caruba</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zapletal</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sabatier</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Durieux</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Degoulet</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>A clinical data warehouse-based process for refining medication orders alerts</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2012</year>
                    <volume>19</volume>
                    <issue>5</issue>
                    <fpage>782</fpage>
                    <lpage>785</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.bmj.com/cgi/pmidlookup?view=long&#38;pmid=22523345" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/amiajnl-2012-000850</pub-id>
                    <pub-id pub-id-type="medline">22523345</pub-id>
                    <pub-id pub-id-type="pii">amiajnl-2012-000850</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3422842</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref75">
                <label>75</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hernandez</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Podchiyska</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Weber</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ferris</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lowe</surname>
                            <given-names>H</given-names>
                        </name>
                    </person-group>
                    <source>AMIA Annu Symp Proc</source>
                    <year>2009</year>
                    <access-date>2014-01-09</access-date>
                    <comment>Automated mapping of pharmacy orders from two electronic health record systems to RxNorm within the STRIDE clinical data warehouse<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20351858/reload=0;jsessionid=4aLVRuWM5ugKTsb134ug.0">http://europepmc.org/abstract/MED/20351858/reload=0;jsessionid=4aLVRuWM5ugKTsb134ug.0</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6MVbvtUxj</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref76">
                <label>76</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cuggia</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Garcelon</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Campillo-Gimenez</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bernicot</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Laurent</surname>
                            <given-names>JF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Garin</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Happe</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Duvauferrier</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <article-title>Roogle: an information retrieval engine for clinical data warehouse</article-title>
                    <source>Stud Health Technol Inform</source>
                    <year>2011</year>
                    <volume>169</volume>
                    <fpage>584</fpage>
                    <lpage>588</lpage>
                    <pub-id pub-id-type="medline">21893816</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref77">
                <label>77</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>X</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Liu</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Guo</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gao</surname>
                            <given-names>Z</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yan</surname>
                            <given-names>X</given-names>
                        </name>
                    </person-group>
                    <article-title>Development of traditional Chinese medicine clinical data warehouse for medical knowledge discovery and decision support</article-title>
                    <source>Artif Intell Med</source>
                    <year>2010</year>
                    <volume>48</volume>
                    <issue>2-3</issue>
                    <fpage>139</fpage>
                    <lpage>152</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.artmed.2009.07.012</pub-id>
                    <pub-id pub-id-type="medline">20122820</pub-id>
                    <pub-id pub-id-type="pii">S0933-3657(09)00105-5</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref78">
                <label>78</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Zapletal</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rodon</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Grabar</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Degoulet</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Methodology of integration of a clinical data warehouse with a clinical information system: the HEGP case</article-title>
                    <source>Stud Health Technol Inform</source>
                    <year>2010</year>
                    <volume>160</volume>
                    <issue>Pt 1</issue>
                    <fpage>193</fpage>
                    <lpage>197</lpage>
                    <pub-id pub-id-type="medline">20841676</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref79">
                <label>79</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hanss</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schaaf</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wetzel</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hahn</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schrader</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tolxdorff</surname>
                            <given-names>T</given-names>
                        </name>
                    </person-group>
                    <article-title>Integration of decentralized clinical data in a data warehouse: a service-oriented design and realization</article-title>
                    <source>Methods Inf Med</source>
                    <year>2009</year>
                    <volume>48</volume>
                    <issue>5</issue>
                    <fpage>414</fpage>
                    <lpage>418</lpage>
                    <pub-id pub-id-type="doi">10.3414/ME9240</pub-id>
                    <pub-id pub-id-type="medline">19657544</pub-id>
                    <pub-id pub-id-type="pii">9240</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref80">
                <label>80</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Evans</surname>
                            <given-names>RS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lloyd</surname>
                            <given-names>JF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pierce</surname>
                            <given-names>LA</given-names>
                        </name>
                    </person-group>
                    <source>AMIA Annu Symp Proc</source>
                    <year>2012</year>
                    <access-date>2014-01-09</access-date>
                    <comment>Clinical use of an enterprise data warehouse<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23304288/reload=0;jsessionid=P5NVyPK8BYs9OV0Ra8hg.0">http://europepmc.org/abstract/MED/23304288/reload=0;jsessionid=P5NVyPK8BYs9OV0Ra8hg.0</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6MVc6BqLh</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref81">
                <label>81</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Harrison</surname>
                            <given-names>JH</given-names>
                        </name>
                    </person-group>
                    <article-title>Introduction to the mining of clinical data</article-title>
                    <source>Clin Lab Med</source>
                    <year>2008</year>
                    <volume>28</volume>
                    <issue>1</issue>
                    <fpage>1</fpage>
                    <lpage>7</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.cll.2007.10.001</pub-id>
                    <pub-id pub-id-type="medline">18194715</pub-id>
                    <pub-id pub-id-type="pii">S0272-2712(07)00110-2</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref82">
                <label>82</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Phan</surname>
                            <given-names>JH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Quo</surname>
                            <given-names>CF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cheng</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>MD</given-names>
                        </name>
                    </person-group>
                    <article-title>Multiscale integration of -omic, imaging, and clinical data in biomedical informatics</article-title>
                    <source>IEEE Rev Biomed Eng</source>
                    <year>2012</year>
                    <volume>5</volume>
                    <fpage>74</fpage>
                    <lpage>87</lpage>
                    <pub-id pub-id-type="doi">10.1109/RBME.2012.2212427</pub-id>
                    <pub-id pub-id-type="medline">23231990</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref83">
                <label>83</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Sinha</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hripcsak</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Markatou</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Large datasets in biomedicine: a discussion of salient analytic issues</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2009</year>
                    <volume>16</volume>
                    <issue>6</issue>
                    <fpage>759</fpage>
                    <lpage>767</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.bmj.com/cgi/pmidlookup?view=long&#38;pmid=19717808" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1197/jamia.M2780</pub-id>
                    <pub-id pub-id-type="medline">19717808</pub-id>
                    <pub-id pub-id-type="pii">M2780</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3002128</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref84">
                <label>84</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Drai</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Grodzinsky</surname>
                            <given-names>Y</given-names>
                        </name>
                    </person-group>
                    <article-title>A new empirical angle on the variability debate: quantitative neurosyntactic analyses of a large data set from Broca's aphasia</article-title>
                    <source>Brain Lang</source>
                    <year>2006</year>
                    <volume>96</volume>
                    <issue>2</issue>
                    <fpage>117</fpage>
                    <lpage>128</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.bandl.2004.10.016</pub-id>
                    <pub-id pub-id-type="medline">16115671</pub-id>
                    <pub-id pub-id-type="pii">S0093-934X(05)00116-1</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref85">
                <label>85</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bellman</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kalaba</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <article-title>DYNAMIC PROGRAMMING AND STATISTICAL COMMUNICATION THEORY</article-title>
                    <source>Proc Natl Acad Sci U S A</source>
                    <year>1957</year>
                    <volume>43</volume>
                    <issue>8</issue>
                    <fpage>749</fpage>
                    <lpage>751</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16590080" />
                    </comment>
                    <pub-id pub-id-type="medline">16590080</pub-id>
                    <pub-id pub-id-type="pmcid">PMC528532</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref86">
                <label>86</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Borthakur</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <source>The Hadoop Distributed File System: Architecture and Design</source>
                    <access-date>2013-11-25</access-date>
                    <comment>2007<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://hadoop.apache.org/docs/r0.18.0/hdfs_design.pdf">https://hadoop.apache.org/docs/r0.18.0/hdfs_design.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6LOoNyUXR</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref87">
                <label>87</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chang</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dean</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ghemawat</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>Bigtable: A Distributed Storage System for Structured Data</article-title>
                    <year>2006</year>
                    <conf-name>the 7th USENIX Symposium on Operating Systems Design and Implementation (OSDI’06)</conf-name>
                    <conf-date>2006</conf-date>
                    <conf-loc>Seattle, WA, US</conf-loc>
                    <fpage>205</fpage>
                    <lpage>218</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref88">
                <label>88</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Litt</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <source>NoSQL: The Unix Database (With awk)</source>
                    <access-date>2013-11-25</access-date>
                    <comment>2007<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.troubleshooters.com/lpm/200704/200704.htm">http://www.troubleshooters.com/lpm/200704/200704.htm</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6LOp7PTH6</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref89">
                <label>89</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>van der Burgt</surname>
                            <given-names>YE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Taban</surname>
                            <given-names>IM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Konijnenburg</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Biskup</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Duursma</surname>
                            <given-names>MC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Heeren</surname>
                            <given-names>RM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>R&#246;mpp</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>van Nieuwpoort</surname>
                            <given-names>RV</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bal</surname>
                            <given-names>HE</given-names>
                        </name>
                    </person-group>
                    <article-title>Parallel processing of large datasets from NanoLC-FTICR-MS measurements</article-title>
                    <source>J Am Soc Mass Spectrom</source>
                    <year>2007</year>
                    <volume>18</volume>
                    <issue>1</issue>
                    <fpage>152</fpage>
                    <lpage>161</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.jasms.2006.09.005</pub-id>
                    <pub-id pub-id-type="medline">17055738</pub-id>
                    <pub-id pub-id-type="pii">S1044-0305(06)00822-1</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref90">
                <label>90</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <collab>Stata Corporation</collab>
                    </person-group>
                    <article-title>Stata reference manual : release 6</article-title>
                    <source>Stata Reference Manual Set, 4vol: Release 6</source>
                    <year>1999</year>
                    <publisher-loc>College Station, TX</publisher-loc>
                    <publisher-name>Stata Corp</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref91">
                <label>91</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>R Development Core Team</collab>
                    </person-group>
                    <source>official website for R</source>
                    <access-date>2014-01-08</access-date>
                    <publisher-loc>Vienna, Austria</publisher-loc>
                    <comment>The R Project for Statistical Computing<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.r-project.org/">http://www.r-project.org/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6MU3hBSqT</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref92">
                <label>92</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bolstad</surname>
                            <given-names>BM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Irizarry</surname>
                            <given-names>RA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Astrand</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Speed</surname>
                            <given-names>TP</given-names>
                        </name>
                    </person-group>
                    <article-title>A comparison of normalization methods for high density oligonucleotide array data based on variance and bias</article-title>
                    <source>Bioinformatics</source>
                    <year>2003</year>
                    <volume>19</volume>
                    <issue>2</issue>
                    <fpage>185</fpage>
                    <lpage>193</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bioinformatics.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=12538238" />
                    </comment>
                    <pub-id pub-id-type="medline">12538238</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref93">
                <label>93</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Pleil</surname>
                            <given-names>JD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Stiegel</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Madden</surname>
                            <given-names>MC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sobus</surname>
                            <given-names>JR</given-names>
                        </name>
                    </person-group>
                    <article-title>Heat map visualization of complex environmental and biomarker measurements</article-title>
                    <source>Chemosphere</source>
                    <year>2011</year>
                    <volume>84</volume>
                    <issue>5</issue>
                    <fpage>716</fpage>
                    <lpage>723</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.chemosphere.2011.03.017</pub-id>
                    <pub-id pub-id-type="medline">21492901</pub-id>
                    <pub-id pub-id-type="pii">S0045-6535(11)00286-4</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref94">
                <label>94</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Garcia-Betancur</surname>
                            <given-names>JC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Menendez</surname>
                            <given-names>MC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Del Portillo</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Garcia</surname>
                            <given-names>MJ</given-names>
                        </name>
                    </person-group>
                    <article-title>Alignment of multiple complete genomes suggests that gene rearrangements may contribute towards the speciation of Mycobacteria</article-title>
                    <source>Infect Genet Evol</source>
                    <year>2012</year>
                    <volume>12</volume>
                    <issue>4</issue>
                    <fpage>819</fpage>
                    <lpage>826</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.meegid.2011.09.024</pub-id>
                    <pub-id pub-id-type="medline">22008279</pub-id>
                    <pub-id pub-id-type="pii">S1567-1348(11)00354-6</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref95">
                <label>95</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Aita</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nishigaki</surname>
                            <given-names>K</given-names>
                        </name>
                    </person-group>
                    <article-title>A visualization of 3D proteome universe: mapping of a proteome ensemble into 3D space based on the protein-structure composition</article-title>
                    <source>Mol Phylogenet Evol</source>
                    <year>2011</year>
                    <volume>61</volume>
                    <issue>2</issue>
                    <fpage>484</fpage>
                    <lpage>494</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.ympev.2011.06.020</pub-id>
                    <pub-id pub-id-type="medline">21762784</pub-id>
                    <pub-id pub-id-type="pii">S1055-7903(11)00309-5</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref96">
                <label>96</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lenzerini</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Data Integration: A Theoretical Perspective</article-title>
                    <year>2002</year>
                    <conf-name>Proceedings of the ACM Symposium on Principles of Database Systems (PODS)</conf-name>
                    <conf-date>2002</conf-date>
                    <conf-loc>Roma, Italy</conf-loc>
                    <fpage>233</fpage>
                    <lpage>246</lpage>
                    <pub-id pub-id-type="doi">10.1145/543613.543644</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref97">
                <label>97</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Halevy</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rajaraman</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ordille</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Data integration: the teenage years</article-title>
                    <year>2006</year>
                    <conf-name>VLDB '06 Proceedings of the 32nd international conference on Very large data bases</conf-name>
                    <conf-date>2006</conf-date>
                    <conf-loc>Seoul, Korea</conf-loc>
                    <fpage>9</fpage>
                    <lpage>16</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref98">
                <label>98</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Haas</surname>
                            <given-names>LM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lin</surname>
                            <given-names>ET</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Roth</surname>
                            <given-names>MA</given-names>
                        </name>
                    </person-group>
                    <article-title>Data integration through database federation</article-title>
                    <source>IBM Syst. J</source>
                    <year>2002</year>
                    <volume>41</volume>
                    <issue>4</issue>
                    <fpage>578</fpage>
                    <lpage>596</lpage>
                    <pub-id pub-id-type="doi">10.1147/sj.414.0578</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref99">
                <label>99</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Shyu</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ytreberg</surname>
                            <given-names>FM</given-names>
                        </name>
                    </person-group>
                    <article-title>Reducing the bias and uncertainty of free energy estimates by using regression to fit thermodynamic integration data</article-title>
                    <source>J Comput Chem</source>
                    <year>2009</year>
                    <volume>30</volume>
                    <issue>14</issue>
                    <fpage>2297</fpage>
                    <lpage>2304</lpage>
                    <pub-id pub-id-type="doi">10.1002/jcc.21231</pub-id>
                    <pub-id pub-id-type="medline">19266482</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref100">
                <label>100</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Taylor</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gladman</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Helliwell</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Marchesoni</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mease</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mielants</surname>
                            <given-names>H</given-names>
                        </name>
                        <collab>CASPAR Study Group</collab>
                    </person-group>
                    <article-title>Classification criteria for psoriatic arthritis: development of new criteria from a large international study</article-title>
                    <source>Arthritis Rheum</source>
                    <year>2006</year>
                    <volume>54</volume>
                    <issue>8</issue>
                    <fpage>2665</fpage>
                    <lpage>2673</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.doi.org/10.1002/art.21972" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1002/art.21972</pub-id>
                    <pub-id pub-id-type="medline">16871531</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref101">
                <label>101</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gschwind</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Robert</surname>
                            <given-names>Y</given-names>
                        </name>
                    </person-group>
                    <article-title>Analyse der zeitlichen Ver&#228;nderungen der Papillen-Reflexion mittels Hauptkomponentenanalyse</article-title>
                    <source>Klin Monatsbl Augenheilkd</source>
                    <year>2008</year>
                    <volume>190</volume>
                    <issue>04</issue>
                    <fpage>249</fpage>
                    <pub-id pub-id-type="doi">10.1055/s-2008-1050370</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref102">
                <label>102</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Santaf&#233;</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lozano</surname>
                            <given-names>JA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Larra&#241;aga</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Bayesian model averaging of naive Bayes for clustering</article-title>
                    <source>IEEE Trans Syst Man Cybern B Cybern</source>
                    <year>2006</year>
                    <volume>36</volume>
                    <issue>5</issue>
                    <fpage>1149</fpage>
                    <lpage>1161</lpage>
                    <pub-id pub-id-type="medline">17036820</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref103">
                <label>103</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Farr&#233;</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cabrera</surname>
                            <given-names>JA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Romero</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rubio</surname>
                            <given-names>JM</given-names>
                        </name>
                    </person-group>
                    <article-title>Therapeutic decision tree for patients with sustained ventricular tachyarrhythmias or aborted cardiac arrest: a critical review of the Antiarrhythmics Versus Implantable Defibrillator trial and the Canadian Implantable Defibrillator Study</article-title>
                    <source>Am J Cardiol</source>
                    <year>2000</year>
                    <volume>86</volume>
                    <issue>9A</issue>
                    <fpage>44K</fpage>
                    <lpage>51K</lpage>
                    <pub-id pub-id-type="medline">11084100</pub-id>
                    <pub-id pub-id-type="pii">S0002914900012911</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref104">
                <label>104</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lisboa</surname>
                            <given-names>PJ</given-names>
                        </name>
                    </person-group>
                    <article-title>A review of evidence of health benefit from artificial neural networks in medical intervention</article-title>
                    <source>Neural Netw</source>
                    <year>2002</year>
                    <volume>15</volume>
                    <issue>1</issue>
                    <fpage>11</fpage>
                    <lpage>39</lpage>
                    <pub-id pub-id-type="medline">11958484</pub-id>
                    <pub-id pub-id-type="pii">S0893-6080(01)00111-3</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref105">
                <label>105</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>HF</given-names>
                        </name>
                    </person-group>
                    <article-title>In silico log P prediction for a large data set with support vector machines, radial basis neural networks and multiple linear regression</article-title>
                    <source>Chem Biol Drug Des</source>
                    <year>2009</year>
                    <volume>74</volume>
                    <issue>2</issue>
                    <fpage>142</fpage>
                    <lpage>147</lpage>
                    <pub-id pub-id-type="doi">10.1111/j.1747-0285.2009.00840.x</pub-id>
                    <pub-id pub-id-type="medline">19549084</pub-id>
                    <pub-id pub-id-type="pii">JPP840</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref106">
                <label>106</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Aickin</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gensler</surname>
                            <given-names>H</given-names>
                        </name>
                    </person-group>
                    <article-title>Adjusting for multiple testing when reporting research results: the Bonferroni vs Holm methods</article-title>
                    <source>Am J Public Health</source>
                    <year>1996</year>
                    <volume>86</volume>
                    <issue>5</issue>
                    <fpage>726</fpage>
                    <lpage>728</lpage>
                    <pub-id pub-id-type="doi">10.2105/Ajph.86.5.726</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref107">
                <label>107</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bender</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lange</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>Adjusting for multiple testing&#8212;when and how?</article-title>
                    <source>Journal of Clinical Epidemiology</source>
                    <year>2001</year>
                    <volume>54</volume>
                    <issue>4</issue>
                    <fpage>343</fpage>
                    <lpage>349</lpage>
                    <pub-id pub-id-type="doi">10.1016/S0895-4356(00)00314-0</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref108">
                <label>108</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Broberg</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>A comparative review of estimates of the proportion unchanged genes and the false discovery rate</article-title>
                    <source>BMC Bioinformatics</source>
                    <year>2005</year>
                    <volume>6</volume>
                    <fpage>199</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.biomedcentral.com/1471-2105/6/199" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/1471-2105-6-199</pub-id>
                    <pub-id pub-id-type="medline">16086831</pub-id>
                    <pub-id pub-id-type="pii">1471-2105-6-199</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1199583</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref109">
                <label>109</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>van der Laan</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dudoit</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pollard</surname>
                            <given-names>KS</given-names>
                        </name>
                    </person-group>
                    <article-title>Multiple testing. Part II.  Step-down procedures for control of the family-wise error rate</article-title>
                    <source>Stat Appl Genet Mol Biol</source>
                    <year>2004</year>
                    <volume>3</volume>
                    <pub-id pub-id-type="doi">10.2202/1544-6115.1041</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref110">
                <label>110</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Sanders</surname>
                            <given-names>CM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Saltzstein</surname>
                            <given-names>SL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schultzel</surname>
                            <given-names>MM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nguyen</surname>
                            <given-names>DH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Stafford</surname>
                            <given-names>HS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sadler</surname>
                            <given-names>GR</given-names>
                        </name>
                    </person-group>
                    <article-title>Understanding the limits of large datasets</article-title>
                    <source>J Cancer Educ</source>
                    <year>2012</year>
                    <volume>27</volume>
                    <issue>4</issue>
                    <fpage>664</fpage>
                    <lpage>669</lpage>
                    <pub-id pub-id-type="doi">10.1007/s13187-012-0383-7</pub-id>
                    <pub-id pub-id-type="medline">22729362</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref111">
                <label>111</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Derman</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Models</article-title>
                    <source>Models.Behaving.Badly. Why Confusing Illusion with Reality Can Lead to Disaster, on Wall Street and in Life</source>
                    <year>2012</year>
                    <publisher-loc>New York, New York</publisher-loc>
                    <publisher-name>Free Press</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref112">
                <label>112</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kobayashi</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kishimoto</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Swearingen</surname>
                            <given-names>CJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Filopoulos</surname>
                            <given-names>MT</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ohara</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tokuda</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Oshikawa</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yoshida</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Utsunomiya</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kimura</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Okada</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Matsui</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yazici</surname>
                            <given-names>Y</given-names>
                        </name>
                    </person-group>
                    <article-title>Differences in clinical manifestations, treatment, and concordance rates with two major sets of criteria for Beh&#231;et's syndrome for patients in the US and Japan: data from a large, three-center cohort study</article-title>
                    <source>Mod Rheumatol</source>
                    <year>2013</year>
                    <volume>23</volume>
                    <issue>3</issue>
                    <fpage>547</fpage>
                    <lpage>553</lpage>
                    <pub-id pub-id-type="doi">10.1007/s10165-012-0696-8</pub-id>
                    <pub-id pub-id-type="medline">22752504</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref113">
                <label>113</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Jacobs</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>The pathologies of big data</article-title>
                    <source>Commun ACM</source>
                    <year>2009</year>
                    <volume>52</volume>
                    <issue>8</issue>
                    <fpage>36</fpage>
                    <pub-id pub-id-type="doi">10.1145/1536616.1536632</pub-id>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>
