<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v12i1e47744</article-id>
      <article-id pub-id-type="pmid">38446504</article-id>
      <article-id pub-id-type="doi">10.2196/47744</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Real-World Data Quality Framework for Oncology Time to Treatment Discontinuation Use Case: Implementation and Evaluation Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Chen</surname>
            <given-names>Qingyu</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kim</surname>
            <given-names>Hyo Jung</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Setia</surname>
            <given-names>Sajita</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Royce</surname>
            <given-names>Trevor</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Ru</surname>
            <given-names>Boshu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Center for Observational and Real-world Evidence (CORE)</institution>
            <institution>Merck &#38; Co, Inc</institution>
            <addr-line>770 Sumneytown Pike</addr-line>
            <addr-line>WP37A</addr-line>
            <addr-line>West Point, PA, 19486</addr-line>
            <country>United States</country>
            <phone>1 215 652 4301</phone>
            <email>boshu.ru@merck.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9620-1306</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Sillah</surname>
            <given-names>Arthur</given-names>
          </name>
          <degrees>MPH, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1065-6735</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Desai</surname>
            <given-names>Kaushal</given-names>
          </name>
          <degrees>MS, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8941-2858</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Chandwani</surname>
            <given-names>Sheenu</given-names>
          </name>
          <degrees>MPH, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0335-5750</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Yao</surname>
            <given-names>Lixia</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5187-6120</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Kothari</surname>
            <given-names>Smita</given-names>
          </name>
          <degrees>MBA, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5614-3332</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Center for Observational and Real-world Evidence (CORE)</institution>
        <institution>Merck &#38; Co, Inc</institution>
        <addr-line>West Point, PA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Boshu Ru <email>boshu.ru@merck.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>6</day>
        <month>3</month>
        <year>2024</year>
      </pub-date>
      <volume>12</volume>
      <elocation-id>e47744</elocation-id>
      <history>
        <date date-type="received">
          <day>30</day>
          <month>3</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>30</day>
          <month>6</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>11</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>14</day>
          <month>1</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Boshu Ru, Arthur Sillah, Kaushal Desai, Sheenu Chandwani, Lixia Yao, Smita Kothari. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 06.03.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2024/1/e47744" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The importance of real-world evidence is widely recognized in observational oncology studies. However, the lack of interoperable data quality standards in the fragmented health information technology landscape represents an important challenge. Therefore, adopting validated systematic methods for evaluating data quality is important for oncology outcomes research leveraging real-world data (RWD).</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to implement real-world time to treatment discontinuation (rwTTD) for a systemic anticancer therapy (SACT) as a new use case for the Use Case Specific Relevance and Quality Assessment, a framework linking data quality and relevance in fit-for-purpose RWD assessment.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>To define the rwTTD use case, we mapped the operational definition of rwTTD to RWD elements commonly available from oncology electronic health record–derived data sets. We identified 20 tasks to check the completeness and plausibility of data elements concerning SACT use, line of therapy (LOT), death date, and length of follow-up. Using descriptive statistics, we illustrated how to implement the Use Case Specific Relevance and Quality Assessment on 2 oncology databases (<italic>Data sets A and B</italic>) to estimate the rwTTD of an SACT drug (<italic>target SACT</italic>) for patients with advanced head and neck cancer diagnosed on or after January 1, 2015.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A total of 1200 (24.96%) of 4808 patients in Data set A and 237 (5.92%) of 4003 patients in Data set B received the target SACT, suggesting better relevance of the former in estimating the rwTTD of the target SACT. The 2 data sets differed with regard to the terminology used for SACT drugs, LOT format, and target SACT LOT distribution over time. Data set B appeared to have less complete SACT records, longer lags in incorporating the latest data, and incomplete mortality data, suggesting a lack of fitness for estimating rwTTD.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The fit-for-purpose data quality assessment demonstrated substantial variability in the quality of the 2 real-world data sets. The data quality specifications applied for rwTTD estimation can be expanded to support a broad spectrum of oncology use cases.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>data quality assessment</kwd>
        <kwd>real-world data</kwd>
        <kwd>real-world time to treatment discontinuation</kwd>
        <kwd>systemic anticancer therapy</kwd>
        <kwd>Use Case Specific Relevance and Quality Assessment</kwd>
        <kwd>UReQA framework</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The importance of real-world evidence drawn from real-world data (RWD) is widely recognized in oncology research [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref5">5</xref>]. Over the past decade, federal legislation and incentives promoting the secondary use of RWD in the United States [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>], coupled with advances in health information technology, have resulted in an explosion of RWD sources and a complex RWD ecosystem [<xref ref-type="bibr" rid="ref1">1</xref>]. However, this rich data landscape can also pose challenges in identifying fit-for-purpose RWD to meet biopharma research needs.</p>
        <p>Two key obstacles to identifying high-quality data are the fragmentation of RWD sources and the lack of interoperable data quality standards. These obstacles are particularly pertinent in the United States, where progress is slow in reaching full interoperability of data sourced from thousands of providers who customized their electronic health record (EHR) systems from solutions provided by &#62;40 different EHR software vendors [<xref ref-type="bibr" rid="ref9">9</xref>]. Therefore, adopting validated systematic methods for evaluating data quality is important for research leveraging RWD [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>In 2016, an expert panel proposed the concepts of <italic>conformance</italic>, <italic>completeness</italic>, and <italic>plausibility</italic> as 3 categories (with subcategories) to describe the intrinsic data quality of EHR databases and to serve as a framework for assessing data quality that could then be verified (with organizational data) or validated using an accepted gold standard [<xref ref-type="bibr" rid="ref13">13</xref>]. Several working groups and authors have applied these terms or proposed others for defining research data quality [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>], and multiple initiatives in the United States, both public and private, have developed frameworks and tools to evaluate and improve the quality of EHR data sets [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref21">21</xref>] and to implement model-driven, quantitative approaches to address RWD completeness and plausibility issues [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]. However, there is no single RWD source that can fit the needs of all studies, and the selection of RWD to support an individual use case must also consider data relevance and measurement thresholds in addition to data quality.</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>In a previous study, we introduced the Use Case Specific Relevance and Quality Assessment (UReQA) framework, an RWD quality framework that combines both the data quality and the relevance aspects of assessing RWD, with the goal of developing data quality assessment specifications tailored to use cases [<xref ref-type="bibr" rid="ref3">3</xref>]. In this study, we aimed to implement this framework in the use case for estimating real-world time to treatment discontinuation (rwTTD) in oncology. Our work had two main components: (1) to design comprehensive data quality assessment checks for estimating rwTTD for a systemic anticancer therapy (SACT) and (2) to illustrate how these quality checks can be used to evaluate EHR-derived RWD products.</p>
        <p>We selected rwTTD as the first use case to implement the UReQA framework because of its high utility as a pragmatic real-world effectiveness end point for continuously administered SACTs (such as immunotherapies) and its known correlation with overall survival [<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref28">28</xref>]. Moreover, the estimation of rwTTD requires information on medication use patterns, mortality, and follow-up. These data elements are foundational to outcomes research. Therefore, implementation of the rwTTD use case can be expanded to other use cases in or beyond oncology, as well as different data sources, such as claims databases.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study used 2 commercially licensed deidentified structured secondary data sources accessible to the study team. It was exempted from institutional review board review because of the following: (1) each data source contains a significant level of protection against the release of personal information to outside entities and (2) the use of such databases presents the lowest risk to potential subjects because the analysis involves only anonymous data; hence, conducting the study will not place the subjects at risk.</p>
      </sec>
      <sec>
        <title>Study Overview</title>
        <p>This study comprised four main steps: (1) conceptual definition of the rwTTD use case; (2) mapping of the rwTTD use case definition to RWD elements (operational definition); (3) identifying data quality checks for the required data elements to determine rwTTD for an SACT, designated the “target SACT”; and (4) implementing the UReQA framework [<xref ref-type="bibr" rid="ref3">3</xref>] in assessing the RWD fitness for estimating rwTTD. The data quality assessment was undertaken on 2 US EHR-based oncology databases for estimating rwTTD for a target SACT, an immunotherapy drug that is administered intravenously in advanced-stage head and neck cancer (HNC). The targeted SACT received approval in 2016 for the treatment of previously treated advanced HNC and in 2019 for its use as a first-line therapy in advanced HNC. The focus of this study is on designing data quality assessment methods that are tailored for specific use cases, rather than calculating rwTTD for a particular medication. Therefore, we mask the name of the actual drug product.</p>
      </sec>
      <sec>
        <title>Step 1: Conceptual Definition of the rwTTD Use Case</title>
        <p>The end point, rwTTD, is defined as the length of time from initiation to discontinuation of a medication <italic>([date of last recorded dose – date of first recorded dose] + 1 d</italic>), with discontinuation defined as the date of the last dose if a patient died during therapy or initiated a new treatment or if there is a gap of ≥120 days between the last recorded dose and last recorded activity in a data set. Patients who do not meet the discontinuation criteria are censored at the last medication use [<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref28">28</xref>].</p>
      </sec>
      <sec>
        <title>Step 2: Mapping of the rwTTD Use Case Definition to RWD Elements</title>
        <p>Owing to the variations in data element definition and data structures between real-world EHR databases, we need to operationalize the concept of rwTTD by deconstructing its definition and mapping it to four sets of required data elements that are commonly available from oncology EHR–derived data sets: (1) SACT, (2) line of therapy (LOT) specifying the regimen names and sequence of current treatment in the treatment plan [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>], (3) mortality status, and (4) follow-up time, as summarized in <xref ref-type="table" rid="table1">Table 1</xref>. Although SACT, mortality status, and follow-up time are often recorded directly as procedure, prescription, and administrative events in raw EHR databases, the LOT was often derived from raw EHR by the algorithm.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Required data elements for determining real-world time to treatment discontinuation (rwTTD) for a systemic anticancer therapy (SACT) drug in a specific line of therapy (LOT).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="530"/>
            <col width="440"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Operational steps to ascertain rwTTD and type of data category</td>
                <td>Commonly used data elements</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Identify records of the drug of interest</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SACT drug</td>
                <td>Drug_name, NDC<sup>a</sup>, HCPCS<sup>b</sup> code, RxNorm code</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SACT administration</td>
                <td>Drug administration date<sup>c</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>SACT order</td>
                <td>Drug order date<sup>d</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Identify discontinuation date from subsequent LOT start date</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LOT</td>
                <td>LOT name<sup>e</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LOT</td>
                <td>LOT number</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LOT</td>
                <td>LOT start date</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LOT</td>
                <td>LOT end date</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>If no subsequent LOT, identify discontinuation date from patient death record during treatment</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mortality status</td>
                <td>Vital status or date of death</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>If no date of death, identify discontinuation date by last follow-up date subheading</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Last follow-up</td>
                <td>Date of last follow-up<sup>f</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>NDC: National Drug Code.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>HCPCS: Healthcare Common Procedure Coding System.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>The drug administration date is defined as the date of receiving medication at a health care facility as a medical service, often applicable to an intravenous drug.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>The drug order date is defined as the order date for drugs used at home, often applicable to an oral drug.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>The LOT name is determined by the combination of SACT drugs administered or ordered from the LOT start to end dates.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>The date of last follow-up is defined as the last documented clinic visit or procedure in the electronic health record.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>We defined SACT as any systemic anticancer medication received by the patient, documented as given either by a health care provider at the site of care (eg, by infusion), with the date defined as the “administration” date, or as a prescription to take or apply at home, with the date defined as the “drug order” date. The number of refills (or alternative data elements such as days of supply or expected medication end date) was used to determine the last use of oral drugs (<xref ref-type="table" rid="table1">Table 1</xref>).</p>
        <p>LOT was defined as the sequence of the SACT regimens prescribed for an individual patient, as previously described in detail [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. In brief, the first LOT (line 1 [1L]) begins with the first SACT initiated after a study index date (often the advanced or metastatic cancer diagnosis date), and any other drug introduced within the next 28 days is considered part of that LOT [<xref ref-type="bibr" rid="ref29">29</xref>]. We defined the start of a new LOT when a new SACT not belonging to the prior LOT was introduced or if a new SACT was initiated after a ≥120-day gap in therapy.</p>
        <p>Because the target SACT was administered intravenously, we omitted 2 tasks applicable only to oral target SACTs: the check of patient numbers with target drug order date after the index date (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, task 6 [<xref ref-type="bibr" rid="ref13">13</xref>]) and the check for distribution of gaps between drug order dates (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, task 9).</p>
        <p>The patient mortality status was determined based on the recorded dates of death. For patients who were still alive at data cutoff, the date of the last follow-up was defined as the last documented clinical activity date in the EHR (<xref ref-type="table" rid="table1">Table 1</xref>).</p>
      </sec>
      <sec>
        <title>Step 3: Identifying Data Quality Checks for Required Data Elements</title>
        <p>For each of the required data elements, we identified corresponding verification checks to assess data quality at both the variable level and the cohort level. A total of 20 data quality checks (tasks) were identified and categorized into the quality dimensions of conformance, completeness, and plausibility, as per the harmonized data quality assessment terms and framework developed by Kahn et al [<xref ref-type="bibr" rid="ref13">13</xref>] (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Our goal in creating these tasks was to develop a comprehensive toolbox for assessing data quality for the rwTTD use case. However, when adapting them to a specific RWD database and a SACT drug of interest, not every task and check would be necessary. For example, the checks for LOT, mortality, and follow-up are not needed if a data set already provides the reason for discontinuation and censored status for each drug exposure. In addition, tasks 3-5 were applicable to cancer therapies received in hospitals or clinics as intravenous or infusion procedures, whereas tasks 4-9 were dedicated to oral cancer therapies that were mostly self-administrated at home. As tracking the actual time patients took oral therapies was infeasible, researchers examined days supply and refill records to estimate the drug exposure period. Therefore, when investigating the rwTTD of an oral SACT drug, it is necessary to check the completeness of these oral therapy–specific data elements (task 7).</p>
      </sec>
      <sec>
        <title>Step 4: Implementing the rwTTD Use Case for Assessing 2 RWD Sets</title>
        <sec>
          <title>Data Set Preassessment</title>
          <p>We followed the preassessment step in UReQA [<xref ref-type="bibr" rid="ref3">3</xref>] to identify 2 anonymized, commercially available US real-world oncology databases, designated as <italic>Data set A</italic> and <italic>Data set</italic> <italic>B</italic> in this report, which included patients with advanced (metastatic or unresectable, recurrent) HNC. Both databases contained data elements sourced from structured and unstructured information captured within health care providers’ EHR systems as part of routine cancer care.</p>
        </sec>
        <sec>
          <title>Cohort Selection and Patient Characteristics</title>
          <p>Data set A was commercialized and included patients with advanced HNC, whereas Data set B included patients with all stages of HNC. To align the 2 patient populations as having advanced HNC, we restricted Data set B to the subset of patients with HNC and a record of the American Joint Committee on Cancer stage IV and <italic>International Classification of Diseases</italic> (ICD), <italic>revision 9 or 10</italic> (ICD-9 or ICD-10) code for metastatic tumor (ICD-9 codes 196.x, 197.x, and 198.x and ICD-10 codes C76.x, C77.x, and C78.x). The distributions of the patient characteristics were then tabulated for the 2 data sets.</p>
        </sec>
        <sec>
          <title>Data Elements Harmonization</title>
          <p>In Data set A, the names of SACT medications were harmonized from clinic formulary information and medical service records to standard generic drug names in a commercial drug database along with drug category information. In Data set B, all medication records in the raw EHR data were harmonized into the RxNorm code [<xref ref-type="bibr" rid="ref31">31</xref>]; however, drug category information was not available. To harmonize all SACT medication in Data set B, we retrieved the RxNorm codes for generic names of all SACT medications using the RxNav software developed by and available from the US National Library of Medicine [<xref ref-type="bibr" rid="ref32">32</xref>].</p>
          <p>The LOT information was previously derived by both data providers but was presented differently in the 2 data sets. In Data set A, the LOT table provided the LOT number, LOT regimen name, LOT start date, and LOT end date, with a flag indicative of maintenance therapy, as appropriate. Instead, Data set B included only the LOT number and LOT start date. Therefore, to evaluate the LOT information in Data set B, we indirectly deduced the end date of each LOT as the date before the start of the next LOT or as the data cutoff date for the last LOT in the data set. Then, all individual SACT medications administered or ordered between the LOT start and end dates were combined to serve as the LOT regimen name. This approach was a necessary but imperfect solution because the LOT end date and the LOT regimen name should ideally be generated using a more rigorous algorithm [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>].</p>
          <p>The date of death was provided at the month and day levels in Data set A, whereas in Data set B, the death date was aggregated by year. Given the relatively short length of survival of many patients with advanced HNC [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref36">36</xref>], the allocation of death dates by year was not sufficiently granular for accurate rwTTD calculation; better precision (ie, month of death) would be needed for accurate rwTTD calculation. Consequently, quality assessment tasks related to mortality variables were omitted (task 17) for Data set B.</p>
        </sec>
        <sec>
          <title>Reporting the Verification Results</title>
          <p>Descriptive statistics were used to summarize the results of implementing rwTTD data quality checks on Data sets A and B. We used frequencies to summarize categorical variables and mean (SD) and median (IQR or range) to summarize continuous variables. The study index date was the date of first advanced HNC diagnosis, and the cutoff date was November 25, 2019.</p>
          <p>All analyses were conducted using SAS Studio release 3.8 (Basic Edition; SAS Institute, Inc).</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Patient Characteristics</title>
        <p>Data set A included 7366 patients with advanced HNC, and we identified 11,386 patients in Data set B with advanced HNC. The median patient age at the first advanced HNC diagnosis was 65 (IQR 58-72) years in Data set A and 61 (IQR 54-68) years in Data set B, and the percentages of male individuals were 74.16% (5643/7366) and 69.97% (7967/11386), respectively (<xref ref-type="table" rid="table2">Table 2</xref>), similar to the HNC population data from the United States [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref37">37</xref>].</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Baseline characteristics of patients with advanced head and neck cancer (HNC) included in 2 data sets under evaluation<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="520"/>
            <col width="220"/>
            <col width="230"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Characteristic</td>
                <td>Data set A (n=7366)</td>
                <td>Data set B (n=11,386)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Sex, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>1723 (23.4)</td>
                <td>3408 (29.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>5643 (76.6)</td>
                <td>7967 (70)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Missing or unknown</td>
                <td>0 (0)</td>
                <td>11 (0.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Age at first advanced HNC diagnosis (y), median (IQR)</td>
                <td>65 (58-72)</td>
                <td>61 (54-68)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Age at first advanced HNC diagnosis (y), n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#60;18</td>
                <td>0 (0)</td>
                <td>31 (0.27)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>18-44</td>
                <td>187 (2.53)</td>
                <td>688 (6.04)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>45-64</td>
                <td>3402 (46.19)</td>
                <td>5955 (52.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>65-88</td>
                <td>3777 (51.28)</td>
                <td>4111 (36.11)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥89</td>
                <td>0 (0)</td>
                <td>6 (0.05)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Missing or unknown</td>
                <td>0 (0)</td>
                <td>595 (5.23)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Race or ethnicity, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>American Indian or Alaska Native</td>
                <td>N/A<sup>b</sup></td>
                <td> 40 (0.35)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asian</td>
                <td>103 (1.4)</td>
                <td>165 (1.45)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Black or African American</td>
                <td>487 (6.61)</td>
                <td>1250 (10.98)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hispanic or Latino</td>
                <td>13 (0.18)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Native Hawaiian or other Pacific Islander</td>
                <td>N/A</td>
                <td>6 (0.05)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>White</td>
                <td>4939 (67.05)</td>
                <td>9239 (81.14)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Missing</td>
                <td>650 (8.82)</td>
                <td>686 (6.02)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other race</td>
                <td>1174 (15.94)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>AJCC<sup>c</sup> stage at first HNC diagnosis, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0</td>
                <td>2 (0.03)</td>
                <td>28 (0.25)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I</td>
                <td>419 (5.69)</td>
                <td>603 (5.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>II</td>
                <td>505 (6.86)</td>
                <td>542 (4.76)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>III</td>
                <td>929 (12.61)</td>
                <td>798 (7.01)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>IV</td>
                <td>4330 (58.78)</td>
                <td>4978 (43.72)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Missing or unknown</td>
                <td>1181 (16.03)</td>
                <td>4437 (38.97)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Year of first advanced HNC diagnosis, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Before 2006</td>
                <td>0 (0)</td>
                <td>1245 (10.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2006-2009</td>
                <td>0 (0)</td>
                <td>1537 (13.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2010-2012</td>
                <td>1068 (14.5)</td>
                <td>2721 (23.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2013-2018</td>
                <td>5435 (73.8)</td>
                <td>5577 (49.0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2019 or later</td>
                <td>863 (11.7)</td>
                <td>306 (2.7)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Percentages may not add up to 100% because of rounding.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>AJCC: American Joint Committee on Cancer.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>SACT Data Checks</title>
        <p>Overall, 75.91% (5592/7366) and 38.74% (4411/11386) of the patients in Data sets A and B, respectively, had a recorded drug administration or drug order for any SACT (<xref ref-type="table" rid="table3">Table 3</xref>, task 1). A complete start date (y, mo, and d) was recorded for all SACT administrations and orders in both data sets (<xref ref-type="table" rid="table3">Table 3</xref>, tasks 4 and 8).</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Data quality assessment of SACT<sup>a</sup> administration and order records after the advanced HNC<sup>b</sup> diagnosis<sup>c</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="600"/>
            <col width="0"/>
            <col width="190"/>
            <col width="0"/>
            <col width="180"/>
            <thead>
              <tr valign="top">
                <td colspan="3">SACT data quality checks</td>
                <td colspan="2">Data set A</td>
                <td>Data set B</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Task 1: patients with any SACT drug administration or order record after the advanced HNC diagnosis date, n (%)<sup>d</sup></td>
                <td colspan="2">5592 (75.9)</td>
                <td>4411 (38.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Task 2: SACT drug records with missing drug identity (name and code) information</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Value, n (%)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">0 (0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Normalization of medication name</td>
                <td colspan="2">Normalized generic name</td>
                <td colspan="2">RxNorm ingredient level</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 3: patients with target SACT administration date after the advanced HNC diagnosis date, 2015 onward, % (n/N)<sup>e</sup></td>
                <td colspan="2">24.96 (1200/4808)</td>
                <td>5.92 (237/4003)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 4: SACT drug administration records with complete administration date, n (%)</td>
                <td colspan="2">425,505 (100)</td>
                <td>37,662 (100)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 5: gap (in d) between the target SACT drug administration dates, median (IQR; range)</td>
                <td colspan="2">21 (21-21; 1-113)</td>
                <td>21 (11-21; 1-824)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 6: patients with target SACT order date after the advanced HNC diagnosis date</td>
                <td colspan="2">N/A<sup>f,g</sup></td>
                <td>N/A<sup>g</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 7 SACT drug order records with complete days supply and refill information, n (%)</td>
                <td colspan="2">1732 (53.4)</td>
                <td>N/A<sup>h</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 8: SACT drug order records with complete order date, n (%)<sup>i</sup></td>
                <td colspan="2">3241 (100)</td>
                <td>8380 (100)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 9: distribution of gaps (in d) between target SACT drug order dates, normalized by days supply, refill, and cancelation record</td>
                <td colspan="2">N/A<sup>g</sup></td>
                <td>N/A<sup>g</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>SACT: systemic anticancer therapy.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>HNC: head and neck cancer.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>Drug <italic>administration</italic> refers to drugs administered by health care providers at the site of care, whereas drug <italic>order</italic> refers to prescriptions for drugs used at home.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>Task 1 was applied to the full data sets, including 7366 and 11,386 patients in Data sets A and B, respectively.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>Task 3 was applied for patients with the first advanced HNC diagnosis on or after January 1, 2015, including 4808 and 4003 patients in Data sets A and B, respectively.</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>f</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table3fn7">
              <p><sup>g</sup>Tasks 6 and 9 were not conducted because they apply to an oral target SACT.</p>
            </fn>
            <fn id="table3fn8">
              <p><sup>h</sup>Information about the number of refills, days supply, or alternative data elements was not available in Data set B.</p>
            </fn>
            <fn id="table3fn9">
              <p><sup>i</sup>The total number of drug order records in Data set A (3241) and Data set B (8380) was used as the denominator in task 8.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>We determined that 4808 (65.27%) of the 7366 patients in Data set A and 4003 (35.16%) of the 11,386 patients in Data set B had a first advanced HNC diagnosis on or after January 1, 2015, the timeline we applied for the study index date as it covered the key diagnostic and therapeutic timeline of the target SACT (first approved in 2016). A total of 1200 (24.96%) of the 4808 patients meeting this timeline in Data set A and 237 (5.92%) of the 4003 patients meeting this timeline in Data set B had a record of receiving the target SACT (<xref ref-type="table" rid="table3">Table 3</xref>, task 3).</p>
        <p>The median length of the gap between target SACT administrations was 21 days in both the data sets, which aligned with the expected dose schedule for the target SACT (<xref ref-type="table" rid="table3">Table 3</xref>, task 5). However, the range of the gap was considerably shorter in Data set A (1-113 d) than in Data set B (1-824 d), suggesting incomplete target SACT administration records in Data set B.</p>
        <p>For the oral SACT records, Data set A included the number of refills and a flag for canceled medication orders, whereas Data set B did not provide refill information (<xref ref-type="table" rid="table3">Table 3</xref>, task 7). This could impact the accuracy of calculating rwTTD for an orally dispensed SACT because the drug orders for patients remaining on treatment through refills would not be recorded in the database.</p>
      </sec>
      <sec>
        <title>LOT Data Checks</title>
        <p>The 2 data sets differed in terms of the target SACT LOT distribution over time. The cumulative frequency of target SACT initiation, including as monotherapy or combination therapy and in any LOT, tended to be greater in later years in Data set A, peaking in the third quarter (Q3) of 2019, than in Data set B, peaking in the first and second quarters of 2018 (<xref rid="figure1" ref-type="fig">Figure 1</xref>, task 10). In Data set A, a greater frequency of target SACT initiation as second-line or later monotherapy was consistent with approval timing in this setting (2016), which preceded the first-line approvals (2019). The later time points for second-line or later monotherapy initiation in Data set B suggest the possibility of longer data lags than for Data set A.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Task 10: number of patients initiating the target systemic anticancer therapy (SACT) by year and quarter in (A) Data set A and (B) Data set B. Note: Y-axis heights in panels A and B differ but were selected to best depict the patient numbers in Data sets A and B. 1L: first-line therapy; 2L+: second-line or later therapy; combo: target SACT in any combination therapy (approved or not approved); mono: target SACT monotherapy; Q1: first quarter; Q2: second quarter; Q3: third quarter; Q4: fourth quarter.</p>
          </caption>
          <graphic xlink:href="medinform_v12i1e47744_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>In both data sets, we observed the inclusion of patients who initiated the target SACT therapy before the applicable first-line or second-line or later US Food and Drug Administration approval dates. We believe that these are true real-world findings, which do not always correspond to recommended or approved indications, rather than data quality issues.</p>
        <p>In Data set B, only 40.3% (4589/11386) of patients had SACT LOT records (<xref ref-type="table" rid="table4">Table 4</xref>, task 11), which coincides with the finding of lower-than-expected SACT drug administration and order rates (<xref ref-type="table" rid="table3">Table 3</xref>, task 1).</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>LOT<sup>a</sup> rules for SACT<sup>b</sup> and mortality information.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="580"/>
            <col width="0"/>
            <col width="190"/>
            <col width="0"/>
            <col width="170"/>
            <col width="0"/>
            <col width="0"/>
            <col width="0"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Task</td>
                <td colspan="2">Data set A</td>
                <td colspan="2">Data set B</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Task 10: number of patients initiating the target SACT by year and quarter</td>
                <td colspan="2"><xref rid="figure1" ref-type="fig">Figure 1</xref>A</td>
                <td colspan="2"><xref rid="figure1" ref-type="fig">Figure 1</xref>B</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Task 11: completeness of LOT information, n (%)<sup>c</sup></bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Patients with complete line number</td>
                <td colspan="2">5594 (75.94)</td>
                <td colspan="2">4589 (40.3)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Patients with complete line name</td>
                <td colspan="2">5594 (75.94)</td>
                <td colspan="2">N/A<sup>d,e</sup></td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Patients with complete line start date</td>
                <td colspan="2">5594 (75.94)</td>
                <td colspan="2">4589 (40.3)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Patients with complete line end date</td>
                <td colspan="2">5594 (75.94)</td>
                <td colspan="2">N/A<sup>e</sup></td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 12: patients for whom the first LOT number after the advanced HNC<sup>f</sup> diagnosis date was not 1, n (%)<sup>c</sup></td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">434 (3.81)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Task 13: distribution of LOT number at target SACT initiation</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Patients who received the target SACT, n</td>
                <td colspan="2">1200</td>
                <td colspan="2">237</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Line 1, n (%)</td>
                <td colspan="2">481 (40.08)</td>
                <td colspan="2">65 (27.43)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Line 2, n (%)</td>
                <td colspan="2">486 (40.5)</td>
                <td colspan="2">92 (38.82)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Line 3, n (%)</td>
                <td colspan="2">161 (13.42)</td>
                <td colspan="2">54 (22.78)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Line 4, n (%)</td>
                <td colspan="2">46 (3.83)</td>
                <td colspan="2">16 (6.75)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Line 5, n (%)</td>
                <td colspan="2">13 (1.83)</td>
                <td colspan="2">10 (4.22)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Lines 6-10, n (%)</td>
                <td colspan="2">13 (1.83)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Task 14: use of target SACT in 1L<sup>g</sup> before approval date</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="7">
                  <bold>1L monotherapy</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Patients who received target SACT, % (n/N)</td>
                <td colspan="2">78.37 (377/481)</td>
                <td colspan="4">67.69 (44/65)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">First administration date<sup>h</sup> in database</td>
                <td colspan="2">July 15, 2015</td>
                <td colspan="4">November 10, 2014</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Cutoff date for the earliest 5% receipt</td>
                <td colspan="2">August 29, 2016</td>
                <td colspan="4">February 4, 2016</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Cutoff date for the earliest 10% receipt</td>
                <td colspan="2">November 3, 2016</td>
                <td colspan="4">September 23, 2016</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Cutoff date for the earliest 25% receipt</td>
                <td colspan="2">June 28, 2017</td>
                <td colspan="4">April 27, 2017</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="7">
                  <bold>Approved 1L combination</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Patients who received the target SACT in approved 1L combination, % (n/N)</td>
                <td colspan="2">7.69 (37/481)</td>
                <td colspan="4">6.15 (4/65)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">First administration date in database</td>
                <td colspan="2">December 18, 2018</td>
                <td colspan="4">July 1, 2019</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Cutoff date for the earliest 5% receipt</td>
                <td colspan="2">February 18, 2019</td>
                <td colspan="4">N/A<sup>i</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Cutoff date for the earliest 10% receipt</td>
                <td colspan="2">April 2, 2019</td>
                <td colspan="4">N/A<sup>i</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td colspan="2">Cutoff date for the earliest 25% receipt</td>
                <td colspan="2">July 9, 2019</td>
                <td colspan="4">N/A<sup>i</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 15: patients with death record, n (%)<sup>c</sup></td>
                <td colspan="2">4695 (63.74)</td>
                <td colspan="2">3531 (31)</td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 16: patients with multiple death records on different dates, n (%)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">N/A<sup>j</sup></td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Task 17: patients with clinical records showing health care activity after death date (n=4695), n (%)</bold>
                </td>
                <td colspan="2">1497 (31.88)</td>
                <td colspan="2">N/A<sup>j</sup></td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">≥1 d after date of death</td>
                <td colspan="2">1436 (30.59)</td>
                <td colspan="2">N/A<sup>j</sup></td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">≥3 d after date of death</td>
                <td colspan="2">1290 (27.48)</td>
                <td colspan="2">N/A<sup>j</sup></td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">≥7 d after date of death</td>
                <td colspan="2">1002 (21.34)</td>
                <td colspan="2">N/A<sup>j</sup></td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">≥30 d after date of death</td>
                <td colspan="2">79 (1.68)</td>
                <td colspan="2">N/A<sup>j</sup></td>
                <td colspan="3">
                  <break/>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup> LOT: line of therapy.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>SACT: systemic anticancer therapy.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>Tasks 11, 12, and 15 were applied to the full data sets, including 7366 and 11,386 patients in Data sets A and B, respectively.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table4fn5">
              <p><sup>e</sup>Line name and line end date were not available in Data set B.</p>
            </fn>
            <fn id="table4fn6">
              <p><sup>f</sup>HNC: head and neck cancer.</p>
            </fn>
            <fn id="table4fn7">
              <p><sup>g</sup>1L: first line of therapy after the advanced HNC diagnosis date.</p>
            </fn>
            <fn id="table4fn8">
              <p><sup>h</sup>Dates are written as month/day/year.</p>
            </fn>
            <fn id="table4fn9">
              <p><sup>i</sup>Not calculated as only 4 patients received the target SACT in a 1L combination LOT.</p>
            </fn>
            <fn id="table4fn10">
              <p><sup>j</sup>Only the year of death was available in Data set B.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The LOT start date in both data sets included year, month, and day, and the minimum LOT number started from 1 (first line) after the earliest advanced HNC diagnosis date for all but 3.81% (434/11386) of the patients in Data set B (<xref ref-type="table" rid="table4">Table 4</xref>, task 12). A line number other than 1 after the advanced HNC diagnosis date suggests that either a definition different from the commonly used definition [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>] was used or that there was an earlier advanced HNC diagnosis date that was not documented.</p>
        <p>In Data set A, 40.08% (481/1200) of patients received the target SACT in first-line therapy and 59.91% (719/1200) in second-line or later therapy, including 13.42% (161/1200) in third-line therapy (<xref ref-type="table" rid="table4">Table 4</xref>, task 13). In Data set B, 27.4% (65/237) of patients received the target SACT in first-line therapy, and 72.6% (172/237) received it in the second-line or later therapy, with frequent third-line receipt (54/237, 22.8%). Therefore, LOT rules may have been applied differently in Data set A and Data set B.</p>
        <p>Complete information about the start date of first-line target SACT drug administration (as both monotherapy and combination therapy) was available for 377+37=414 (86.1%) of 481 patients in Data set A and 44+4=48 (74%) of 65 patients in Data set B (<xref ref-type="table" rid="table4">Table 4</xref>, task 14). In Data set A, first-line target SACT monotherapy was initiated for the first time in 2015, and approximately 5% of first-line monotherapy initiation dates fell on or before 2016, when the target SACT was approved for second-line or later therapy. Target SACT in combination therapy was first initiated in late 2018, with approximately 25% of the initiation dates falling before the start of Q3 in 2019, shortly after the approval of first-line combination therapy. In Data set B, first-line target SACT monotherapy initiation was first recorded in the fourth quarter in 2014, earlier than in Data set A, and close to 10% of initiation dates occurred before the end of Q3 in 2016. Instead, the approved target SACT combination therapy was first initiated at the start of Q3 in 2019, in line with the approval date for this indication.</p>
      </sec>
      <sec>
        <title>Mortality Data</title>
        <p>Among 7366 and 11,386 patients in Data sets A and B, 4695 (63.74%) and 3531 (31%), respectively, had a recorded date of death (<xref ref-type="table" rid="table4">Table 4</xref>, task 15); and 4427 (60%) and 3093 (27%) patients, respectively, had death records within 3 years after the date of advanced HNC diagnosis. These percentage differences indicate that Data set B may have incomplete mortality records (or a high loss to follow-up).</p>
        <p>In Data set A, one-third of patients (1497/4695, 31.88%) with a recorded date of death had clinical records recorded after the death date (<xref ref-type="table" rid="table4">Table 4</xref>, task 17), with a median of 11 days from the death date to the last activity date. Thus, clinical records could be entered into the health information system after the reported death date, but extreme values (eg, &#62;30 d after the death date) might indicate integrity issues in collecting mortality data. This information was not available for Data set B, in which the dates of death were recorded only by year.</p>
      </sec>
      <sec>
        <title>Follow-Up Data</title>
        <p>In Data set A, most patients (5840/7366, 79.28% to 7269/7366, 99.86%) had recorded data for diagnosis, drug records, laboratory results, facility visits, and vital sign measurements (<xref ref-type="table" rid="table5">Table 5</xref>, task 18). Similarly, in the subset of 7754 patients in Data set B whose advanced HNC diagnosis date was on or after January 1, 2011, the earliest date in Data set A, these data categories were also recorded for most patients (6123/7754, 78.97% to 6893/7754, 88.7%). Records of medical procedures not related to drug administration and genomic testing were not available in Data set A, which could result in inaccurate estimates of follow-up times.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Unique number of patients and patient-date pairs after the advanced HNC<sup>a</sup> diagnosis date (task 18): follow-up data for patients with advanced HNC diagnosis on or after January 1, 2011.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="220"/>
            <col width="190"/>
            <col width="140"/>
            <col width="80"/>
            <col width="0"/>
            <col width="170"/>
            <col width="120"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td>Variable</td>
                <td colspan="4">Data set A (n=7366)</td>
                <td colspan="3">Data set B (n=7754)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Value, n (%)</td>
                <td>Unique patient-date pairs, n</td>
                <td>Pairs per patient, n</td>
                <td colspan="2">Value, n (%)</td>
                <td>Unique patient-date pairs, n</td>
                <td>Pairs per patient, n</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Diagnosis</td>
                <td>6567 (89.15)</td>
                <td>60,178</td>
                <td>9.2</td>
                <td colspan="2">6893 (88.9)</td>
                <td>370,671</td>
                <td>53.8</td>
              </tr>
              <tr valign="top">
                <td>Drug records<sup>b</sup></td>
                <td>5840 (79.28)</td>
                <td>113,948</td>
                <td>19.5</td>
                <td colspan="2">6802 (87.72)</td>
                <td>269,225</td>
                <td>39.6</td>
              </tr>
              <tr valign="top">
                <td>Laboratory records</td>
                <td>6860 (93.13)</td>
                <td>179,177</td>
                <td>26.1</td>
                <td colspan="2">6403 (82.58)</td>
                <td>147,314</td>
                <td>23</td>
              </tr>
              <tr valign="top">
                <td>Facility visit</td>
                <td>7269 (98.68)</td>
                <td>274,714</td>
                <td>37.8</td>
                <td colspan="2">6838 (88.19)</td>
                <td>392,175</td>
                <td>57.4</td>
              </tr>
              <tr valign="top">
                <td>Vital sign measurements</td>
                <td>7254 (98.48)</td>
                <td>233,623</td>
                <td>32.2</td>
                <td colspan="2">6123 (78.97)</td>
                <td>217,797</td>
                <td>35.6</td>
              </tr>
              <tr valign="top">
                <td>Nondrug medical procedure</td>
                <td>N/A<sup>c</sup></td>
                <td>N/A</td>
                <td>N/A</td>
                <td colspan="2">6740 (86.92)</td>
                <td>390,556</td>
                <td>57.9</td>
              </tr>
              <tr valign="top">
                <td>Genomic test</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td colspan="2">118 (1.52)</td>
                <td>208</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>Biomarker test</td>
                <td>440 (5.97)</td>
                <td>469</td>
                <td>1.1</td>
                <td colspan="2">N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>ECOG PS<sup>d</sup></td>
                <td>5416 (73.53)</td>
                <td>100,607</td>
                <td>17.7</td>
                <td colspan="2">N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>HNC: head and neck cancer.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>Any drug, not just systemic anticancer therapies.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>ECOG PS: Eastern Cooperative Oncology group performance status.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The median frequency of visits (normalized by length between first and last target SACT administration) for patients who received the target SACT was somewhat less in Data set A, varying from 0.05 to 0.12, depending on treatment line, than in Data set B, in which it varied from 0.14 to 0.18 (<xref ref-type="table" rid="table6">Table 6</xref>, task 19). This might indicate that more clinical activities were recorded in Data set B during treatment.</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Follow-up data for patients with advanced HNC<sup>a</sup> diagnosis on or after January 1, 2011.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="300"/>
            <col width="0"/>
            <col width="90"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="90"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="110"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Task</td>
                <td colspan="6">Data set A (n=7366)</td>
                <td colspan="5">Data set B (n=7754)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">Value, n</td>
                <td colspan="2">Value, median (IQR; range)</td>
                <td colspan="2">Value, mean (SD)</td>
                <td colspan="2">Value, n</td>
                <td colspan="2">Value, median (IQR; range)</td>
                <td>Value, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="14">
                  <bold>Task 19: frequency of visits during target SACT<sup>b,c</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1L<sup>d</sup> combination therapy</td>
                <td colspan="2">101</td>
                <td colspan="2">0.11 (0.07-0.16; 0.02-0.33)</td>
                <td colspan="2">0.13 (0.07)</td>
                <td colspan="2">19</td>
                <td colspan="2">0.17 (0.11-0.24; 0-0.36)</td>
                <td colspan="2">0.17 (0.09)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1L monotherapy</td>
                <td colspan="2">358</td>
                <td colspan="2">0.05 (0.05-0.08; 0.01-0.50)</td>
                <td colspan="2">0.07 (0.05)</td>
                <td colspan="2">44</td>
                <td colspan="2">0.18 (0.09-0.22; 0-0.48)</td>
                <td colspan="2">0.16 (0.11)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2L+<sup>e</sup> monotherapy</td>
                <td colspan="2">634</td>
                <td colspan="2">0.06 (0.05-0.10; 0.01-0.95)</td>
                <td colspan="2">0.08 (0.06)</td>
                <td colspan="2">106</td>
                <td colspan="2">0.13 (0.07-0.25; 0-0.75)</td>
                <td colspan="2">0.17 (0.14)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>All other</td>
                <td colspan="2">104</td>
                <td colspan="2">0.12 (0.09-0.17; 0.02-0.48)</td>
                <td colspan="2">0.14 (0.08)</td>
                <td colspan="2">76</td>
                <td colspan="2">0.14 (0.09-0.21; 0-1.3)</td>
                <td colspan="2">0.17 (0.17)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Task 20: for patients still alive, gap (in d) from the last target SACT administration and last visit<sup>f</sup></td>
                <td colspan="2">708</td>
                <td colspan="2">28 (6-187; 0-1118)</td>
                <td colspan="2">128 (199)</td>
                <td colspan="2">167</td>
                <td colspan="2">70 (29-223; 0-1755)</td>
                <td>159 (215)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>HNC: head and neck cancer.</p>
            </fn>
            <fn id="table6fn2">
              <p><sup>b</sup>SACT: systemic anticancer therapy.</p>
            </fn>
            <fn id="table6fn3">
              <p><sup>c</sup>Frequency defined as number of visits between the first and last target SACT administration dates within the same LOT number and name, divided by number of days between the last and first target SACT administration.</p>
            </fn>
            <fn id="table6fn4">
              <p><sup>d</sup>1L: first line of therapy after the advanced HNC diagnosis date.</p>
            </fn>
            <fn id="table6fn5">
              <p><sup>e</sup>2L+: second-line or later therapy.</p>
            </fn>
            <fn id="table6fn6">
              <p><sup>f</sup>Limited to patients who (1) were still alive ≥180 days after last receipt of target SACT and (2) received last dose of target SACT ≥180 days before data cutoff on November 25, 2019 (thus on or before May 29, 2019).</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study identified 20 data quality assessment tasks for the use case of estimating the rwTTD of an SACT. By executing the 18 tasks pertinent to the intravenously administered target SACT, we demonstrated that the UReQA framework for the rwTTD use case can be implemented to generate descriptive summary statistics and charts. These visualizations provide additional insights into the relevance and quality of 2 US EHR-based oncology RWD. The approach is generalizable to implement for other SACT and databases.</p>
        <p>Both data sets in the evaluation provided all the required data elements; however, verification checks revealed that Data set B might not be suitable for analyzing rwTTD for the target SACT because (1) the large decrease in patient receiving the target SACT in recent years suggests longer lags in incorporating the most recent data and (2) the completeness and plausibility issues in the SACT, LOT, and mortality data could cause faulty determination of treatment discontinuation date and status of censoring.</p>
        <p>The fact that Data set B included a lower percentage of patients receiving the target SACT (237/4003, 5.9% vs 1200/4808, 24.96% in Data set A) limited the utility of the data for determining the rwTTD. This finding highlights the need and importance of conducting a rigorous and use case–specific data quality assessment in the planning stage of RWD studies. In addition, for Data set B, findings of extremely low and high gaps between target SACT administration dates would warrant further investigation of each patient’s trajectory to verify the specific data quality issue before taking proper data quality improvement actions such as removing the patient or the SACT record as outliers.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study has several limitations that require further discussion. First, adequately assessing the reasons for missingness across different RWD sources is challenging. In particular, the data feeds and capture of elements across different data sources are variable. A lack of transparency and consistency means that different RWD sources are often not fully interoperable [<xref ref-type="bibr" rid="ref38">38</xref>]. In this study, we applied cohort attrition steps to align populations represented in the 2 data sets and imputed the LOT end date and LOT name that were missing in Data set B. However, a major remaining roadblock was the vendor’s privacy-preserving aggregation, which does not allow data sources to be adequately reviewed on more granular level to understand the reason behind missing data, data quality issues, or data discrepancies.</p>
        <p>Second, the implementation of data quality checks for new RWD sources, especially for those with data table structures that differ from those of prior data sets, requires customization and reconfiguration that are often time consuming. We are developing a data dashboard tool that can accelerate this process for both raw data and a common data model such as that of the Observational Health Data Sciences and Informatics [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>].</p>
        <p>Third, use case–specific data quality assessment checks often provide only a limited view of the comparative validity of the RWD under consideration, particularly when a well-recognized gold standard is absent. The paucity of data often limits an effective comparison with the distribution of key data elements in the general population (external validity). In this study, we set a priori metrics for these checks by using domain knowledge such as HNC prevalence [<xref ref-type="bibr" rid="ref33">33</xref>] and regulatory approval timelines. It would be interesting for future studies to validate and update these metrics.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>Prior studies have evaluated rwTTD, also known as the duration of therapy and real-world time on treatment, for immuno-oncology agents used in treating recurrent or metastatic HNC [<xref ref-type="bibr" rid="ref39">39</xref>], advanced non-small cell lung cancer [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref40">40</xref>-<xref ref-type="bibr" rid="ref42">42</xref>], and other solid cancers [<xref ref-type="bibr" rid="ref42">42</xref>]. In contrast to this study, these studies drew on research-ready databases (as would be identified in the preassessment step of UReQA [<xref ref-type="bibr" rid="ref3">3</xref>]), and the actions taken to ensure RWD fitness and quality were limited to aligning patient eligibility criteria (the cohort definition step of UReQA [<xref ref-type="bibr" rid="ref3">3</xref>]).</p>
        <p>New use cases can be created for other medication-related outcomes or therapeutic areas by following the first 3 steps of implementing the rwTTD use case in this study. In addition, the data quality checks that we identified and created for the rwTTD use case can be used for other types of use cases. For example, checks on medication identification and dates can also be used to evaluate the fitness of RWD sources for studying medication adherence. The checks on mortality and follow-up visits could validate the applicability of an RWD source for survival analyses.</p>
      </sec>
      <sec>
        <title>Future Work</title>
        <p>We selected 2 US EHR-based oncology databases to implement the UReQA use case of rwTTD. These were the only 2 databases the research team had access to that provided both oncology treatment and LOT information during the time of study execution. Each database may have its own bias in representing the overall advanced HNC population in the United States. Future work could implement (1) evaluation of more US EHR-based oncology databases to bring more impactful findings and (2) investigating the associations between rwTTD calculation and quantitative data quality assessment for various medications of interest and cancer types.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The fit-for-purpose quality assessment demonstrated the high level of variability in quality of the 2 real-world data sets for estimating the rwTTD of an SACT for advanced HNC. This study illustrates the application and value of use case–specific data assessment tasks in identifying high-quality RWD for research studies. The data quality specifications supporting this comprehensive use case can be expanded to other use cases in oncology outcomes research. Incorporating such comprehensive data quality assessment could help the study team select the most suitable database in the planning stage of a real-world evidence study. In addition, understanding data quality concerns particularly relevant to research questions can provide additional insights for properly preparing data in full study execution.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Data checks comprising 20 tasks assessing conformance, completeness, or plausibility.</p>
        <media xlink:href="medinform_v12i1e47744_app1.docx" xlink:title="DOCX File , 28 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">HNC</term>
          <def>
            <p>head and neck cancer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">ICD</term>
          <def>
            <p>International Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">LOT</term>
          <def>
            <p>line of therapy</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">Q3</term>
          <def>
            <p>third quarter</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">RWD</term>
          <def>
            <p>real-world data</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">rwTTD</term>
          <def>
            <p>real-world time to treatment discontinuation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SACT</term>
          <def>
            <p>systemic anticancer therapy</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">UReQA</term>
          <def>
            <p>Use Case Specific Relevance and Quality Assessment</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by Merck Sharp &#38; Dohme LLC, a subsidiary of Merck &#38; Co, Inc, Rahway, New Jersey, United States. Medical writing and editorial assistance were provided by Elizabeth V Hillyer, DVM (freelance). This assistance was funded by Merck Sharp &#38; Dohme LLC, a subsidiary of Merck &#38; Co, Inc, Rahway, New Jersey, United States.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data sets generated during and/or analyzed during this study are not publicly available as they were data vendors’ proprietary assets provided to the study team under commercial licenses but are available from the corresponding author on reasonable request and permission from the data vendor.</p>
        <p>In addition, we cannot disclose the identities of the data vendors, as doing so would inevitably promote the business of 1 data vendor and may violate data use agreements.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>BR, AS, KD, and SC conceptualized and designed the study. BR and AS contributed to data acquisition and data analysis. BR, AS, KD, SC, LY, and SK contributed to the interpretation of results. BR and AS drafted the manuscript. BR, AS, KD, SC, LY, and SK contributed to manuscript revision. All authors approved the publication of the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>BR, KD, and SK report employment with Merck Sharp &#38; Dohme LLC, a subsidiary of Merck &#38; Co, Inc, Rahway, NJ, United States, and stock ownership of Merck &#38; Co, Inc, Rahway, NJ, United States. AS reports employment with Real World Evidence, Epidemiology, Medical Affairs and Value Statistics (REM) Data Science department, Jazz Pharmaceutical. SC reports employment with ConcertAI. LY reports employment with and ownership of Polygon Health Analytics LLC. AS, SC, and LY were employees of Merck Sharp &#38; Dohme LLC, a subsidiary of Merck &#38; Co, Inc, Rahway, NJ, United States, when they worked on this study.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khozin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Blumenthal</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Pazdur</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Real-world data for clinical evidence generation in oncology</article-title>
          <source>J Natl Cancer Inst</source>
          <year>2017</year>
          <month>11</month>
          <day>01</day>
          <volume>109</volume>
          <issue>11</issue>
          <fpage>1</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1093/jnci/djx187</pub-id>
          <pub-id pub-id-type="medline">29059439</pub-id>
          <pub-id pub-id-type="pii">4157738</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miksad</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Samant</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Sarkar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Abernethy</surname>
              <given-names>AP</given-names>
            </name>
          </person-group>
          <article-title>Small but mighty: the use of real-world evidence to inform precision medicine</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2019</year>
          <month>07</month>
          <volume>106</volume>
          <issue>1</issue>
          <fpage>87</fpage>
          <lpage>90</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31112289"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cpt.1466</pub-id>
          <pub-id pub-id-type="medline">31112289</pub-id>
          <pub-id pub-id-type="pmcid">PMC6617709</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Chandwani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ru</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Reynolds</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Christian</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Estiri</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Fit-for-purpose real-world data assessments in oncology: a call for cross-stakeholder collaboration</article-title>
          <source>Value Outcomes Spotlight</source>
          <year>2021</year>
          <month>06</month>
          <volume>24</volume>
          <fpage>S25</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.valueinhealthjournal.com/article/S1098-3015(21)00346-6/fulltext"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jval.2021.04.129</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dagenais</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Madsen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Becnel</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Use of real-world evidence to drive drug development strategy and inform clinical trial design</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2022</year>
          <month>01</month>
          <volume>111</volume>
          <issue>1</issue>
          <fpage>77</fpage>
          <lpage>89</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34839524"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cpt.2480</pub-id>
          <pub-id pub-id-type="medline">34839524</pub-id>
          <pub-id pub-id-type="pmcid">PMC9299990</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lakdawalla</surname>
              <given-names>DN</given-names>
            </name>
            <name name-style="western">
              <surname>Shafrin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Peneva</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Vine</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brookmeyer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Figlin</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Predicting real-world effectiveness of cancer therapies using overall survival and progression-free survival from clinical trials: empirical evidence for the ASCO value framework</article-title>
          <source>Value Health</source>
          <year>2017</year>
          <volume>20</volume>
          <issue>7</issue>
          <fpage>866</fpage>
          <lpage>75</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1098-3015(17)30203-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jval.2017.04.003</pub-id>
          <pub-id pub-id-type="medline">28712615</pub-id>
          <pub-id pub-id-type="pii">S1098-3015(17)30203-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <article-title>Framework for FDA's real-world evidence program</article-title>
          <source>U.S. Food &#38; Drug Administration (FDA)</source>
          <year>2018</year>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/media/120060/download">https://www.fda.gov/media/120060/download</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <article-title>Real-world data: assessing electronic health records and medical claims data to support regulatory decision-making for drug and biological products</article-title>
          <source>U.S. Department of Health and Human Services</source>
          <year>2021</year>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/media/152503/download">https://www.fda.gov/media/152503/download</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <article-title>Submitting documents using real-world data and real-world evidence to FDA for drug and biological products: guidance for industry</article-title>
          <source>U.S. Food &#38; Drug Administration (FDA)</source>
          <year>2022</year>
          <month>09</month>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.regulations.gov/document/FDA-2019-D-1263-0014">https://www.regulations.gov/document/FDA-2019-D-1263-0014</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <article-title>Snapshot: healthcare data ecosystem (2023)</article-title>
          <source>DATAVANT</source>
          <access-date>2023-10-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://datavant.com/health-data-ecosystem/">https://datavant.com/health-data-ecosystem/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Methods and dimensions of electronic health record data quality assessment: enabling reuse for clinical research</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <month>01</month>
          <day>01</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>144</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22733976"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000681</pub-id>
          <pub-id pub-id-type="medline">22733976</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000681</pub-id>
          <pub-id pub-id-type="pmcid">PMC3555312</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="web">
          <article-title>Assessing data quality for healthcare systems data used in clinical research</article-title>
          <source>NIH Pragmatic Trials Collaboratory</source>
          <year>2014</year>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dcricollab.dcri.duke.edu/sites/NIHKR/KR/Assessing-data-quality_V1%200.pdf">https://dcricollab.dcri.duke.edu/sites/NIHKR/KR/Assessing-data-quality_V1%200.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Franklin</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Liaw</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Iyasu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Critchlow</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Dreyer</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Real-world evidence to support regulatory decision making: new or expanded medical product indications</article-title>
          <source>Pharmacoepidemiol Drug Saf</source>
          <year>2021</year>
          <month>06</month>
          <volume>30</volume>
          <issue>6</issue>
          <fpage>685</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1002/pds.5222</pub-id>
          <pub-id pub-id-type="medline">33675248</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Callahan</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Barnard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bauck</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Davidson</surname>
              <given-names>BN</given-names>
            </name>
            <name name-style="western">
              <surname>Estiri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Goerg</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Holve</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Liaw</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hamilton-Lopez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meeker</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zozus</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Schilling</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A harmonized data quality assessment terminology and framework for the secondary use of electronic health record data</article-title>
          <source>EGEMS (Wash DC)</source>
          <year>2016</year>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>1244</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27713905"/>
          </comment>
          <pub-id pub-id-type="doi">10.13063/2327-9214.1244</pub-id>
          <pub-id pub-id-type="medline">27713905</pub-id>
          <pub-id pub-id-type="pii">egems1244</pub-id>
          <pub-id pub-id-type="pmcid">PMC5051581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mahendraratnam</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Silcox</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mercon</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kroetsch</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Romine</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Harrison</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Aten</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sherman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Daniel</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>McClellan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Determining real-world data?s fitness for use and the role of reliability: Duke-Margolis Center for Health Policy</article-title>
          <source>Duke Margolis Center for Health Policy</source>
          <year>2019</year>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://healthpolicy.duke.edu/publications/determining-real-world-datas-fitness-use-and-role-reliability">https://healthpolicy.duke.edu/publications/determining-real-world-datas-fitness-use-and-role-reliability</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Callahan</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bauck</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Bertoch</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Khare</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Staab</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zozus</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>MG</given-names>
            </name>
          </person-group>
          <article-title>A comparison of data quality assessment checks in six data sharing networks</article-title>
          <source>EGEMS (Wash DC)</source>
          <year>2017</year>
          <month>06</month>
          <day>12</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>8</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29881733"/>
          </comment>
          <pub-id pub-id-type="doi">10.5334/egems.223</pub-id>
          <pub-id pub-id-type="medline">29881733</pub-id>
          <pub-id pub-id-type="pmcid">PMC5982846</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reynolds</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Bourke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dreyer</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Considerations when evaluating real-world data quality in the context of fitness for purpose</article-title>
          <source>Pharmacoepidemiol Drug Saf</source>
          <year>2020</year>
          <month>10</month>
          <volume>29</volume>
          <issue>10</issue>
          <fpage>1316</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32374042"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/pds.5010</pub-id>
          <pub-id pub-id-type="medline">32374042</pub-id>
          <pub-id pub-id-type="pmcid">PMC7687257</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <article-title>OHDSI: data quality dashboard</article-title>
          <source>GitHub</source>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/OHDSI/DataQualityDashboard">https://github.com/OHDSI/DataQualityDashboard</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <article-title>Home page</article-title>
          <source>Observational Health Data Sciences and Informatics (OHDSI)</source>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ohdsi.org/">https://www.ohdsi.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <article-title>PEDSnet/data quality analysis</article-title>
          <source>GitHub</source>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/PEDSnet/Data-Quality-Analysis/blob/master/Data/DQACatalog/DQA_Check_Type_Inventory.csv">https://github.com/PEDSnet/Data-Quality-Analysis/blob/master/Data/DQACatalog/DQA_Check_Type_Inventory.csv</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <article-title>Home page</article-title>
          <source>The National Patient-Centered Clinical Research Network (PCORnet)</source>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pcornet.org/">https://pcornet.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
          <article-title>DQUEEN v 0.5 (data QUality assEssmENt and managing tool)</article-title>
          <source>GitHub</source>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/ABMI/DQUEEN_OMOP_CDM_Version">https://github.com/ABMI/DQUEEN_OMOP_CDM_Version</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Estiri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Klann</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
          </person-group>
          <article-title>A clustering approach for detecting implausible observation values in electronic health records data</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2019</year>
          <month>07</month>
          <day>23</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>142</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-019-0852-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-019-0852-6</pub-id>
          <pub-id pub-id-type="medline">31337390</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-019-0852-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC6652024</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Estiri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
          </person-group>
          <article-title>Semi-supervised encoding for outlier detection in clinical observation data</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2019</year>
          <month>11</month>
          <volume>181</volume>
          <fpage>104830</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30658851"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2019.01.002</pub-id>
          <pub-id pub-id-type="medline">30658851</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(18)30757-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC10111961</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Estiri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Klann</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Weiler</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Alema-Mensah</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Joseph Applegate</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lozinski</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Patibandla</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Natter</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Ofili</surname>
              <given-names>EO</given-names>
            </name>
            <name name-style="western">
              <surname>Ostasiewski</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Quarshie</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenthal</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstam</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Mandl</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
          </person-group>
          <article-title>A federated EHR network data completeness tracking system</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>07</month>
          <day>01</day>
          <volume>26</volume>
          <issue>7</issue>
          <fpage>637</fpage>
          <lpage>45</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30925587"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz014</pub-id>
          <pub-id pub-id-type="medline">30925587</pub-id>
          <pub-id pub-id-type="pii">5423491</pub-id>
          <pub-id pub-id-type="pmcid">PMC6586954</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huser</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Facilitating analysis of measurements data though stricter model conventions: exploring units variability across sites</article-title>
          <source>Observational Health Data Sciences and Informatics</source>
          <year>2017</year>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ohdsi.org/web/wiki/lib/exe/fetch.php?media=resources:huser-2017-ohdsi-symp-units.pdf">https://www.ohdsi.org/web/wiki/lib/exe/fetch.php?media=resources:huser-2017-ohdsi-symp-units.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blumenthal</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kehl</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra-Kalyani</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Khozin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kluetz</surname>
              <given-names>PG</given-names>
            </name>
            <name name-style="western">
              <surname>Oxnard</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Pazdur</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Analysis of time-to-treatment discontinuation of targeted therapy, immunotherapy, and chemotherapy in clinical trials of patients with non-small-cell lung cancer</article-title>
          <source>Ann Oncol</source>
          <year>2019</year>
          <month>05</month>
          <day>01</day>
          <volume>30</volume>
          <issue>5</issue>
          <fpage>830</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0923-7534(19)31160-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/annonc/mdz060</pub-id>
          <pub-id pub-id-type="medline">30796424</pub-id>
          <pub-id pub-id-type="pii">S0923-7534(19)31160-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <article-title>Establishing a framework to evaluate real-world endpoints</article-title>
          <source>Friends of Cancer Research</source>
          <year>2018</year>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://friendsofcancerresearch.org/wp-content/uploads/RWE_FINAL-7.6.18_1.pdf">https://friendsofcancerresearch.org/wp-content/uploads/RWE_FINAL-7.6.18_1.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Norden</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Dreyer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Henk</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Abernethy</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Chrischilles</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kushi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mansfield</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Khozin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sharon</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Arunajadai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Carnahan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Christian</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Miksad</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Sakoda</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Torres</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>Valice</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>An exploratory analysis of real-world end points for assessing outcomes among immunotherapy-treated patients with advanced non-small-cell lung cancer</article-title>
          <source>JCO Clin Cancer Inform</source>
          <year>2019</year>
          <month>07</month>
          <volume>3</volume>
          <fpage>1</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ascopubs.org/doi/10.1200/CCI.18.00155?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1200/CCI.18.00155</pub-id>
          <pub-id pub-id-type="medline">31335166</pub-id>
          <pub-id pub-id-type="pmcid">PMC6873914</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ou</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chandwani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Black</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Temporal phenotyping by mining healthcare data to derive lines of therapy for cancer</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <month>12</month>
          <volume>100</volume>
          <fpage>103335</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30254-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103335</pub-id>
          <pub-id pub-id-type="medline">31689549</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30254-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Mosesso</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Lane</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Griffith</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ou</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Dexter</surname>
              <given-names>PR</given-names>
            </name>
          </person-group>
          <article-title>An automated line-of-therapy algorithm for adults with metastatic non-small cell lung cancer: validation study using blinded manual chart review</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>10</month>
          <day>12</day>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>e29017</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/10/e29017/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/29017</pub-id>
          <pub-id pub-id-type="medline">34636730</pub-id>
          <pub-id pub-id-type="pii">v9i10e29017</pub-id>
          <pub-id pub-id-type="pmcid">PMC8548977</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
          <article-title>RxNorm</article-title>
          <source>NIH National Library of Medicine</source>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nlm.nih.gov/research/umls/rxnorm/index.html">https://www.nlm.nih.gov/research/umls/rxnorm/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <article-title>RxNav-in-a-box</article-title>
          <source>NIH National Library of Medicine</source>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://lhncbc.nlm.nih.gov/RxNav/applications/RxNav-in-a-Box.html">https://lhncbc.nlm.nih.gov/RxNav/applications/RxNav-in-a-Box.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <article-title>Cancer stat facts: oral cavity and pharynx cancer</article-title>
          <source>National Cancer Institute: Surveillance, Epidemiology, and End Results Program (SEER)</source>
          <year>2022</year>
          <access-date>2023-03-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://seer.cancer.gov/statfacts/html/oralcav.html">https://seer.cancer.gov/statfacts/html/oralcav.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nadler</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Joo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Black-Shinn</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chirovsky</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Treatment patterns and outcomes among patients with recurrent/metastatic squamous cell carcinoma of the head and neck</article-title>
          <source>Future Oncol</source>
          <year>2019</year>
          <month>03</month>
          <volume>15</volume>
          <issue>7</issue>
          <fpage>739</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="doi">10.2217/fon-2018-0572</pub-id>
          <pub-id pub-id-type="medline">30511880</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grünwald</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chirovsky</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>WY</given-names>
            </name>
            <name name-style="western">
              <surname>Bertolini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Castro</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Berrocal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sjoquist</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kuyas</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Auclair</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Guillaume</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Joo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Harrington</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Global treatment patterns and outcomes among patients with recurrent and/or metastatic head and neck squamous cell carcinoma: results of the GLANCE H and N study</article-title>
          <source>Oral Oncol</source>
          <year>2020</year>
          <month>03</month>
          <volume>102</volume>
          <fpage>104526</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1368-8375(19)30436-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.oraloncology.2019.104526</pub-id>
          <pub-id pub-id-type="medline">31978755</pub-id>
          <pub-id pub-id-type="pii">S1368-8375(19)30436-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mody</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Rocco</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Yom</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Haddad</surname>
              <given-names>RI</given-names>
            </name>
            <name name-style="western">
              <surname>Saba</surname>
              <given-names>NF</given-names>
            </name>
          </person-group>
          <article-title>Head and neck cancer</article-title>
          <source>Lancet</source>
          <year>2021</year>
          <month>12</month>
          <day>18</day>
          <volume>398</volume>
          <issue>10318</issue>
          <fpage>2289</fpage>
          <lpage>99</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(21)01550-6</pub-id>
          <pub-id pub-id-type="medline">34562395</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(21)01550-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mourad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jetmore</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Jategaonkar</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Moubayed</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moshier</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Urken</surname>
              <given-names>ML</given-names>
            </name>
          </person-group>
          <article-title>Epidemiological trends of head and neck cancer in the united states: a SEER population study</article-title>
          <source>J Oral Maxillofac Surg</source>
          <year>2017</year>
          <month>12</month>
          <volume>75</volume>
          <issue>12</issue>
          <fpage>2562</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28618252"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.joms.2017.05.008</pub-id>
          <pub-id pub-id-type="medline">28618252</pub-id>
          <pub-id pub-id-type="pii">S0278-2391(17)30537-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC6053274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Penberthy</surname>
              <given-names>LT</given-names>
            </name>
            <name name-style="western">
              <surname>Rivera</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Lund</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Bruno</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>An overview of real-world data sources for oncology and considerations for research</article-title>
          <source>CA Cancer J Clin</source>
          <year>2022</year>
          <month>05</month>
          <volume>72</volume>
          <issue>3</issue>
          <fpage>287</fpage>
          <lpage>300</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/doi/10.3322/caac.21714"/>
          </comment>
          <pub-id pub-id-type="doi">10.3322/caac.21714</pub-id>
          <pub-id pub-id-type="medline">34964981</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ramakrishnan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Baxi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chandwani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Joo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chirovsky</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Real-world time on treatment with immuno-oncology therapy in recurrent/metastatic head and neck squamous cell carcinoma</article-title>
          <source>Future Oncol</source>
          <year>2021</year>
          <month>08</month>
          <volume>17</volume>
          <issue>23</issue>
          <fpage>3037</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.futuremedicine.com/doi/abs/10.2217/fon-2021-0360?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.2217/fon-2021-0360</pub-id>
          <pub-id pub-id-type="medline">34044594</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Waterhouse</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Betts</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hartman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lubinga</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stenehjem</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Real-world outcomes of immunotherapy-based regimens in first-line advanced non-small cell lung cancer</article-title>
          <source>Lung Cancer</source>
          <year>2021</year>
          <month>06</month>
          <volume>156</volume>
          <fpage>41</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0169-5002(21)00135-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.lungcan.2021.04.007</pub-id>
          <pub-id pub-id-type="medline">33894493</pub-id>
          <pub-id pub-id-type="pii">S0169-5002(21)00135-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Horvat</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Lambova</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Christian</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Lasiter</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Reich</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Comparing findings from a friends of cancer research exploratory analysis of real-world end points with the cancer analysis system in England</article-title>
          <source>JCO Clin Cancer Inform</source>
          <year>2021</year>
          <month>12</month>
          <volume>5</volume>
          <fpage>1155</fpage>
          <lpage>68</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ascopubs.org/doi/10.1200/CCI.21.00013?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1200/CCI.21.00013</pub-id>
          <pub-id pub-id-type="medline">34860576</pub-id>
          <pub-id pub-id-type="pmcid">PMC8763340</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Torres</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>Nussbaum</surname>
              <given-names>NC</given-names>
            </name>
            <name name-style="western">
              <surname>Parrinello</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Bourla</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Bowser</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tabano</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>George</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Miksad</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Analysis of a real-world progression variable and related endpoints for patients with five different cancer types</article-title>
          <source>Adv Ther</source>
          <year>2022</year>
          <month>06</month>
          <volume>39</volume>
          <issue>6</issue>
          <fpage>2831</fpage>
          <lpage>49</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35430670"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12325-022-02091-8</pub-id>
          <pub-id pub-id-type="medline">35430670</pub-id>
          <pub-id pub-id-type="pii">10.1007/s12325-022-02091-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC9123022</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
