<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e64705</article-id><article-id pub-id-type="doi">10.2196/64705</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Assessing Total Hip Arthroplasty Outcomes and Generating an Orthopedic Research Outcome Database via a Natural Language Processing Pipeline: Development and Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Mast</surname><given-names>Nicholas H</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Oeste</surname><given-names>Clara L.</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Hens</surname><given-names>Dries</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Hip and Pelvis Institute</institution><addr-line>2250 Hayes St # 208</addr-line><addr-line>San Francisco</addr-line><addr-line>CA</addr-line><country>United States</country></aff><aff id="aff2"><institution>LynxCare Inc</institution><addr-line>Leuven</addr-line><country>Belgium</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Lovis</surname><given-names>Christian</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Chaturvedi</surname><given-names>Akhil</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Senst</surname><given-names>Benjamin</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Chinthala</surname><given-names>Lokesh</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Nicholas H Mast, MD, Hip and Pelvis Institute, 2250 Hayes St # 208, San Francisco, CA, 94117, United States, 1 415-530-5330; <email>doctormast@sfhips.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>12</day><month>3</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e64705</elocation-id><history><date date-type="received"><day>24</day><month>07</month><year>2024</year></date><date date-type="rev-recd"><day>30</day><month>01</month><year>2025</year></date><date date-type="accepted"><day>16</day><month>02</month><year>2025</year></date></history><copyright-statement>&#x00A9; Nicholas H Mast, Clara L Oeste, Dries Hens. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 12.3.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e64705"/><abstract><sec><title>Background</title><p>Processing data from electronic health records (EHRs) to build research-grade databases is a lengthy and expensive process. Modern arthroplasty practice commonly uses multiple sites of care, including clinics and ambulatory care centers. However, most private data systems prevent obtaining usable insights for clinical practice.</p></sec><sec><title>Objective</title><p>This study aims to create an automated natural language processing (NLP) pipeline for extracting clinical concepts from EHRs related to orthopedic outpatient visits, hospitalizations, and surgeries in a multicenter, single-surgeon practice. The pipeline was also used to assess therapies and complications after total hip arthroplasty (THA).</p></sec><sec sec-type="methods"><title>Methods</title><p>EHRs of 1290 patients undergoing primary THA from January 1, 2012 to December 31, 2019 (operated and followed by the same surgeon) were processed using artificial intelligence (AI)&#x2013;based models (NLP and machine learning). In addition, 3 independent medical reviewers generated a gold standard using 100 randomly selected EHRs. The algorithm processed the entire database from different EHR systems, generating an aggregated clinical data warehouse. An additional manual control arm was used for data quality control.</p></sec><sec sec-type="results"><title>Results</title><p>The algorithm was as accurate as human reviewers (0.95 vs 0.94; <italic>P=</italic>.01), achieving a database-wide average <italic>F</italic><sub>1</sub>-score of 0.92 (SD 0.09; range 0.67&#x2010;0.99), validating its use as an automated data extraction tool. During the first year after direct anterior THA, 92.1% (1188/1290) of our population had a complication-free recovery. In 7.9% (102/1290) of cases where surgery or recovery was not uneventful, lateral femoral cutaneous nerve sensitivity (47/1290, 3.6%), intraoperative fractures (13/1290, 1%), and hematoma (9/1290, 0.7%) were the most common complications.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Algorithm evaluation of this dataset accurately represented key clinical information swiftly, compared with human reviewers. This technology may provide substantial value for future surgeon practice and patient counseling. Furthermore, the low early complication rate of direct anterior THA in this surgeon&#x2019;s hands was supported by the dataset, which included data from all treated patients in a multicenter practice.</p></sec></abstract><kwd-group><kwd>total hip arthroplasty</kwd><kwd>THA</kwd><kwd>direct anterior approach</kwd><kwd>electronic health records</kwd><kwd>EHR</kwd><kwd>natural language processing</kwd><kwd>NLP</kwd><kwd>complication rate</kwd><kwd>single-surgeon registry</kwd><kwd>hip arthroplasty</kwd><kwd>orthopedic</kwd><kwd>validation</kwd><kwd>surgeon</kwd><kwd>outpatient visits</kwd><kwd>hospitalizations</kwd><kwd>surgery</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Total hip arthroplasty (THA) is one of the most effective orthopedic procedures [<xref ref-type="bibr" rid="ref1">1</xref>]. The number of THAs is projected to rise, along with its impact on health care resources [<xref ref-type="bibr" rid="ref2">2</xref>]. However, more government funding requires efficient quality control and accountability. Quality monitoring is expected to have a bigger impact on orthopedic practices and on medicine as a whole in the near future. Unfortunately, many surgeons working in nonacademic settings frequently lack the resources and financing needed to properly evaluate the quality of patient care they provide. The broad adoption of electronic health records (EHRs) simplifies access to vast amounts of medical data and facilitates data analysis.</p><p>Despite how inefficient and time-consuming manual review is, it remains the gold standard for reviewing medical information. Research has shown that systematic reporting of postoperative orthopedic surgical adverse events is infrequent [<xref ref-type="bibr" rid="ref3">3</xref>], despite the low complication rates associated with THA. Monitoring the standard of care after THA is still challenging, since evaluating sufficient records in a timely manner is a complex task. Using natural language processing (NLP) technology, we developed a system that can extract relevant postoperative problems from unstructured EHR data [<xref ref-type="bibr" rid="ref4">4</xref>]. We questioned whether such an AI-supported approach might be used to provide precise, continuing feedback on the quality of care provided after THA in a high-volume, nonacademic clinical setting. We assumed that a computer algorithm would perform at least as well as a human reviewer, which is considered the industry standard.</p><p>The primary goal of this study was, therefore, to design and develop an automated NLP pipeline for extracting clinical concepts from reports on outpatients, hospitalizations, and surgeries from a single surgeon, multicenter practice. Using the pipeline, the secondary goal was to examine and evaluate therapies and complications following THA.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethical Considerations</title><p>Patients were invited to participate in the research on the direct anterior approach (DAA) of hip replacement. Informed consent for the use of patient data in this retrospective study was obtained as part of the institutional review board (IRB) protocol (WCG IRB Protocol 20225993). Patients undergoing surgery were provided with a consent form at the time of intake, which was signed before the procedure. Patients who continued to be followed up subsequently signed consent forms that were applicable retrospectively. Data were anonymized before analysis.</p></sec><sec id="s2-2"><title>Patient Selection</title><p>Data from 1290 patients undergoing 1304 primary DAA THAs using a Hana Orthopedic Surgery Table (Mizuho OSI), with the same surgical team and implants. Data was collected from January 1, 2012 to December 31, 2019, and analyzed retrospectively. Exclusion criteria included age under 18 years, failure to provide informed consent, and revision surgery.</p></sec><sec id="s2-3"><title>Follow-Up Schedule</title><p>Patients were followed preoperatively and postoperatively at 2 weeks, 6 weeks, 3 months (on a per-case basis), and 1 year. The algorithm screened EHRs for key sentences, words, and clinical definitions that were compiled by the surgical team.</p></sec><sec id="s2-4"><title>Adverse Event Classification</title><p>A list of 19 complications based on the study of the Hip Society THA Complications Workgroup was compiled [<xref ref-type="bibr" rid="ref5">5</xref>]. A separate category was added for lower back pain, sciatica, or both. Treatment was categorized as either conservative or interventional.</p></sec><sec id="s2-5"><title>EHR Data Structure and Documentation Variability</title><p>The study used EHR systems that capture all patient interactions across the health system. Documentation varied by note type: operative reports were dictated using a standardized format, with intraoperative complications documented in a dedicated subsection. Radiographic reports, however, were dictated by multiple radiologists without a uniform structure. Complications were often identifiable through multiple associated notes across different document types. Implant records were dictated directly from intraoperative purchasing logs, ensuring high reliability. The NLP algorithm flagged typographical errors in dictated notes that human reviewers overlooked.</p></sec><sec id="s2-6"><title>Gold Standard Adjudication Process</title><p>To ensure consistency in the gold standard corpus used for training the algorithm, all discrepancies among reviewers were resolved through senior adjudication. When ambiguities were identified in a case, they were escalated to the senior author, who conducted a thorough review of the full case file. Final determinations were made based on clinical expertise and consensus, ensuring a standardized and reliable reference dataset.</p></sec><sec id="s2-7"><title>NLP Pipeline Development and Validation</title><p>The NLP pipeline was developed and validated in 3 phases, as described by Van de Meulebroucke et al [<xref ref-type="bibr" rid="ref4">4</xref>]. First, a training set of 50 EHRs was annotated to generate relevant input, since a sample size of 50 EHRs was previously found sufficient to achieve accuracy over 90% [<xref ref-type="bibr" rid="ref4">4</xref>]. Second, an independent gold standard was generated through manual review by 3 independent surgeons of a derivation cohort of 100 EHRs. Third, the entire dataset of 1290 patients was manually reviewed to calculate the algorithm&#x2019;s recall, precision, and <italic>F</italic><sub>1</sub>-score. Patient records were analyzed using standard procedures of each center&#x2019;s EHR system by a manual reviewer.</p><p>The pipeline uses a text mining engine based on machine learning and NLP to extract important concepts from EHRs. The NLP pipeline incorporates several preprocessing steps, including language detection, sentence segmentation, and tokenization, to prepare unstructured EHR text for analysis. The core architecture is based on a deep learning model fine-tuned on large-scale clinical datasets and adapted for domain-specific tasks in orthopedics. Named entity recognition identifies relevant medical concepts, relation extraction determines associations between entities, and attribute extraction captures features such as negations and temporal qualifiers. Processed outputs were mapped to Unified Medical Language System (UMLS) Concept Unique Identifiers (CUIs), which includes standard terminologies like the Systematized Nomenclature of Medicine-Clinical Terms (SNOMED-CT). Mapping was performed by a probabilistic entity-linking algorithm that integrates semantic ranking and term preferences, ensuring precise and standardized representation. In addition, the processed data were standardized using the Observational Medical Outcomes Partnership Common Data Model, which harmonizes structured and unstructured data from different EHR systems into a unified format. This approach enables the efficient processing of unstructured clinical text and supports the accurate extraction and mapping of clinical concepts.</p><p>Complications and their respective treatment, along with other clinical features, were collected into a database and standardized using UMLS CUIs. The NLP tool mined variables from the full set of source data within EHRs, including, but not limited to, clinical notes, primary care records, radiology reports, laboratory results, discharge summaries, and surgical documentation. The full list of study variables is shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. To assess accuracy, a scoring system was established such that one point was given to each correct clinical concept, extracted by the algorithm or the human reviewer (<xref ref-type="fig" rid="figure1">Figure 1</xref>). Correct clinical concepts referred to those matching the gold standard. Precision, recall, and <italic>F</italic><sub>1</sub>-score were used as statistical parameters to reflect the performance of the algorithm, as calculated with R (R Foundation for Statistical Computing) statistical programming (<xref ref-type="table" rid="table1">Table 1</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Scoring system flowchart for concept identification by human versus algorithm.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e64705_fig01.png"/></fig><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Statistical parameters for algorithm performance.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Definition</td><td align="left" valign="bottom">Calculation</td></tr></thead><tbody><tr><td align="left" valign="top">Accuracy</td><td align="left" valign="top">Percentage (%) of relevant concepts extracted by method A/B.</td><td align="left" valign="top">Number of concepts&#x00F7;total number of concepts expected to be extracted</td></tr><tr><td align="left" valign="top">Recall or sensitivity</td><td align="left" valign="top">Ratio between all identified concepts and all existing concepts in a given text (0&#x2010;1).</td><td align="left" valign="top">True positives&#x00F7;(true positives+false negatives)</td></tr><tr><td align="left" valign="top">Precision</td><td align="left" valign="top">Ratio between all adequately identified concepts and all identified concepts (0&#x2010;1).</td><td align="left" valign="top">True positives&#x00F7;(true positives+false positives)</td></tr><tr><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">Harmonic mean of recall and precision (0&#x2010;1).</td><td align="left" valign="top">2&#x00D7;(recall&#x00D7;precision)&#x00F7;(recall+precision)</td></tr></tbody></table></table-wrap></sec><sec id="s2-8"><title>Statistical Analysis</title><p>For categorical values, the number of patients (n) and relative proportions (%) are shown.</p><p>Checks for accuracy, recall, and precision involved measuring model outcomes against a gold standard created by human annotators. The <italic>F</italic><sub>1</sub>-score assesses the trade-off between precision and recall by calculating their harmonic mean (<xref ref-type="table" rid="table1">Table 1</xref>).</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Performance of the NLP Pipeline</title><p><xref ref-type="table" rid="table2">Table 2</xref> compares the accuracy of human reviewers to an algorithm on various aspects of 100 patient records. Overall, the algorithm was slightly more accurate than human reviewers, with an accuracy of 0.952 compared with 0.945 for human reviewers, a difference of 0.007 (<italic>P=</italic>.01). The most notable differences in accuracy between the algorithm and human reviewers were on the variables of weight (0.24 difference in accuracy), revision (0.06 difference), and offset (0.02 difference), all of which were detected more accurately by the algorithm. The algorithm was less accurate on variables such as cup size, prosthetic loosening, and heterotopic ossification grade, though with small differences in accuracy ranging from &#x2212;0.06 to 0.04.</p><p>In order to further assess the quality of data extracted by the algorithm, we calculated statistical parameters such as recall, precision, and <italic>F</italic><sub>1</sub>-score of the different variables detected in the study, as defined in <xref ref-type="table" rid="table1">Table 1</xref>. The results shown in <xref ref-type="table" rid="table3">Table 3</xref> reflect that for most variables, the recall and <italic>F</italic><sub>1</sub>-score are high, indicating that the model is able to correctly identify the presence of the clinical variables in the data. The average values for all the variables show an overall high performance of the model.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Human versus algorithm accuracy on a randomly selected group of 100 patients.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Human reviewer accuracy</td><td align="left" valign="bottom">Algorithm accuracy</td><td align="left" valign="bottom">Delta</td></tr></thead><tbody><tr><td align="left" valign="top">Antibiotics</td><td align="left" valign="top">1</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Blood loss</td><td align="left" valign="top">1</td><td align="left" valign="top">0.98</td><td align="left" valign="top">&#x2212;0.02</td></tr><tr><td align="left" valign="top">Cup size</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0.92</td><td align="left" valign="top">&#x2212;0.06</td></tr><tr><td align="left" valign="top">Date of procedure</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Dislocation</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.94</td><td align="left" valign="top">&#x2212;0.02</td></tr><tr><td align="left" valign="top">Fracture</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0.96</td><td align="left" valign="top">&#x2212;0.02</td></tr><tr><td align="left" valign="top">Heterotopic ossification grade</td><td align="left" valign="top">0.9</td><td align="left" valign="top">0.92</td><td align="left" valign="top">0.02</td></tr><tr><td align="left" valign="top">Offset</td><td align="left" valign="top">1</td><td align="left" valign="top">0.98</td><td align="left" valign="top">&#x2212;0.02</td></tr><tr><td align="left" valign="top">Pain killer</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Primary arthrosis</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Prosthesis manufacturer</td><td align="left" valign="top">0.94</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.02</td></tr><tr><td align="left" valign="top">Prosthetic loosening</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.92</td><td align="left" valign="top">&#x2212;0.04</td></tr><tr><td align="left" valign="top">Psoas tendinopathy</td><td align="left" valign="top">1</td><td align="left" valign="top">0.96</td><td align="left" valign="top">&#x2212;0.04</td></tr><tr><td align="left" valign="top">Range of motion</td><td align="left" valign="top">0.86</td><td align="left" valign="top">0.88</td><td align="left" valign="top">0.02</td></tr><tr><td align="left" valign="top">Revision</td><td align="left" valign="top">0.9</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.06</td></tr><tr><td align="left" valign="top">Steel type</td><td align="left" valign="top">0.9</td><td align="left" valign="top">0.92</td><td align="left" valign="top">0.02</td></tr><tr><td align="left" valign="top">Surgery duration</td><td align="left" valign="top">1</td><td align="left" valign="top">0.98</td><td align="left" valign="top">&#x2212;0.02</td></tr><tr><td align="left" valign="top">Thromboembolism</td><td align="left" valign="top">1</td><td align="left" valign="top">0.98</td><td align="left" valign="top">&#x2212;0.02</td></tr><tr><td align="left" valign="top">Weight</td><td align="left" valign="top">0.64</td><td align="left" valign="top">0.88</td><td align="left" valign="top">0.24</td></tr><tr><td align="left" valign="top">Wound infection</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0.02</td></tr><tr><td align="left" valign="top">Total</td><td align="left" valign="top">0.945</td><td align="left" valign="top">0.952</td><td align="left" valign="top">0.007</td></tr></tbody></table></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Recall, precision, and <italic>F</italic><sub>1</sub>-scores for entire dataset of 1290 cases across all data points.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Recall</td><td align="left" valign="bottom">Precision</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td></tr></thead><tbody><tr><td align="left" valign="top">Superficial wound infection</td><td align="left" valign="top">1</td><td align="left" valign="top">0.88</td><td align="left" valign="top">0.94</td></tr><tr><td align="left" valign="top">Heterotopic ossification</td><td align="left" valign="top">0.92</td><td align="left" valign="top">0.95</td><td align="left" valign="top">0.93</td></tr><tr><td align="left" valign="top">Lower back pain</td><td align="left" valign="top">1</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0.99</td></tr><tr><td align="left" valign="top">Peri-prosthetic Infection</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0.95</td><td align="left" valign="top">0.96</td></tr><tr><td align="left" valign="top">Wound infection</td><td align="left" valign="top">0.95</td><td align="left" valign="top">0.82</td><td align="left" valign="top">0.88</td></tr><tr><td align="left" valign="top">Dislocation</td><td align="left" valign="top">1</td><td align="left" valign="top">0.99</td><td align="left" valign="top">0.99</td></tr><tr><td align="left" valign="top">Revision</td><td align="left" valign="top">1</td><td align="left" valign="top">0.97</td><td align="left" valign="top">0.98</td></tr><tr><td align="left" valign="top">Intra-operative fracture</td><td align="left" valign="top">1</td><td align="left" valign="top">0.99</td><td align="left" valign="top">0.99</td></tr><tr><td align="left" valign="top">Post-operative fracture</td><td align="left" valign="top">1</td><td align="left" valign="top">0.89</td><td align="left" valign="top">0.94</td></tr><tr><td align="left" valign="top">Bleeding</td><td align="left" valign="top">0.95</td><td align="left" valign="top">0.65</td><td align="left" valign="top">0.77</td></tr><tr><td align="left" valign="top">Prosthetic loosening</td><td align="left" valign="top">1</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0.99</td></tr><tr><td align="left" valign="top">Pain</td><td align="left" valign="top">0.97</td><td align="left" valign="top">0.88</td><td align="left" valign="top">0.92</td></tr><tr><td align="left" valign="top">Nerve injury</td><td align="left" valign="top">0.89</td><td align="left" valign="top">0.92</td><td align="left" valign="top">0.90</td></tr><tr><td align="left" valign="top">Psoas burden</td><td align="left" valign="top">0.99</td><td align="left" valign="top">0.99</td><td align="left" valign="top">0.99</td></tr><tr><td align="left" valign="top">Sciatica</td><td align="left" valign="top">0.75</td><td align="left" valign="top">0.88</td><td align="left" valign="top">0.81</td></tr><tr><td align="left" valign="top">Vascular systems injury</td><td align="left" valign="top">1</td><td align="left" valign="top">0.5</td><td align="left" valign="top">0.67</td></tr><tr><td align="left" valign="top">Average</td><td align="left" valign="top">0.96</td><td align="left" valign="top">0.89</td><td align="left" valign="top">0.92</td></tr></tbody></table></table-wrap></sec><sec id="s3-2"><title>Complications and Interventions of DAA THA</title><p>The mean age of the patients included in the dataset was 63.5 (SD 9.6) years and 57.4% (740/1290) were women. The complications during the first year after direct anterior THA in these patients are shown in <xref ref-type="table" rid="table4">Table 4</xref>, as well as the conservative or interventional treatment of these clinical outcomes.</p><p>Soft tissue complications were the most common type of complication observed in patients undergoing THA. The most common type of soft tissue complication was sensory deficit (47/1290, 3.6%), followed by hematoma (9/1290, 0.7%) and superficial wound infection (3/1290, 0.2%). No incidents of bleeding, prolonged wound drainage, motor nerve deficit, vascular injury, or sciatica were reported. Regarding mechanical complications, periprosthetic fractures occurred in 1.4% of cases (18/1290; 13 intraoperatively and 5 postoperatively), and instability occurred in 0.5% (7/1290) of cases. Implant fracture, cup-liner dislocation and osteolysis were not reported.</p><p><xref ref-type="table" rid="table5">Table 5</xref> shows interventions in the 1-year postoperative period. The most common interventions were intraoperative (cerclage and wiring), which account for 1% (n=13) of cases. Readmission was detected in 0.9% (n=12) of patients. Other interventions such as aspiration, wound debridement, closed reduction, osteosynthesis or cerclage, and revision, each account for less than 1% of cases.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Complications in the 1-year postoperative period (n=1290).</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Complication subgroup</td><td align="left" valign="bottom">Total, n (%)</td><td align="left" valign="bottom">Conservative treatment, n (%)</td><td align="left" valign="bottom">Interventional treatment, n (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Soft tissue complications: wounds</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Bleeding</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">&#x2003;Hematoma</td><td align="left" valign="top">9 (0.7)</td><td align="left" valign="top">6 (0.5)</td><td align="left" valign="top">3 (0.2)</td></tr><tr><td align="left" valign="top">&#x2003;Prolonged wound drainage</td><td align="left" valign="top">1 (0.1)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">1 (0.1)</td></tr><tr><td align="left" valign="top">Soft tissue complications: infection</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Superficial wound infection</td><td align="left" valign="top">3 (0.2)</td><td align="left" valign="top">3 (0.2)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">&#x2003;Deep PJI<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="left" valign="top">3 (0.2)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">3 (0.2)</td></tr><tr><td align="left" valign="top">Soft tissue complications: neural deficit</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Motor nerve deficit</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">&#x2003;Transient sensory deficit (LFCN<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> sensitivity)</td><td align="left" valign="top">47 (3.6)</td><td align="left" valign="top">47 (3.6)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">Soft tissue complications: lower back pain</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Lumbago</td><td align="left" valign="top">6 (0.5)</td><td align="left" valign="top">6 (0.5)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">&#x2003;Sciatica</td><td align="left" valign="top">1 (0.1)</td><td align="left" valign="top">1 (0.1)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">Soft tissue complications: other</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Vascular Injury</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">&#x2003;Heterotopic Ossification</td><td align="left" valign="top">2 (0.2)</td><td align="left" valign="top">2 (0.2)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">&#x2003;Thromboembolic disease</td><td align="left" valign="top">3 (0.2)</td><td align="left" valign="top">3 (0.2)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">Mechanical complications: periprosthetic fracture</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Intraoperative</td><td align="left" valign="top">13 (1)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">13 (1)</td></tr><tr><td align="left" valign="top">&#x2003;Postoperative</td><td align="left" valign="top">5 (0.4)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">5 (0.4)</td></tr><tr><td align="left" valign="top">Mechanical complications: other</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Instability</td><td align="left" valign="top">7 (0.5)</td><td align="left" valign="top">3 (0.2)</td><td align="left" valign="top">4 (0.3)</td></tr><tr><td align="left" valign="top">&#x2003;Implant fracture</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">&#x2003;Loosening</td><td align="left" valign="top">2 (0.2)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">2 (0.2)</td></tr><tr><td align="left" valign="top">&#x2003;Cup-liner dislocation</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">&#x2003;Bearing surface wear</td><td align="left" valign="top">1 (0.1)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">1 (0.1)</td></tr><tr><td align="left" valign="top">&#x2003;Osteolysis</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td><td align="left" valign="top">0 (0)</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>PJI: prosthetic joint infection.</p></fn><fn id="table4fn2"><p><sup>b</sup>LFCN: lateral femoral cutaneous nerve.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Interventions in the 1-year post-operative period.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Intervention</td><td align="left" valign="bottom">Values (n=1290), n (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Intraoperative</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Cerclage and wiring</td><td align="left" valign="top">13 (1)</td></tr><tr><td align="left" valign="top">Outpatient</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Infiltration</td><td align="left" valign="top">0 (0)</td></tr><tr><td align="left" valign="top">&#x2003;Aspiration</td><td align="left" valign="top">3 (0.2)</td></tr><tr><td align="left" valign="top">Reoperation</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Wound debridement</td><td align="left" valign="top">2 (0.2)</td></tr><tr><td align="left" valign="top">&#x2003;Closed reduction</td><td align="left" valign="top">2 (0.2)</td></tr><tr><td align="left" valign="top">&#x2003;Osteosynthesis or cerclage</td><td align="left" valign="top">2 (0.2)</td></tr><tr><td align="left" valign="top">Other</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Revision</td><td align="left" valign="top">9 (0.7)</td></tr><tr><td align="left" valign="top">&#x2003;Readmission</td><td align="left" valign="top">12 (0.9)</td></tr></tbody></table></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study reflects the use of AI techniques to streamline and improve data capture from EHRs, in line with the current need for innovative solutions to obtain meaningful information from existing data sources in the field of orthopedics [<xref ref-type="bibr" rid="ref6">6</xref>]. AI-supported automation, substantiated in the first step by directly comparing it with a manual review of a random sample of patients, showed no statistical differences in accuracy across all compared clinical concepts. Subsequently, application of the algorithm to the entire dataset generated very high <italic>F</italic><sub>1</sub>-scores, therefore, validating its ability to detect positive results in our cohort with a high degree of precision and recall. This allowed a single-surgeon registry to be populated from existing health data within EHRs in a very short period of time. The NLP pipeline handled documentation variability using named entity recognition, probabilistic entity linking, and attribute extraction, allowing synonym recognition and standardization to SNOMED-CT and UMLS CUIs. This data-driven approach ensured robust identification of complications across different documentation sources. Furthermore, the methodology deployed in this study allows for inclusion of data from different software sources, which can be a limitation of single-surgeon registries that must be populated from diverse clinics or ambulatory care centers. The resulting multicenter, single-surgeon database is comparable in its granularity to single-system registries populated with conventional methods, circumventing the complexity of a system that is becoming increasingly fragmented.</p><p>The methodology that was previously described in a smaller cohort of Dutch patients is validated here in a multicenter, US-based practice, screening records in English from 1290 patients over an 8-year period at high accuracy [<xref ref-type="bibr" rid="ref4">4</xref>]. It also demonstrates its usefulness in the nonacademic setting, compared with previous studies at academic centers [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. Analysis of such a large cohort from a single surgeon permitted categorization of frequent concepts without needing to account for the confounding variables of different techniques and complication rates of multiple surgeons [<xref ref-type="bibr" rid="ref9">9</xref>].</p><p>Our dataset split balances annotation feasibility and model performance, following previous clinical NLP studies. Small, high-quality training sets have been shown to be effective in constrained domains, particularly when leveraging structured reporting patterns [<xref ref-type="bibr" rid="ref10">10</xref>]. The chosen test set size aligns with established practices in clinical NLP research [<xref ref-type="bibr" rid="ref11">11</xref>]. Instead of relying solely on predefined training-validation-test ratios, we incorporated post hoc validation on a large dataset to assess generalizability, a common strategy in clinical text mining [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p><p>In addition, clinical insight was also gained regarding the frequency and management of complications over a 1-year period. While the study highlights the effectiveness of NLP tools in single surgeon practices, extensive datasets can greatly benefit from its capabilities. NLP tools offer versatility in both big data settings and smaller subsets, enabling comprehensive analysis across various practice settings and facilitating evaluation of outcomes, for example, relative to regional averages or previously published work.</p><p>Ultimately, concept detection and extraction of the pipeline demonstrated accuracy on par with human reviewers at a fraction of the cost and time required for manual chart review. Validation is a necessary step for algorithm use that benefits from physicians&#x2019; feedback through annotation. This input is necessary to test algorithm performance, to calibrate the algorithm&#x2019;s rates of false positives and false negatives, and to examine if clinical use of algorithms leads to better research insights and health care services [<xref ref-type="bibr" rid="ref14">14</xref>]. The ease and high degree of fidelity of concept extraction by the algorithm in this study facilitated longitudinal evaluation of clinical complications, and importantly, also precluded the need to manually filter through patient charts, which is time-consuming [<xref ref-type="bibr" rid="ref15">15</xref>].</p></sec><sec id="s4-2"><title>Comparison With Previous Work</title><p>The representativeness of the methodology in this study is hence reflected by the frequency of the complications, which falls within the lower range of previously described cohorts [<xref ref-type="bibr" rid="ref16">16</xref>]. For instance, a frequency of 1% of periprosthetic fractures was detected, which was the most common intraoperative complication in this study, and was found to be 2.1%, 1.6%, and 1.1% in other cohorts [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Other similar comparisons show that revisions were detected in 0.7% (9/1290) of patients in our study vs 2.1% (5/239) and 1.6% (3/187), and prosthetic joint infection, at 0.2% (3/1290) in our study, appeared in 1.3% (3/239) and 1.6% (3/187) of patients in the aforementioned studies [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. In a prospective comparison of DAA to posterior approach THA (43 DAA THAs in total), 2.3% (1/43) had hematoma vs 0.7% (9/1290) in our study, 2.3% (1/43) presented heterotopic ossification vs 0.2% (3/1290) shown here, and neither study detected dislocations [<xref ref-type="bibr" rid="ref18">18</xref>]. Therefore, the results obtained using the validated, NLP-driven methodology shown here also highlight the quality of practice of the surgeon, for the complications described in this study fall within the lower range of those previously described in the literature [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref20">20</xref>].</p></sec><sec id="s4-3"><title>Limitations</title><p>As is the case in real-world evidence studies, there are certain limitations to consider for this study, such as missing values for certain variables. Regarding rare concepts such as bleeding, the scarcity of terms found in the EHRs may hinder algorithm training. The algorithm solely focused on patients undergoing DAA THA, which is the method used by the surgeon, but its validity could be further strengthened by expanding the analyses to other populations. In addition, the quality of records kept at each site determines the quality of algorithm training, highlighting the need for ongoing validation processes as the database expands. Missing structured data were treated as true absences and were not imputed. For unstructured text, missing values could reflect a lack of documentation or true absences. Manual review helped assess whether missing information stemmed from documentation gaps or NLP constraints. While a single-surgeon dataset ensures consistency in surgical technique and documentation style, it may limit generalizability to other surgical practices. However, the inclusion of multisource EHR data and independent validation by multiple reviewers helps mitigate this potential bias.</p></sec><sec id="s4-4"><title>Conclusions</title><p>In this study, the NLP pipeline proved highly effective in improving data capture and enhancing clinical outcomes analysis following DAA THA, overcoming constraints linked to single-surgeon registries, which typically require data aggregation from multiple care sites. It holds significant potential for future orthopedic studies, providing accurate and cost-effective insights. In addition, the dataset supports the low early complication rate of direct anterior THA in this surgeon&#x2019;s multicenter practice.</p></sec></sec></body><back><fn-group><fn fn-type="conflict"><p>NHM declares the following conflicts of interest: royalties from Medenvision and Synthes; speakers bureau or paid presentations for DePuy, Medenvision, and Mizuho/OSI; paid consultancy for Medacta USA and Medenvision; stock or stock options in DEO, Docspera, Ostaudio, OutcomeMD, and Radlink; board member of the Anterior Hip Foundation. DH is part of the management and CLO is an employee at LynxCare, Inc.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">CUI</term><def><p>Concept Unique Identifier</p></def></def-item><def-item><term id="abb3">DAA</term><def><p>direct anterior approach</p></def></def-item><def-item><term id="abb4">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb5">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb6">SNOMED-CT</term><def><p>Systematized Nomenclature of Medicine-Clinical Terms</p></def></def-item><def-item><term id="abb7">THA</term><def><p>total hip arthroplasty</p></def></def-item><def-item><term id="abb8">UMLS</term><def><p>Unified Medical Language System</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Learmonth</surname><given-names>ID</given-names> </name><name name-style="western"><surname>Young</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rorabeck</surname><given-names>C</given-names> </name></person-group><article-title>The operation of the century: total hip replacement</article-title><source>The Lancet</source><year>2007</year><month>10</month><volume>370</volume><issue>9597</issue><fpage>1508</fpage><lpage>1519</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(07)60457-7</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>GC</given-names> </name><name name-style="western"><surname>Marconi</surname><given-names>D</given-names> </name></person-group><article-title>Complications following direct anterior hip procedures: costs to both patients and surgeons</article-title><source>J Arthroplasty</source><year>2015</year><month>09</month><volume>30</volume><issue>9 Suppl</issue><fpage>98</fpage><lpage>101</lpage><pub-id pub-id-type="doi">10.1016/j.arth.2015.03.043</pub-id><pub-id pub-id-type="medline">26118568</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bozic</surname><given-names>KJ</given-names> </name><name name-style="western"><surname>Grosso</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>Variation in hospital-level risk-standardized complication rates following elective primary total hip and knee arthroplasty</article-title><source>J Bone Joint Surg Am</source><year>2014</year><month>04</month><day>16</day><volume>96</volume><issue>8</issue><fpage>640</fpage><lpage>647</lpage><pub-id pub-id-type="doi">10.2106/JBJS.L.01639</pub-id><pub-id pub-id-type="medline">24740660</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Van de Meulebroucke</surname><given-names>C</given-names> </name><name name-style="western"><surname>Beckers</surname><given-names>J</given-names> </name><name name-style="western"><surname>Corten</surname><given-names>K</given-names> </name></person-group><article-title>What can we expect following anterior total hip arthroplasty on a regular operating table? A validation study of an artificial intelligence algorithm to monitor adverse events in a high-volume, nonacademic setting</article-title><source>J Arthroplasty</source><year>2019</year><month>10</month><volume>34</volume><issue>10</issue><fpage>2260</fpage><lpage>2266</lpage><pub-id pub-id-type="doi">10.1016/j.arth.2019.07.039</pub-id><pub-id pub-id-type="medline">31445868</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Healy</surname><given-names>WL</given-names> </name><name name-style="western"><surname>Iorio</surname><given-names>R</given-names> </name><name name-style="western"><surname>Clair</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Pellegrini</surname><given-names>VD</given-names> </name><name name-style="western"><surname>Della Valle</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Berend</surname><given-names>KR</given-names> </name></person-group><article-title>Complications of total hip arthroplasty: standardized list, definitions, and stratification developed by the hip society</article-title><source>Clin Orthop Relat Res</source><year>2016</year><month>02</month><volume>474</volume><issue>2</issue><fpage>357</fpage><lpage>364</lpage><pub-id pub-id-type="doi">10.1007/s11999-015-4341-7</pub-id><pub-id pub-id-type="medline">26040966</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zsidai</surname><given-names>B</given-names> </name><name name-style="western"><surname>Kaarre</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hilkert</surname><given-names>AS</given-names> </name><etal/></person-group><article-title>Accelerated evidence synthesis in orthopaedics-the roles of natural language processing, expert annotation and large language models</article-title><source>J Exp Orthop</source><year>2023</year><month>09</month><day>28</day><volume>10</volume><issue>1</issue><fpage>99</fpage><pub-id pub-id-type="doi">10.1186/s40634-023-00662-4</pub-id><pub-id pub-id-type="medline">37768352</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wyles</surname><given-names>CC</given-names> </name><name name-style="western"><surname>Tibbo</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Fu</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Use of natural language processing algorithms to identify common data elements in operative notes for total hip arthroplasty</article-title><source>J Bone Joint Surg Am</source><year>2019</year><month>11</month><day>6</day><volume>101</volume><issue>21</issue><fpage>1931</fpage><lpage>1938</lpage><pub-id pub-id-type="doi">10.2106/JBJS.19.00071</pub-id><pub-id pub-id-type="medline">31567670</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Flores-Balado</surname><given-names>&#x00C1;</given-names> </name><name name-style="western"><surname>Castresana M&#x00E9;ndez</surname><given-names>C</given-names> </name><name name-style="western"><surname>Herrero Gonz&#x00E1;lez</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Using artificial intelligence to reduce orthopedic surgical site infection surveillance workload: algorithm design, validation, and implementation in 4 Spanish hospitals</article-title><source>Am J Infect Control</source><year>2023</year><month>11</month><volume>51</volume><issue>11</issue><fpage>1225</fpage><lpage>1229</lpage><pub-id pub-id-type="doi">10.1016/j.ajic.2023.04.165</pub-id><pub-id pub-id-type="medline">37100291</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Frenkel Rutenberg</surname><given-names>T</given-names> </name><name name-style="western"><surname>Vitenberg</surname><given-names>M</given-names> </name><name name-style="western"><surname>Daglan</surname><given-names>E</given-names> </name><name name-style="western"><surname>Kadar</surname><given-names>A</given-names> </name><name name-style="western"><surname>Shemesh</surname><given-names>S</given-names> </name></person-group><article-title>Single surgeon versus co-surgeons in primary total joint arthroplasty: does &#x201C;two is better than one&#x201D; apply to surgeons?</article-title><source>J Pers Med</source><year>2022</year><month>10</month><day>9</day><volume>12</volume><issue>10</issue><fpage>1683</fpage><pub-id pub-id-type="doi">10.3390/jpm12101683</pub-id><pub-id pub-id-type="medline">36294821</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wen</surname><given-names>A</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>L</given-names> </name><etal/></person-group><article-title>An open natural language processing (NLP) framework for EHR-based clinical research: a case demonstration using the National COVID Cohort Collaborative (N3C)</article-title><source>J Am Med Inform Assoc</source><year>2023</year><month>11</month><day>17</day><volume>30</volume><issue>12</issue><fpage>2036</fpage><lpage>2040</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocad134</pub-id><pub-id pub-id-type="medline">37555837</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johnson</surname><given-names>AEW</given-names> </name><name name-style="western"><surname>Pollard</surname><given-names>TJ</given-names> </name><name name-style="western"><surname>Shen</surname><given-names>L</given-names> </name><etal/></person-group><article-title>MIMIC-III, a freely accessible critical care database</article-title><source>Sci Data</source><year>2016</year><month>05</month><day>24</day><volume>3</volume><issue>1</issue><fpage>160035</fpage><pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id><pub-id pub-id-type="medline">27219127</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chapman</surname><given-names>WW</given-names> </name><name name-style="western"><surname>Nadkarni</surname><given-names>PM</given-names> </name><name name-style="western"><surname>Hirschman</surname><given-names>L</given-names> </name><name name-style="western"><surname>D&#x2019;Avolio</surname><given-names>LW</given-names> </name><name name-style="western"><surname>Savova</surname><given-names>GK</given-names> </name><name name-style="western"><surname>Uzuner</surname><given-names>O</given-names> </name></person-group><article-title>Overcoming barriers to NLP for clinical text: the role of shared tasks and the need for additional creative solutions</article-title><source>J Am Med Inform Assoc</source><year>2011</year><volume>18</volume><issue>5</issue><fpage>540</fpage><lpage>543</lpage><pub-id pub-id-type="doi">10.1136/amiajnl-2011-000465</pub-id><pub-id pub-id-type="medline">21846785</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Uzuner</surname><given-names>O</given-names> </name><name name-style="western"><surname>Solti</surname><given-names>I</given-names> </name><name name-style="western"><surname>Cadag</surname><given-names>E</given-names> </name></person-group><article-title>Extracting medication information from clinical text</article-title><source>J Am Med Inform Assoc</source><year>2010</year><volume>17</volume><issue>5</issue><fpage>514</fpage><lpage>518</lpage><pub-id pub-id-type="doi">10.1136/jamia.2010.003947</pub-id><pub-id pub-id-type="medline">20819854</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gundersen</surname><given-names>T</given-names> </name><name name-style="western"><surname>B&#x00E6;r&#x00F8;e</surname><given-names>K</given-names> </name></person-group><article-title>The future ethics of artificial intelligence in medicine: making sense of collaborative models</article-title><source>Sci Eng Ethics</source><year>2022</year><month>04</month><day>1</day><volume>28</volume><issue>2</issue><fpage>17</fpage><pub-id pub-id-type="doi">10.1007/s11948-022-00369-2</pub-id><pub-id pub-id-type="medline">35362822</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gauthier</surname><given-names>MP</given-names> </name><name name-style="western"><surname>Law</surname><given-names>JH</given-names> </name><name name-style="western"><surname>Le</surname><given-names>LW</given-names> </name><etal/></person-group><article-title>Automating access to real-world evidence</article-title><source>JTO Clin Res Rep</source><year>2022</year><month>06</month><volume>3</volume><issue>6</issue><fpage>100340</fpage><pub-id pub-id-type="doi">10.1016/j.jtocrr.2022.100340</pub-id><pub-id pub-id-type="medline">35719866</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alva</surname><given-names>A</given-names> </name><name name-style="western"><surname>Nizam</surname><given-names>I</given-names> </name><name name-style="western"><surname>Gogos</surname><given-names>S</given-names> </name></person-group><article-title>Minimizing complications in bikini incision direct anterior approach total hip arthroplasty: a single surgeon series of 865 cases</article-title><source>J Exp Orthop</source><year>2021</year><month>01</month><day>4</day><volume>8</volume><issue>1</issue><fpage>1</fpage><pub-id pub-id-type="doi">10.1186/s40634-020-00318-7</pub-id><pub-id pub-id-type="medline">33394190</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Soza</surname><given-names>D</given-names> </name><name name-style="western"><surname>Pujol</surname><given-names>O</given-names> </name><name name-style="western"><surname>Lara</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Castellanos</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hern&#x00E1;ndez</surname><given-names>A</given-names> </name><name name-style="western"><surname>Barro</surname><given-names>V</given-names> </name></person-group><article-title>A comparative of a single novice surgeon&#x2019;s direct anterior approach and posterior approach learning curves in total hip arthroplasty: a retrospective cohort study</article-title><source>Eur J Orthop Surg Traumatol</source><year>2022</year><month>05</month><volume>32</volume><issue>4</issue><fpage>767</fpage><lpage>774</lpage><pub-id pub-id-type="doi">10.1007/s00590-021-03039-4</pub-id><pub-id pub-id-type="medline">34129119</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Barrett</surname><given-names>WP</given-names> </name><name name-style="western"><surname>Turner</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Leopold</surname><given-names>JP</given-names> </name></person-group><article-title>Prospective randomized study of direct anterior vs postero-lateral approach for total hip arthroplasty</article-title><source>J Arthroplasty</source><year>2013</year><month>10</month><volume>28</volume><issue>9</issue><fpage>1634</fpage><lpage>1638</lpage><pub-id pub-id-type="doi">10.1016/j.arth.2013.01.034</pub-id><pub-id pub-id-type="medline">23523485</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wernly</surname><given-names>D</given-names> </name><name name-style="western"><surname>Wegrzyn</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lallemand</surname><given-names>G</given-names> </name><name name-style="western"><surname>Mahlouly</surname><given-names>J</given-names> </name><name name-style="western"><surname>Tissot</surname><given-names>C</given-names> </name><name name-style="western"><surname>Antoniadis</surname><given-names>A</given-names> </name></person-group><article-title>Total hip arthroplasty through the direct anterior approach with and without the use of a traction table: a matched-control, retrospective, single-surgeon study</article-title><source>J Orthop Surg Res</source><year>2021</year><month>01</month><day>11</day><volume>16</volume><issue>1</issue><fpage>45</fpage><pub-id pub-id-type="doi">10.1186/s13018-020-02184-6</pub-id><pub-id pub-id-type="medline">33430917</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>De Geest</surname><given-names>T</given-names> </name><name name-style="western"><surname>Fennema</surname><given-names>P</given-names> </name><name name-style="western"><surname>Lenaerts</surname><given-names>G</given-names> </name><name name-style="western"><surname>De Loore</surname><given-names>G</given-names> </name></person-group><article-title>Adverse effects associated with the direct anterior approach for total hip arthroplasty: a Bayesian meta-analysis</article-title><source>Arch Orthop Trauma Surg</source><year>2015</year><month>08</month><volume>135</volume><issue>8</issue><fpage>1183</fpage><lpage>1192</lpage><pub-id pub-id-type="doi">10.1007/s00402-015-2258-y</pub-id><pub-id pub-id-type="medline">26081800</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Data sources, categories, and concept unique identifiers of all clinical data points.</p><media xlink:href="medinform_v13i1e64705_app1.docx" xlink:title="DOCX File, 38 KB"/></supplementary-material></app-group></back></article>