<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v10i2e30483</article-id>
      <article-id pub-id-type="pmid">35107432</article-id>
      <article-id pub-id-type="doi">10.2196/30483</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Disease Progression of Hypertrophic Cardiomyopathy: Modeling Using Machine Learning</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kahlon</surname>
            <given-names>Tanvir</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Li</surname>
            <given-names>Peng</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Bhadra</surname>
            <given-names>Presenjit</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Pičulin</surname>
            <given-names>Matej</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <address>
            <institution>Faculty of Computer and Information Science</institution>
            <institution>University of Ljubljana</institution>
            <addr-line>Večna pot 113</addr-line>
            <addr-line>Ljubljana, 1000</addr-line>
            <country>Slovenia</country>
            <phone>386 1 479 8226</phone>
            <email>matej.piculin@fri.uni-lj.si</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3883-476X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Smole</surname>
            <given-names>Tim</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5713-7628</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Žunkovič</surname>
            <given-names>Bojan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5085-2506</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Kokalj</surname>
            <given-names>Enja</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8158-767X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Robnik-Šikonja</surname>
            <given-names>Marko</given-names>
          </name>
          <degrees>Prof Dr, PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1232-3320</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Kukar</surname>
            <given-names>Matjaž</given-names>
          </name>
          <degrees>Prof Dr, PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1242-7947</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Fotiadis</surname>
            <given-names>Dimitrios I</given-names>
          </name>
          <degrees>Prof Dr, PhD</degrees>
          <xref rid="aff02" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7362-5082</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Pezoulas</surname>
            <given-names>Vasileios C</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff02" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1872-693X</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Tachos</surname>
            <given-names>Nikolaos S</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff02" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8627-6352</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Barlocco</surname>
            <given-names>Fausto</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <xref rid="aff04" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4342-8459</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Mazzarotto</surname>
            <given-names>Francesco</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <xref rid="aff04" ref-type="aff">4</xref>
          <xref rid="aff05" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6159-9980</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Popović</surname>
            <given-names>Dejana</given-names>
          </name>
          <degrees>MD, Prof Dr, PhD</degrees>
          <xref rid="aff06" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6647-5872</ext-link>
        </contrib>
        <contrib id="contrib13" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Maier</surname>
            <given-names>Lars S</given-names>
          </name>
          <degrees>Prof Dr, PhD</degrees>
          <xref rid="aff07" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9915-4429</ext-link>
        </contrib>
        <contrib id="contrib14" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Velicki</surname>
            <given-names>Lazar</given-names>
          </name>
          <degrees>MD, Prof Dr, PhD</degrees>
          <xref rid="aff08" ref-type="aff">8</xref>
          <xref rid="aff09" ref-type="aff">9</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2907-819X</ext-link>
        </contrib>
        <contrib id="contrib15" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Olivotto</surname>
            <given-names>Iacopo</given-names>
          </name>
          <degrees>MD, Prof Dr</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <xref rid="aff04" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1751-9266</ext-link>
        </contrib>
        <contrib id="contrib16" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>MacGowan</surname>
            <given-names>Guy A</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff10" ref-type="aff">10</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2685-4165</ext-link>
        </contrib>
        <contrib id="contrib17" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Jakovljević</surname>
            <given-names>Djordje G</given-names>
          </name>
          <degrees>MD, Prof Dr, PhD</degrees>
          <xref rid="aff10" ref-type="aff">10</xref>
          <xref rid="aff11" ref-type="aff">11</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2686-6542</ext-link>
        </contrib>
        <contrib id="contrib18" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Filipović</surname>
            <given-names>Nenad</given-names>
          </name>
          <degrees>Prof Dr, PhD</degrees>
          <xref rid="aff12" ref-type="aff">12</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9964-5615</ext-link>
        </contrib>
        <contrib id="contrib19" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Bosnić</surname>
            <given-names>Zoran</given-names>
          </name>
          <degrees>Prof Dr, PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0501-7146</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff01">
        <label>1</label>
        <institution>Faculty of Computer and Information Science</institution>
        <institution>University of Ljubljana</institution>
        <addr-line>Ljubljana</addr-line>
        <country>Slovenia</country>
      </aff>
      <aff id="aff02">
        <label>2</label>
        <institution>Unit of Medical Technology and Intelligent Information Systems</institution>
        <institution>Department of Materials Science and Engineering</institution>
        <institution>University of Ioannina</institution>
        <addr-line>Ioannina</addr-line>
        <country>Greece</country>
      </aff>
      <aff id="aff03">
        <label>3</label>
        <institution>Department of Experimental and Clinical Medicine</institution>
        <institution>University of Florence</institution>
        <addr-line>Florence</addr-line>
        <country>Italy</country>
      </aff>
      <aff id="aff04">
        <label>4</label>
        <institution>Cardiomyopathy Unit</institution>
        <institution>Careggi University Hospital</institution>
        <institution>University of Florence</institution>
        <addr-line>Florence</addr-line>
        <country>Italy</country>
      </aff>
      <aff id="aff05">
        <label>5</label>
        <institution>National Heart and Lung Institute</institution>
        <institution>Imperial College London</institution>
        <addr-line>London</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff06">
        <label>6</label>
        <institution>Clinic for Cardiology</institution>
        <institution>Clinical Center of Serbia</institution>
        <institution>University of Belgrade</institution>
        <addr-line>Belgrade</addr-line>
        <country>Serbia</country>
      </aff>
      <aff id="aff07">
        <label>7</label>
        <institution>Department of Internal Medicine II (Cardiology, Pneumology, Intensive Care Medicine)</institution>
        <institution>University Hospital Regensburg</institution>
        <addr-line>Regensburg</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff08">
        <label>8</label>
        <institution>Faculty of Medicine</institution>
        <institution>University of Novi Sad</institution>
        <addr-line>Novi Sad</addr-line>
        <country>Serbia</country>
      </aff>
      <aff id="aff09">
        <label>9</label>
        <institution>Institute of Cardiovascular Diseases Vojvodina</institution>
        <addr-line>Sremska Kamenica</addr-line>
        <country>Serbia</country>
      </aff>
      <aff id="aff10">
        <label>10</label>
        <institution>Translational and Clinical Research Institute</institution>
        <institution>Faculty of Medical Sciences</institution>
        <institution>Newcastle University</institution>
        <addr-line>Newcastle upon Tyne</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff11">
        <label>11</label>
        <institution>Faculty of Health and Life Sciences</institution>
        <institution>Coventry University</institution>
        <addr-line>Coventry</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff12">
        <label>12</label>
        <institution>Bioengineering Research and Development Center</institution>
        <addr-line>Kragujevac</addr-line>
        <country>Serbia</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Matej Pičulin <email>matej.piculin@fri.uni-lj.si</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>2</month>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>2</day>
        <month>2</month>
        <year>2022</year>
      </pub-date>
      <volume>10</volume>
      <issue>2</issue>
      <elocation-id>e30483</elocation-id>
      <history>
        <date date-type="received">
          <day>18</day>
          <month>5</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>27</day>
          <month>9</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>27</day>
          <month>10</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>4</day>
          <month>12</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Matej Pičulin, Tim Smole, Bojan Žunkovič, Enja Kokalj, Marko Robnik-Šikonja, Matjaž Kukar, Dimitrios I Fotiadis, Vasileios C Pezoulas, Nikolaos S Tachos, Fausto Barlocco, Francesco Mazzarotto, Dejana Popović, Lars S Maier, Lazar Velicki, Iacopo Olivotto, Guy A MacGowan, Djordje G Jakovljević, Nenad Filipović, Zoran Bosnić. Originally published in JMIR Medical Informatics (https://medinform.jmir.org), 02.02.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on https://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2022/2/e30483" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Cardiovascular disorders in general are responsible for 30% of deaths worldwide. Among them, hypertrophic cardiomyopathy (HCM) is a genetic cardiac disease that is present in about 1 of 500 young adults and can cause sudden cardiac death (SCD).</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>Although the current state-of-the-art methods model the risk of SCD for patients, to the best of our knowledge, no methods are available for modeling the patient's clinical status up to 10 years ahead. In this paper, we propose a novel machine learning (ML)-based tool for predicting disease progression for patients diagnosed with HCM in terms of adverse remodeling of the heart during a 10-year period.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>The method consisted of 6 predictive regression models that independently predict future values of 6 clinical characteristics: left atrial size, left atrial volume, left ventricular ejection fraction, New York Heart Association functional classification, left ventricular internal diastolic diameter, and left ventricular internal systolic diameter. We supplemented each prediction with the explanation that is generated using the Shapley additive explanation method.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The final experiments showed that predictive error is lower on 5 of the 6 constructed models in comparison to experts (on average, by 0.34) or a consortium of experts (on average, by 0.22). The experiments revealed that semisupervised learning and the artificial data from virtual patients help improve predictive accuracies. The best-performing random forest model improved R<sup>2</sup> from 0.3 to 0.6.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>By engaging medical experts to provide interpretation and validation of the results, we determined the models' favorable performance compared to the performance of experts for 5 of 6 targets.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>hypertrophic cardiomyopathy</kwd>
        <kwd>disease progression</kwd>
        <kwd>machine learning</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>AI</kwd>
        <kwd>ML</kwd>
        <kwd>cardiomyopathy</kwd>
        <kwd>cardiovascular disease</kwd>
        <kwd>sudden cardiac death</kwd>
        <kwd>SCD</kwd>
        <kwd>prediction</kwd>
        <kwd>prediction model</kwd>
        <kwd>validation</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Recent reviews of machine learning (ML) applications in cardiovascular medicine [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>] suggest that the use of ML is on the rise and that it is being adopted by doctors in their daily practice. ML applications in cardiology are reflected by augmenting medical practice by contributing to early diagnosis, risk stratification, and personalized therapeutics. The examples of such applications in other domains include modeling disease progression of Alzheimer disease [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>], Parkinson disease [<xref ref-type="bibr" rid="ref5">5</xref>], multiple sclerosis [<xref ref-type="bibr" rid="ref6">6</xref>], chronic kidney disease [<xref ref-type="bibr" rid="ref7">7</xref>], chronic liver disease [<xref ref-type="bibr" rid="ref8">8</xref>], and others.</p>
        <p>Cardiovascular disorders in general are responsible for 30% of deaths worldwide. Among them specifically, hypertrophic cardiomyopathy (HCM) is a genetic cardiac disease that is a cause of sudden cardiac death (SCD), especially among young adults and athletes [<xref ref-type="bibr" rid="ref9">9</xref>]. Cardiovascular diseases represent groups of diseases that can greatly benefit from preemptive prediction, prevention, and proactive management; thus, this opens an opportunity for methods of artificial intelligence (AI) [<xref ref-type="bibr" rid="ref2">2</xref>]. Disease progression is especially hard to detect in slow-progressing diseases, such as HCM, which is present in about 1 of 500 young adults [<xref ref-type="bibr" rid="ref10">10</xref>]. Although HCM has 4 identified stages [<xref ref-type="bibr" rid="ref11">11</xref>], patients with HCM can experience a sudden cardiac arrest or the disease can slowly progress over several years. Currently, the state-of-the-art HCM Risk-SCD calculator method for risk stratification of patients diagnosed with HCM [<xref ref-type="bibr" rid="ref12">12</xref>] is widely used in practice. Although this method predicts the risk of SCD, no methods, to the best of our knowledge, are available for modeling the patient's clinical status up to 10 years ahead. Detection of cardiovascular risk for 10 years ahead is important and has been recently modeled for atherosclerotic cardiovascular disease [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        <p>In this paper, we propose a novel ML-based tool for predicting disease progression for patients diagnosed with HCM in terms of adverse remodeling of the heart during a 10-year period. The method consists of 6 contemporaneous predictive regression models that independently predict future values of the following 6 clinical characteristics: left atrial diameter (LA_d), left atrial volume (LA_Vol), left ventricular ejection fraction (LVEF), New York Heart Association (NYHA) functional classification, left ventricular internal diameter at end diastole (LVIDd), and left ventricular internal diameter at end systole (LVIDs). Each prediction is supplemented with the explanation that is generated using the Shapley additive explanation (SHAP) method [<xref ref-type="bibr" rid="ref14">14</xref>]. Comparison between current and future values of these 6 parameters, as well as the interpretation of the change, generated by explanation methods, can help cardiologists gain insight into the disease progression trend for a given patient.</p>
      </sec>
      <sec>
        <title>Machine Learning Methods in Medicine</title>
        <p>ML techniques are being frequently applied in medicine to improve the prediction of disease progression, extraction of medical knowledge for outcome research, therapy planning and support, and overall patient management [<xref ref-type="bibr" rid="ref15">15</xref>]. A wide variety of ML approaches can solve challenging problems in these tasks. For example, diseases such as Alzheimer disease, diabetes, and chronic obstructive pulmonary disease (COPD) progress slowly over the years. For modeling of COPD, a Markov model was proposed by Wang et al [<xref ref-type="bibr" rid="ref16">16</xref>], who also included a database of virtual patients. Their method successfully modeled progression trajectories, showing that multiple progression trajectories are possible for some diseases.</p>
        <p>In cardiology, there are several works addressing disease progression trends related to different cardiological diseases. With the increase in computational power, ML has become a tool to analyze nonlinear dependencies that are present either in relational data or in images. Juarez-Orozco et al [<xref ref-type="bibr" rid="ref17">17</xref>] emphasized the advantages of ML, especially deep learning, in cardiac nuclear imaging, where ML can aid with ischemia diagnosis and event prognosis. Sardar et al [<xref ref-type="bibr" rid="ref18">18</xref>] emphasized the advantages of AI in interventional cardiology, which is promising to bring a paradigm shift in the practice of medicine by improving real-time clinical decision making and standardizing robotic medical procedures. While focusing on the use of ML in electrocardiogram (ECG) analysis, Elul et al [<xref ref-type="bibr" rid="ref19">19</xref>] also stated the crucial disadvantages of ML, which include a lack of explanation, relating the automated diagnosis with medical knowledge, and transparency of the system’s limitations. In their work, the authors proceeded to flag individual predictions that are irrelevant or not useful. To summarize, the mentioned works characterize AI as a developing tool that, with the synergy between humans and machines, will help transform medical practice and clinical care.</p>
        <p>Further, a hybrid approach for progression of Parkinson disease [<xref ref-type="bibr" rid="ref5">5</xref>] was successfully used by combining a variety of ML methods from different families: clustering, dimensional reduction, and incremental support vector regression. Deep learning was used for predicting Alzheimer disease, on average, about 6 years in advance [<xref ref-type="bibr" rid="ref20">20</xref>] and for modeling Alzheimer disease progression [<xref ref-type="bibr" rid="ref4">4</xref>]. Conditional restricted Boltzmann machines were also used for prediction of disease progression [<xref ref-type="bibr" rid="ref3">3</xref>]. The authors simulated patient trajectories using 18 months of longitudinal data of around 1900 patients and showed that patient-level simulations are feasible using ML and appropriate data.</p>
        <p>Several other ML approaches also model disease progression well in other medical domains, such as kidney disease progression [<xref ref-type="bibr" rid="ref7">7</xref>]. In this work, 9 ML approaches were tested: linear regression (LR), elastic net regression, lasso regression, ridge regression, support vector machines (SVMs), random forests (RFs), k-nearest neighbors (KNNs), neural networks (NNs), and XGBoost. Similarly, ML models were applied to the problem of disease progression for hepatitis C virus [<xref ref-type="bibr" rid="ref8">8</xref>] for the 5-year prediction problem using longitudinal data. The authors' conclusion was that the boosted survival tree-based models using longitudinal data perform better than cross-sectional or linear models. Last but not least, ML was also used for disease progression and secondary progression detection for multiple sclerosis [<xref ref-type="bibr" rid="ref6">6</xref>]. Several ML models were evaluated for predictions of disease severity in 6-10 years, such as KNNs, decision trees, LR, and SVMs. SVMs performed best.</p>
        <p>To summarize, the overview indicates that ML models can be successfully applied to problems of predicting disease progression, which is also the goal of this paper. In the next subsection, we overview how ML approaches are used in cardiology, specifically for HCM, which is the focus of this paper.</p>
      </sec>
      <sec>
        <title>Machine Learning for Modeling Hypertrophic Cardiomyopathy</title>
        <p>Most ML contributions to cardiovascular medicine focus on risk stratification of patients. One of the biggest obstacles to using data for a broader variety of ML applications is that data are usually stored in diverse repositories, which are not readily usable for cardiovascular research, due to various data quality challenges [<xref ref-type="bibr" rid="ref2">2</xref>]. Where the data are readily available, different ML algorithms have been successfully used, such as Wasserstein generative adversarial networks [<xref ref-type="bibr" rid="ref21">21</xref>], convolutional NNs [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>], deep NNs [<xref ref-type="bibr" rid="ref24">24</xref>], and boosted decision trees [<xref ref-type="bibr" rid="ref25">25</xref>]. Some authors have tested multiple models, such as RFs, artificial NNs, SVMs, and Bayesian networks [<xref ref-type="bibr" rid="ref26">26</xref>], or a combination of J48, naive Bayes, KNNs, SVMs, RFs, bagging, and boosting [<xref ref-type="bibr" rid="ref27">27</xref>]. Cuocolo et al [<xref ref-type="bibr" rid="ref1">1</xref>] overviewed ML methods in cardiology, emphasizing their successful applications for building clinical predictive models, for analyzing ECG signals and image data. For the latter problems, the most successful methods were NNs, deep NNs, and convolutional networks. Advances in prediction accuracy have also been made by using deep NNs to make predictions based on fast, large-scale genome-wide association studies [<xref ref-type="bibr" rid="ref28">28</xref>].</p>
        <p>HCM is a severe disease for which 4 stages of progression have been identified in the medical literature [<xref ref-type="bibr" rid="ref11">11</xref>]. Current state-of-the-art ML mostly uses only statistical models, such as multivariate regression analysis, which uses preselected predictor variables of known medical importance. Cardiac magnetic resonance (CMR) images [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>] and echocardiographic diagnostics [<xref ref-type="bibr" rid="ref31">31</xref>] are found to be a good source of important attributes for HCM identification. Recently, researchers have started proposing ML-based risk stratification for patients diagnosed with comorbidities to separate patients into low- and high-risk categories or several categories on a scale [<xref ref-type="bibr" rid="ref32">32</xref>]. The medical literature is mostly focused on finding risk factors that identify increased risk of SCD in patients with HCM [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. A study [<xref ref-type="bibr" rid="ref34">34</xref>] presenting the guidelines used in risk stratification for patients with HCM proposed potential SCD modifiers. Maron et al [<xref ref-type="bibr" rid="ref35">35</xref>] performed a similar study on older populations and also summarized risk factors that could prevent SCD. The continuation of this research [<xref ref-type="bibr" rid="ref36">36</xref>] aimed to develop an accurate strategy to assess the reliability of SCD prediction methods in prevention of SCD in patients diagnosed with HCM.</p>
        <p>It is important to note that patients with HCM who experience cardiac arrest are not identified by typical risk markers used in the American College of Cardiology or the statistical mathematical risk model by the European Society of Cardiology [<xref ref-type="bibr" rid="ref37">37</xref>]. Therefore, new risk factors have been and still need to be considered and developed to provide additional information to better assess HCM risk. In our work, we focus on modeling the future development of HCM by predicting the change in relevant cardiac parameters 10 years ahead.</p>
      </sec>
      <sec>
        <title>Aims and Contributions</title>
        <p>Novelties and contributions of this paper include:</p>
        <list list-type="bullet">
          <list-item>
            <p>A disease progression system that comprises models for prediction of 6 contemporaneous relevant clinical parameters that are relevant to HCM for 10 years ahead. The system includes the implementation of the explanation methodology that provides interpretability of predictive models.</p>
          </list-item>
          <list-item>
            <p>Analysis of predictive performance if training data are extended using semisupervised learning or with artificial patient data.</p>
          </list-item>
          <list-item>
            <p>Validation of predictive accuracy with medical experts by comparing ML and human accuracy and by analyzing sensibility of the computer-generated prediction explanations.</p>
          </list-item>
        </list>
        <p>The aim of this paper is to develop a system capable of detecting slow progression of HCM based on longitudinal data.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Modeling Disease Progression</title>
        <p>In this work, we modeled disease progression by predicting 6 relevant patient parameters 10 years in advance. These parameters are indicators of HCM and can be used to determine the stage of HCM according to the known guidelines [<xref ref-type="bibr" rid="ref37">37</xref>]. Additionally, a preliminary analysis was performed to verify the prediction strength of the chosen parameters, validating our choice, as described in the Data Set section. The proposed disease progression system (<xref rid="figure1" ref-type="fig">Figure 1</xref>) takes as input patients’ clinical data and data about their past disease-related events, such as dates of atrial fibrillation or syncope.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overview of the proposed disease progression system. The system receives clinical data and disease-related events of a patient as input, uses virtual patient data and semisupervised learning for self-improvement, and returns the predictions and their explanation for 6 target variables.</p>
          </caption>
          <graphic xlink:href="medinform_v10i2e30483_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The output of the system is a set of 6 contemporaneous target predictions for parameters:
             <list list-type="bullet"><list-item><p>LA_d</p></list-item><list-item><p>LA_Vol</p></list-item><list-item><p>LVEF</p></list-item><list-item><p>LVIDd</p></list-item><list-item><p>LVIDs</p></list-item><list-item><p>NYHA functional classification</p></list-item></list>
        </p>
        <p>In addition to predictions, the system also generates their explanations, revealing the factors with the largest impact on the increase or decrease in the 6 target variables throughout the 10-year period.</p>
        <p>We trained the proposed disease progression system using supervised ML techniques. To further improve the results, we augmented the original data using unlabeled data (semisupervised learning) and virtual patients’ data. We applied the semisupervised learning using patients without 10-year follow-ups and generated virtual patients’ data using various techniques for artificial data generation. The semisupervised learning first predicted patients' targets using the trained models on labeled data, so they could be afterward included into the training data set. In the following subsections, we describe the data set, predictive modeling with supervised models, use of semisupervised learning and virtual patient data, and generation of prediction explanations.</p>
      </sec>
      <sec>
        <title>Data Set</title>
        <p>The proposed approach was developed on a data set that was provided by the University of Florence as a result of its long-term clinical practice. The data set included patients who were enrolled over the past 40 years (<xref rid="figure2" ref-type="fig">Figure 2</xref>), and 1860 (80.24%) of 2318 patients had at least 1 available 10-year follow-up. They were followed for an average duration of about 7 years and ranging up to 37 years. The data set contains longitudinal clinical data for 2318 patients diagnosed with HCM or patients that had a relative diagnosed with HCM (1457 [62.86%] male and 861 [37.14%] female patients). During the patients' visits, various clinical tests and relevant disease-related events were recorded. These data included general data (gender, age, height, weight, etc), genetic data (detected mutations), clinical tests (echocardiogram [echo], Holter monitoring, blood test, CMR, stress test), prescribed medications (type, start date, termination date), and disease-related events (eg, SCD, heart failure, transplant, abnormal Holter, pacemaker or implantable cardioverter defibrillator implantation). Echo was the leading diagnostic reference technique that was performed for the vast majority of patients and thus represents the main source of data. CMR was additionally used selectively due to its greater accuracy in measuring volumes. Although echo and CMR are treated separately and never computationally compared to each other in medical practice, we used CMR, where available, as an additional data modality to possibly improve prediction accuracy. In total, there were 6227 events recorded, of which 4902 (78.72%) events occurred in patients who were primarily diagnosed with HCM. The structure of the data set therefore allowed observing how patients’ clinical characteristics change over time, which is essential for the desired modeling of HCM progression. The basic patient characteristics are shown in <xref ref-type="table" rid="table1">Table 1</xref> for continuous parameters, <xref ref-type="table" rid="table2">Table 2</xref> for binary parameters, and <xref ref-type="table" rid="table3">Table 3</xref> for the remaining parameters. The characteristics were extracted from 10,318 measurements in total. Additionally, <xref ref-type="table" rid="table4">Table 4</xref> shows the missing data numbers and percentages for the 6 selected target variables for their role as input or target variables.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Relationship between the amount of labeled and unlabeled data. The bars for Yes and No values are stacked, visually revealing the ratio between labeled and unlabeled data. Note that the rightmost columns do not have 10-year follow-up data, as they are less than 10 years.</p>
          </caption>
          <graphic xlink:href="medinform_v10i2e30483_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Basic characteristics of patients for basic continuous parameters (N=10,318).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="340"/>
            <col width="330"/>
            <col width="330"/>
            <thead>
              <tr valign="top">
                <td>Continuous parameter</td>
                <td>Mean (SD)</td>
                <td>Missing data, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Age (years)</td>
                <td>52.1 (18.6)</td>
                <td>4 (0.04)</td>
              </tr>
              <tr valign="top">
                <td>Weight (kg)</td>
                <td>73.4 (14.6)</td>
                <td>2381 (23.08)</td>
              </tr>
              <tr valign="top">
                <td>Height (cm)</td>
                <td>169 (10.3)</td>
                <td>2273 (22.03)</td>
              </tr>
              <tr valign="top">
                <td>Body mass index (BMI)</td>
                <td>25.6 (4.09)</td>
                <td>2423 (23.48)</td>
              </tr>
              <tr valign="top">
                <td>NYHA<sup>a</sup></td>
                <td>1.69 (0.73)</td>
                <td>983 (9.53)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>NYHA: New York Heart Association.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Basic characteristics of patients for basic binary parameters (N=10,318).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Binary parameter</td>
                <td>1-value, n (%)</td>
                <td>0-value, n (%)</td>
                <td>Missing, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Alcohol</td>
                <td>Yes, 103 (0.99)</td>
                <td>No, 10,215 (99)</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>Drug</td>
                <td>Yes, 18 (0.17)</td>
                <td>No, 10,300 (99.83)</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>Smoking</td>
                <td>Yes, 3437 (33.31)</td>
                <td>No, 6881 (66.69)</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>Pregnancy</td>
                <td>Yes, 443 (4.29)</td>
                <td>No, 9875 (95.71)</td>
                <td>2515 (24.37)</td>
              </tr>
              <tr valign="top">
                <td>Gender</td>
                <td>Male, 6400 (62.03)</td>
                <td>Female, 3918 (37.97)</td>
                <td>0</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Basic characteristics for groups of parameters (N=10,318)<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="340"/>
            <col width="330"/>
            <col width="330"/>
            <thead>
              <tr valign="top">
                <td>Procedure</td>
                <td>Parameters, n</td>
                <td>Total missing values, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>ECG<sup>b</sup></td>
                <td>9</td>
                <td>45,839 (49.36)</td>
              </tr>
              <tr valign="top">
                <td>Echo<sup>c</sup></td>
                <td>26</td>
                <td>98,191 (36.60)</td>
              </tr>
              <tr valign="top">
                <td>CMR<sup>d</sup></td>
                <td>10</td>
                <td>81,174 (78.67)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>The table shows aggregated statistics for several parameters obtained from the same procedure. The percentage for each procedure is obtained as follows: [Total missing values/(Parameter × N)] × 100.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>ECG: electrocardiogram.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>Echo: echocardiogram.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>CMR: cardiovascular magnetic resonance.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Absolute number and percentage of missing values of target variables as class and as input (N=10,318).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <thead>
              <tr valign="bottom">
                <td>
                  <break/>
                </td>
                <td>LA_d<sup>a</sup>, n (%)</td>
                <td>LVEF<sup>b</sup>, n (%)</td>
                <td>NYHA<sup>c</sup>, n (%)</td>
                <td>LVIDd<sup>d</sup>, n (%)</td>
                <td>LVIDs<sup>e</sup>, n (%)</td>
                <td>LA_Vol<sup>f</sup>, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Target</td>
                <td>8569 (83.05)</td>
                <td>8481 (82.19)</td>
                <td>8313 (80.57)</td>
                <td>8607 (83.42)</td>
                <td>9336 (90.48)</td>
                <td>8631 (83.65)</td>
              </tr>
              <tr valign="top">
                <td>Input</td>
                <td>2691 (26.08)</td>
                <td>2399 (23.25)</td>
                <td>983 (9.53)</td>
                <td>2517 (24.39)</td>
                <td>5329 (51.65)</td>
                <td>3680 (35.67)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>LA_d: left atrial diameter.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>LVEF: left ventricular ejection fraction.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>NYHA: New York Heart Association.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>LVIDd: left ventricular internal diameter at end diastole.</p>
            </fn>
            <fn id="table4fn5">
              <p><sup>e</sup>LVIDs: left ventricular internal diameter at end systole.</p>
            </fn>
            <fn id="table4fn6">
              <p><sup>f</sup>LA_Vol: left atrial volume.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>First, we transformed the available data set into a suitable form for predicting a 10-year change in relevant parameters using ML. Similarly, in other real-world data sets, most of the clinical tests were missing many patients or measurements were not taken for the whole span of 10 years (<xref rid="figure2" ref-type="fig">Figure 2</xref>). To address this issue, we preprocessed the data as follows:</p>
        <list list-type="bullet">
          <list-item>
            <p>Formation of training examples: Since not all clinical tests can be conducted on the same day or in the same month, we defined a training example as a set of measurements within a time frame of 1 year. Such time frame corresponds to the annual regular visit period of patients and allows enough time for relevant changes in the observed parameters to become noticeable, as the disease slowly progresses. If the patient had a certain test performed multiple times within this time frame, multiple tests were treated as separate measurements. In case a certain type of test was not performed in the 1-year time frame, the corresponding variables were recorded as missing. Constructing training examples in this way yielded a data set with 13,386 examples, with 3.9 (SD 4.8) examples per patient.</p>
          </list-item>
          <list-item>
            <p>Imputation of missing data: The missing values in the data set, either because of nonperformed tests or because of erroneous input of data, were imputed by copying the closest past values (sensible because the progression of HCM is slow; used on numerical and categorical attributes), imputing values of a healthy patient (sampled from the normal distribution; used for numerical attributes), or imputing mean values where healthy values were unknown (used on numerical and categorical attributes). Since measurements were not taken at equidistant time intervals, we used linear interpolation for computing equidistant measurement approximations.</p>
          </list-item>
        </list>
        <p>We used the formed training examples as input to supervised learning algorithms. Prior to modeling, we evaluated the quality of attributes, which is important for decreasing learning complexity, avoiding overfitting, and, therefore, improving the simplicity and performance of ML methods. To facilitate learning with NNs, we also scaled the values to the interval [0,1] and encoded nominal values using the one-hot encoding method.</p>
        <p>We used RReliefF [<xref ref-type="bibr" rid="ref38">38</xref>], adaptation of the ReliefF feature selection algorithm, for regression problems. RReliefF calculates how well a feature’s values distinguish between distant labels of instances that are close to each other and considers feature interactions. We selected 21 (18.7%) of 112 attributes based on the average rank across all 6 target variables for further supervised learning. Feature scores for 21 selected features are shown in <xref ref-type="table" rid="table5">Table 5</xref>, along with their average ranks across 6 trained predictive models. After removing highly correlated features (eg, the weight feature that correlates to the body surface area [BSA] and height), the final set of attributes contained all target variables (regardless of their rank) and the best-performing attributes, based on average rank.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Selected attributes using RReliefF.<sup>a</sup></p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="260"/>
            <col width="90"/>
            <col width="90"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="110"/>
            <col width="120"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Variable<sup>b</sup></td>
                <td>LA_d<sup>c</sup> score</td>
                <td>LVEF<sup>d</sup> score</td>
                <td>NYHA<sup>e</sup> score</td>
                <td>LVIDd<sup>f</sup> score</td>
                <td>LVIDs<sup>g</sup> score</td>
                <td>LA_Vol<sup>h</sup> score</td>
                <td>Average rank</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="9">
                  <bold>Anthropometric parameters</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>Age</italic>
                </td>
                <td>0.198</td>
                <td>0.194</td>
                <td>0.166</td>
                <td>0.142</td>
                <td>0.166</td>
                <td>0.158</td>
                <td>1.000</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>Gender</italic>
                </td>
                <td>0.051</td>
                <td>0.037</td>
                <td>0.043</td>
                <td>0.055</td>
                <td>0.058</td>
                <td>0.022</td>
                <td>12.500</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>Height</italic>
                </td>
                <td>0.057</td>
                <td>0.064</td>
                <td>0.045</td>
                <td>0.075</td>
                <td>0.051</td>
                <td>0.029</td>
                <td>9.167</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>BSA</italic>
                  <sup>i</sup>
                </td>
                <td>0.075</td>
                <td>0.073</td>
                <td>0.053</td>
                <td>0.095</td>
                <td>0.085</td>
                <td>0.045</td>
                <td>4.167</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Risk factors</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>Smoking</italic>
                </td>
                <td>0.063</td>
                <td>0.046</td>
                <td>0.052</td>
                <td>0.032</td>
                <td>0.069</td>
                <td>0.082</td>
                <td>7.500</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>Presence of hypercholesterolemia</italic>
                </td>
                <td>0.072</td>
                <td>0.042</td>
                <td>0.052</td>
                <td>0.039</td>
                <td>0.044</td>
                <td>0.056</td>
                <td>9.667</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>History of syncope</td>
                <td>0.026</td>
                <td>0.036</td>
                <td>0.029</td>
                <td>0.022</td>
                <td>0.029</td>
                <td>0.048</td>
                <td>20.000</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>Family history of HCM</italic>
                  <sup>j</sup>
                </td>
                <td>0.056</td>
                <td>0.060</td>
                <td>0.061</td>
                <td>0.047</td>
                <td>0.052</td>
                <td>0.066</td>
                <td>5.833</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Family history of SCD<sup>k</sup></td>
                <td>0.027</td>
                <td>0.051</td>
                <td>0.032</td>
                <td>0.031</td>
                <td>0.051</td>
                <td>0.049</td>
                <td>14.667</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Clinical, ECG<sup>l</sup>, and echo<sup>m</sup> parameters</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>NYHA</td>
                <td>0.011</td>
                <td>0.017</td>
                <td>0.069</td>
                <td>0.007</td>
                <td>0.027</td>
                <td>0.022</td>
                <td>33.000</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Presence of atrial fibrillation</td>
                <td>0.055</td>
                <td>0.036</td>
                <td>0.048</td>
                <td>0.018</td>
                <td>0.026</td>
                <td>0.068</td>
                <td>16.333</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>QRS duration</td>
                <td>0.035</td>
                <td>0.046</td>
                <td>0.029</td>
                <td>0.039</td>
                <td>0.026</td>
                <td>0.039</td>
                <td>17.167</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>Interventricular septum (</italic>
                  <italic>IVS)</italic>
                </td>
                <td>0.043</td>
                <td>0.052</td>
                <td>0.049</td>
                <td>0.041</td>
                <td>0.057</td>
                <td>0.052</td>
                <td>8.167</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LA_d</td>
                <td>0.078</td>
                <td>0.037</td>
                <td>0.036</td>
                <td>0.018</td>
                <td>0.031</td>
                <td>0.070</td>
                <td>15.000</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LA_Vol</td>
                <td>0.055</td>
                <td>0.029</td>
                <td>0.026</td>
                <td>0.012</td>
                <td>0.025</td>
                <td>0.059</td>
                <td>24.000</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LVIDs</td>
                <td>0.017</td>
                <td>0.022</td>
                <td>0.027</td>
                <td>0.029</td>
                <td>0.043</td>
                <td>0.031</td>
                <td>25.167</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LVIDd</td>
                <td>0.021</td>
                <td>0.017</td>
                <td>0.017</td>
                <td>0.036</td>
                <td>0.044</td>
                <td>0.026</td>
                <td>27.667</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LVEF</td>
                <td>0.018</td>
                <td>0.051</td>
                <td>0.019</td>
                <td>0.014</td>
                <td>0.050</td>
                <td>0.013</td>
                <td>27.833</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Genetics</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>Mutation MYBPC3</italic>
                </td>
                <td>0.045</td>
                <td>0.041</td>
                <td>0.039</td>
                <td>0.051</td>
                <td>0.052</td>
                <td>0.059</td>
                <td>9.667</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <italic>Mutation MYH7</italic>
                </td>
                <td>0.037</td>
                <td>0.044</td>
                <td>0.034</td>
                <td>0.040</td>
                <td>0.066</td>
                <td>0.023</td>
                <td>14.667</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Negative genetics</td>
                <td>0.036</td>
                <td>0.037</td>
                <td>0.027</td>
                <td>0.043</td>
                <td>0.030</td>
                <td>0.031</td>
                <td>18.667</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>The table shows RReliefF feature scores and the average ranks for each target variable.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>Names of the 10 highest-ranked variables are italicized.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>LA_d: left atrial diameter.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>LVEF: left ventricular ejection fraction.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>NYHA: New York Heart Association.</p>
            </fn>
            <fn id="table5fn6">
              <p><sup>f</sup>LVIDd: left ventricular internal diameter at end diastole.</p>
            </fn>
            <fn id="table5fn7">
              <p><sup>g</sup>LVIDs: left ventricular internal diameter at end systole.</p>
            </fn>
            <fn id="table5fn8">
              <p><sup>h</sup>LA_Vol: left atrial volume.</p>
            </fn>
            <fn id="table5fn9">
              <p><sup>i</sup>BSA: body surface area.</p>
            </fn>
            <fn id="table5fn10">
              <p><sup>j</sup>HCM: hypertrophic cardiomyopathy.</p>
            </fn>
            <fn id="table5fn11">
              <p><sup>k</sup>SCD: sudden cardiac death.</p>
            </fn>
            <fn id="table5fn12">
              <p><sup>l</sup>ECG: electrocardiogram.</p>
            </fn>
            <fn id="table5fn13">
              <p><sup>m</sup>Echo: echocardiogram.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Predictive Modeling With Supervised and Semisupervised Machine Learning</title>
        <p>To model the relationship between input patient data and target variables, we applied the following supervised learning algorithms:</p>
        <list list-type="bullet">
          <list-item>
            <p>RFs [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>] are an ensemble prediction model that construct multiple randomized decision trees. The implementations of an RF classifier in the R statistical package (library ranger) and the Python Scikit-Lean package [<xref ref-type="bibr" rid="ref41">41</xref>] were used. Each forest used between 500 and 1500 trees, and the Gini index was used as the attribute-splitting rule.</p>
          </list-item>
          <list-item>
            <p>Gradient boosting (XGBoost) [<xref ref-type="bibr" rid="ref42">42</xref>] is an ensemble of weak decision tree predictors, implemented in the open source software library XGBoost.</p>
          </list-item>
          <list-item>
            <p>LR is a traditional method of finding a linear dependence between attributes and the selected target variable.</p>
          </list-item>
          <list-item>
            <p>NNs mimic the architecture and working of brain neurons. We used 1 input and 1 output layer and 1 or several hidden layers. In the optimization process, we optimized several learning parameters, such as the learning rate, number of hidden layers, sizes of layers, regularization, sample weights, class weights, dropout, and batch normalization.</p>
          </list-item>
        </list>
        <p>The best hyperparameters of these algorithms were tuned using Bayesian optimization and random search implemented in <italic>keras-tuner</italic> [<xref ref-type="bibr" rid="ref43">43</xref>].</p>
      </sec>
      <sec>
        <title>Semisupervised Learning and Virtual Patients</title>
        <p>Semisupervised learning is increasingly used in medicine, especially for medical image segmentation [<xref ref-type="bibr" rid="ref44">44</xref>-<xref ref-type="bibr" rid="ref46">46</xref>]. This approach allows labeling a large amount of unlabeled data using only a small portion of labeled data. The majority (ie, 83.9% averaged over 6 target variables) of patients' data did not have records for the follow-up after 10 years. These unlabeled data were used as examples for semisupervised learning, producing a teacher model. The unlabeled examples were labeled with the supervised learning predictive model (see the Predictive Modeling With Supervised and Semisupervised Machine Learning section) and added to the training set. After that, a new model (also called a student model) was trained and kept if it achieved better performance on the test set than the teacher model.</p>
        <p>To further improve the results of semisupervised learning, we used artificially generated data (ie, virtual patients). Virtual data generation can sometimes replace experiments in biomedical experiments on animals [<xref ref-type="bibr" rid="ref47">47</xref>]. Specifically in cardiovascular modeling, patient-specific virtual patient modeling has recently made major progress in improving diagnoses [<xref ref-type="bibr" rid="ref48">48</xref>]. We evaluated the performance and appropriateness of several virtual patient data generators for this task, such as the generator based on the multivariate normal and log-normal distribution (MVND and log-MVND) [<xref ref-type="bibr" rid="ref49">49</xref>], and nonparametric methods using supervised tree ensembles, unsupervised tree ensembles, radial basis function–based NNs [<xref ref-type="bibr" rid="ref50">50</xref>], and Bayesian networks [<xref ref-type="bibr" rid="ref51">51</xref>]. As the final data generator, we chose the unsupervised tree ensembles, which exhibited the highest level of agreement between the real and the virtual distributions, computed with the Kolmogorov-Smirnoff goodness-of-fit statistical test [<xref ref-type="bibr" rid="ref52">52</xref>]. We generated 10,000 virtual patient examples, with 20 most important features, listed in Data Set section.</p>
      </sec>
      <sec>
        <title>Explanation of the Predictive Model</title>
        <p>Supervised ML models often exhibit a black-box nature, meaning that they can model data but not provide an explanation for the contained knowledge as well as the reasoning used in predictions. This means that the models lack transparency and interpretability. To address this, explanation methods provide justification for each prediction and assess features with the highest impact [<xref ref-type="bibr" rid="ref53">53</xref>]. This is important in risk-sensitive ML application areas, such as medicine, where the predictions of ML models need to be understood as they may represent a basis for further medical interventions.</p>
        <p>In our work, we applied the SHAP method [<xref ref-type="bibr" rid="ref14">14</xref>], which is a model-agnostic method, generating an explanation for different ML models in a unified form. The method uses theoretically sound concepts of Shapley values from cooperative game theory for computing contributions of each individual attribute value and of each attribute overall. The generated explanations visualize the most relevant attributes that contribute to higher or lower prediction values. The explanations can be computed either for a single patient’s predictions or summarized over all patients to discover more general relationships between attributes and the model’s predictions.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Models’ Comparison</title>
        <p>To evaluate and compare the performance of the 6 predictive models, we used stratified 10-fold cross-validation. For each of the 6 predictive problems, 4 different regression models were evaluated (LR, RF, gradient-boosted [GB] trees, and NN). The following parameters were varied in tests:</p>
        <list list-type="bullet">
          <list-item>
            <p>Application of semisupervised learning (denoted with S)</p>
          </list-item>
          <list-item>
            <p>Addition of virtual patients' data into the learning data set (denoted with VP)</p>
          </list-item>
          <list-item>
            <p>Use of all 112 features (denoted with All) or only a subset of the 21 best features (denoted with Subset)</p>
          </list-item>
          <list-item>
            <p>Interpolation of data points so that measurements were equidistant (denoted with I)</p>
          </list-item>
        </list>
        <p>In all, 28 different combinations of the parameters were used in experiments. Some combinations were omitted due to limitations (eg, VP generators cannot generate data for all 112 attributes, so VP was evaluated only with the subset of attributes) or excessive time complexity (eg, the use of virtual patients with NNs).</p>
        <sec>
          <title>Performance of Predictive Models</title>
          <p>To compare the accuracy of the obtained models, we computed the following 4 metrics: mean absolute error (MAE), root-mean-square error (RMSE), and 2 variations of the relative root-mean-square error (RRMSE<sub>mean</sub> and RRMSE<sub>const</sub>). The MAE measures the average absolute difference between predicted and true values over all examples in the test set. The RMSE addresses the issue that the squared values of the MSE are hard to interpret. The RRMSE measures the relative ratio between the obtained model and the baseline model. We computed 2 variations of the RRMSE with 2 different baseline models: mean predictor and constant predictor. With the RRMSE<sub>mean</sub>, we compared the performance of the obtained model to the model that returned the mean of the target variable over all patients (mean predictor), while with the RRMSE<sub>const</sub>, we compared the obtained model to the model that assumed that the value of the target variable would remain constant/unchanged over the 10-year period (constant predictor).</p>
          <p>We summarized (<xref ref-type="table" rid="table6">Table 6</xref>) the performance of the best-performing predictive models (RF, LR, GB, NN) and parameters (S, VP, All/Subset) for each target variable. We could see that the top-performing regression models were the RF and the GB tree for all target variables. We achieved the best results by applying semisupervised learning (S) for all target variables and using virtual patients (VP) for 5 of 6 target variables. For all targets, the best results were obtained by learning from a subset of the 21 most important features. The values of both RRMSE metrics revealed that the model performs better than the baseline models (their values are less than 1.0), with the model for the LA_d target achieving the lowest predictive error.</p>
          <p>To further evaluate the contribution of different data augmentation strategies, we compared the results on different patient sets: original (All features), subset of best features (Subset), virtual patients (VP), semisupervised learning (S), and the combination of the latter 2 (S + VP). The obtained results, shown for the best-performing RF model, are given in <xref rid="figure3" ref-type="fig">Figure 3</xref>, which compares the R<sup>2</sup> metrics for each individual target parameter. The additional detailed results for the other models are given in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The obtained results reveal the benefits of reducing the feature space, as well as applying the used data augmentation methods.</p>
          <p>In the following subsection, we apply the explanation methodology that helps interpret the computed predictions and their contributing feature values.</p>
          <table-wrap position="float" id="table6">
            <label>Table 6</label>
            <caption>
              <p>Comparison of the best-performing models for each target variable.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="170"/>
              <col width="170"/>
              <col width="170"/>
              <col width="170"/>
              <col width="160"/>
              <col width="160"/>
              <thead>
                <tr valign="bottom">
                  <td>Target</td>
                  <td>Model and parameter</td>
                  <td>MAE<sup>a</sup></td>
                  <td>RMSE<sup>b</sup></td>
                  <td>RRMSE<sup>c</sup><sub>mean</sub></td>
                  <td>RRMSE<sub>const</sub></td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>LA_d<sup>d</sup></td>
                  <td>RF<sup>e</sup>: S<sup>f</sup>+VP<sup>g</sup>+Subset</td>
                  <td>3.4</td>
                  <td>4.73</td>
                  <td>0.54</td>
                  <td>0.46</td>
                </tr>
                <tr valign="top">
                  <td>LA_Vol<sup>h</sup></td>
                  <td>RF: S+VP+Subset</td>
                  <td>18.4</td>
                  <td>26.73</td>
                  <td>0.56</td>
                  <td>0.47</td>
                </tr>
                <tr valign="top">
                  <td>LVEF<sup>i</sup></td>
                  <td>GB<sup>j</sup>: S+Subset</td>
                  <td>4.92</td>
                  <td>6.73</td>
                  <td>0.67</td>
                  <td>0.61</td>
                </tr>
                <tr valign="top">
                  <td>LVIDd<sup>k</sup></td>
                  <td>RF: S+VP+Subset</td>
                  <td>3.53</td>
                  <td>5.26</td>
                  <td>0.68</td>
                  <td>0.64</td>
                </tr>
                <tr valign="top">
                  <td>LVIDs<sup>l</sup></td>
                  <td>RF: S+VP+Subset</td>
                  <td>3.42</td>
                  <td>4.81</td>
                  <td>0.66</td>
                  <td>0.56</td>
                </tr>
                <tr valign="top">
                  <td>NYHA<sup>m</sup></td>
                  <td>RF: S+VP+Subset</td>
                  <td>0.39</td>
                  <td>0.5</td>
                  <td>0.67</td>
                  <td>0.66</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table6fn1">
                <p><sup>a</sup>MAE: mean absolute error.</p>
              </fn>
              <fn id="table6fn2">
                <p><sup>b</sup>RMSE: root-mean-square error.</p>
              </fn>
              <fn id="table6fn3">
                <p><sup>c</sup>RRMSE: relative root-mean-square error.</p>
              </fn>
              <fn id="table6fn4">
                <p><sup>d</sup>LA_d: left atrial diameter.</p>
              </fn>
              <fn id="table6fn5">
                <p><sup>e</sup>RF: random forest.</p>
              </fn>
              <fn id="table6fn6">
                <p><sup>f</sup>S: application of semisupervised learning.</p>
              </fn>
              <fn id="table6fn7">
                <p><sup>g</sup>VP: addition of virtual patients' data into the learning data set.</p>
              </fn>
              <fn id="table6fn8">
                <p><sup>h</sup>LA_Vol: left atrial volume.</p>
              </fn>
              <fn id="table6fn9">
                <p><sup>i</sup>LVEF: left ventricular ejection fraction.</p>
              </fn>
              <fn id="table6fn10">
                <p><sup>j</sup>GB: gradient boosted.</p>
              </fn>
              <fn id="table6fn11">
                <p><sup>k</sup>LVIDd: left ventricular internal diameter at end diastole.</p>
              </fn>
              <fn id="table6fn12">
                <p><sup>l</sup>LVIDs: left ventricular internal diameter at end systole.</p>
              </fn>
              <fn id="table6fn13">
                <p><sup>m</sup>NYHA: New York Heart Association.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Plotted results for the R<sup>2</sup> statistic for each target variable using different sets (input parameters). Note that VP, S, and S + VP are used on feature subsets. LA_d: left atrial diameter; LA_Vol: left atrial volume; LVEF: left ventricular ejection fraction; LVIDd: left ventricular internal diameter at end diastole; LVIDs: left ventricular internal diameter at end systole; NYHA: New York Heart Association; S: application of semisupervised learning; VP: addition of virtual patients' data into the learning data set.</p>
            </caption>
            <graphic xlink:href="medinform_v10i2e30483_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Explanation of Predictions</title>
          <p>To augment the output of prediction models, we applied the SHAP method [<xref ref-type="bibr" rid="ref14">14</xref>] for computing explanations of individual predictions. The explanation of a single prediction consists of relevant textual, graphical, and numerical data that allows understanding of the relationships between the features of the patient and the model’s prediction. It also consists of a list of the most relevant features that influence the prediction, along with their contribution values that define whether the feature value either supports the predicted value or opposes it. The direction of the impact (ie, sign of the contribution value) is denoted using different colors.</p>
          <p>An example of the explanation generated for the prediction for the target LA_d (<xref rid="figure4" ref-type="fig">Figure 4</xref>) is presented here. Features’ contributions are sorted in descending order, and the graph contains only the features for which the sum of their contributions reflects 95% of the difference between the initial parameter value and the predicted value after 10 years. The green and red bars thus denote positive and negative contributions of the impact for individual feature values, respectively, showing the factors contributing to the increase or decrease in the LA_d value. We can see that the LA_d, atrial fibrillation, age, mutation MYBPC3, and LVIDs features contributed to the increase in the predicted value for LA_d over time, while the LA_Vol and mutation MYH7 features contributed to the decrease in the predicted value for LA_d. Because the overall increasing impact was more prominent, the final predicted value (51.34) was higher than the baseline prediction, which is also the current patients' value of LA_d (46.00). Larger magnitudes of the features' contributions correspond to larger changes in the prediction value. For example, LA_d contributed the most (approximately 30%) to the increase in the predicted value.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Example of an explanation of the prediction for the target variable LA_d. LA_d: left atrial diameter; LA_Vol: left atrial volume; LVIDs: left ventricular internal diameter at end systole.</p>
            </caption>
            <graphic xlink:href="medinform_v10i2e30483_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>Validation With Medical Experts</title>
        <p>Besides evaluation of prediction models with statistical measures conducted in 2 previous sections, we engaged medical experts to provide further interpretation and validation of the results. First, we compared the accuracy of predictive models with the accuracy of human experts, which was obtained by using a survey (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). Second, we checked whether prediction explanations were sensible and consistent with the experts' medical knowledge about HCM.</p>
        <p>We prepared a questionnaire for medical experts and distributed it to several medical universities and cardiology clinics. The questionnaire included data about complete medical cases (measurements, events, and medication data) for 10 patients, and the experts were asked to study them and complete the following 2 tasks:</p>
        <list list-type="bullet">
          <list-item>
            <p>Predict the magnitude of the 10-year change in the 6 studied clinical parameters (LA_d, LA_Vol, LVEF, LVIDd, LVIDs, and NYHA) and mark it on a discrete scale from –3 to 3, where –3 and 3 represented the biggest-possible decrease and increase, respectively. Possible magnitudes of change were represented using discrete intervals, as the prediction of an exact value is a difficult task that does not take place in medical practice.</p>
          </list-item>
          <list-item>
            <p>Evaluate whether the statements generated from the explanation (eg, “The current value of parameter LA_d will cause a decrease in LA_d”) are true or false. For each patient, 6 such statements were generated, covering the features with the highest contribution. More specifically, the questionnaire included evaluation questions for 6 parameters that contribute to a change in LA_d, 4 for LA_Vol, 5 for LVEF, 6 for LVIDd, 7 for LVIDs, and 4 for NYHA.</p>
          </list-item>
        </list>
        <p>The questionnaire was fully completed by 13 experts with 16 (SD 8) years of experience. In the following subsections, we present the analysis of the answers.</p>
        <sec>
          <title>Validation of Prediction Accuracy</title>
          <p>To compare the prediction accuracy between the experts and the ML model, we first discretized the model's predictions into discrete intervals so that they could be compared to the discrete intervals, predicted by the experts. We performed the discretization using bins of width 0<italic>.</italic>25<italic>σ</italic>, where <italic>σ</italic> is the SD of the variable. Further, we calculated the following prediction errors:</p>
          <list list-type="bullet">
            <list-item>
              <p>Mean prediction error of the discretized model prediction (denoted with MD)</p>
            </list-item>
            <list-item>
              <p>Mean prediction error made by individual medical experts (denoted with E)</p>
            </list-item>
            <list-item>
              <p>Mean prediction error of the consortium prediction (ie, the average prediction of all doctors, denoted with C</p>
            </list-item>
          </list>
          <p>We could see that the mean prediction error of the discretized model MD (<xref ref-type="table" rid="table7">Table 7</xref>) was the lowest for all target variables except for LA_d. The mean errors of consortium predictions C were lower than the predictions of individual experts for all parameters, which indicates that the mutual consolidation of different doctors' opinions reduced the error of their joint predictions. The consortium prediction error also turned out to be the lowest for the parameter LA_d and thus better than the error of the ML model.</p>
          <table-wrap position="float" id="table7">
            <label>Table 7</label>
            <caption>
              <p>Mean absolute error (MAE) of the discretized model predictions (MD), individual experts (E), and the entire consortium (C).</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="250"/>
              <col width="250"/>
              <col width="250"/>
              <col width="250"/>
              <thead>
                <tr valign="top">
                  <td>Target/prediction</td>
                  <td>Model (MD), MAE (SD)</td>
                  <td>Expert (E), MAE (SD)</td>
                  <td>Consortium (C), MAE (SD)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>NYHA<sup>a</sup></td>
                  <td>
                    <italic>0.30</italic>
                    <italic>(0.48)</italic>
                    <sup>b</sup>
                  </td>
                  <td>0.84 (0.69)</td>
                  <td>0.56 (0.34)</td>
                </tr>
                <tr valign="top">
                  <td>LA_d <sup>c</sup></td>
                  <td>1.70 (0.82)</td>
                  <td>1.69 (0.97)</td>
                  <td><italic>1.66</italic> (<italic>0.70</italic>)<sup>b</sup></td>
                </tr>
                <tr valign="top">
                  <td>LA_Vol<sup>d</sup></td>
                  <td>
                    <italic>1.00</italic>
                    <italic>(0.82)</italic>
                    <sup>b</sup>
                  </td>
                  <td>1.25 (0.98)</td>
                  <td>1.13 (0.63)</td>
                </tr>
                <tr valign="top">
                  <td>LVIDd<sup>e</sup></td>
                  <td>
                    <italic>0.80</italic>
                    <italic>(0.63)</italic>
                    <sup>b</sup>
                  </td>
                  <td>1.09 (0.91)</td>
                  <td>1.00 (0.77)</td>
                </tr>
                <tr valign="top">
                  <td>LVIDs<sup>f</sup></td>
                  <td>
                    <italic>0.50</italic>
                    <italic>(0.71)</italic>
                    <sup>b</sup>
                  </td>
                  <td>1.02 (0.86)</td>
                  <td>0.88 (0.68)</td>
                </tr>
                <tr valign="top">
                  <td>LVEF<sup>g</sup></td>
                  <td>
                    <italic>0.90</italic>
                    <italic>(0.88)</italic>
                    <sup>b</sup>
                  </td>
                  <td>1.32 (0.90)</td>
                  <td>1.28 (0.79)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table7fn1">
                <p><sup>a</sup>NYHA: New York Heart Association.</p>
              </fn>
              <fn id="table7fn2">
                <p><sup>b</sup>The lowest achieved errors are italicized.</p>
              </fn>
              <fn id="table7fn3">
                <p><sup>c</sup>LA_d: left atrial diameter.</p>
              </fn>
              <fn id="table7fn4">
                <p><sup>d</sup>LA_Vol: left atrial volume.</p>
              </fn>
              <fn id="table7fn5">
                <p><sup>e</sup>LVIDd: left ventricular internal diameter at end diastole.</p>
              </fn>
              <fn id="table7fn6">
                <p><sup>f</sup>LVIDs: left ventricular internal diameter at end systole.</p>
              </fn>
              <fn id="table7fn7">
                <p><sup>g</sup>LVEF: left ventricular ejection fraction.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Validation of the Model Explanation</title>
          <p>To validate the generated model explanations, we analyzed the agreement of experts with statements generated about the features' influence in 2 steps. First, we calculated the agreement ratio for individual features that were included in the questionnaire, grouped by each of the 6 target variables. Second, we calculated the overall agreement of experts with the explanation for each of the 6 target parameters, based on the agreement data about all features that contributed to their prediction.</p>
          <p>The results (<xref ref-type="table" rid="table8">Table 8</xref>) of the analysis provided the ratio of agreement between different parameters for each target variable, as well as their overall agreement. The highest agreement ratio was achieved for target attributes NYHA (1.00), LA_Vol (0.75), and LVIDd (0.67). The last column (Average agreement) summarizes the results across all used features. The results, in decreasing order, of the last column show that the majority of the experts agreed, especially with the explanations for the targets NYHA (average agreement of 0.73) and LVIDd (average agreement of 0.52). By comparing <xref ref-type="table" rid="table7">Tables 7</xref> and <xref ref-type="table" rid="table8">8</xref>, we consistently see that the experts least agreed with explanations for the target LA_d, for which the predictive model achieved a larger error than individual experts or the entire consortium. In cases where the predictive model achieved better predictive accuracy than the experts (<xref ref-type="table" rid="table7">Table 7</xref>) and the agreement of the experts with the explanation was lower (<xref ref-type="table" rid="table8">Table 8</xref>), for example, for LVEF, LA_Vol, and LVIDs, there are 3 possible explanations:</p>
          <list list-type="bullet">
            <list-item>
              <p>The generated explanation might, indeed, provide incorrect information.</p>
            </list-item>
            <list-item>
              <p>The generated explanation might explain novel relationships between features and target parameters that have not been observed or documented so far.</p>
            </list-item>
            <list-item>
              <p>It was hard for the experts to evaluate the claims in the questionnaire about the influence of particular features, as these tasks deviate from the established medical practice and require the experts to rely on their subjective experience.</p>
            </list-item>
          </list>
          <p>For establishing the reasons for imperfect agreement between the explanation and the experts, further investigation is therefore required. We can conclude that the results provide some evidence that the generated prediction explanation might provide a complementary view at the prediction of HCM-related parameters. Such explanations might represent a tool that the experts could consult while making their decisions.</p>
          <table-wrap position="float" id="table8">
            <label>Table 8</label>
            <caption>
              <p>Agreement ratios between experts and prediction explanations for parameters that contribute to predicting each target variable. The last two columns provide summary statistics.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="330"/>
              <col width="170"/>
              <col width="300"/>
              <col width="170"/>
              <thead>
                <tr valign="top">
                  <td colspan="2">Target variable and parameters</td>
                  <td>Expert agreement</td>
                  <td colspan="2">Summary</td>
                </tr>
                <tr valign="bottom">
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Ratio of agreed features from at least 50% of experts, n</td>
                  <td>Average agreement, n</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="5">
                    <bold>NYHA<sup>a</sup></bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>LA_d</italic>
                    <sup>b</sup>
                  </td>
                  <td>
                    <italic>0.77</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>Age</italic>
                  </td>
                  <td>
                    <italic>0.77</italic>
                    <sup>c</sup>
                  </td>
                  <td>1.00 (4/4)</td>
                  <td>0.73</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>LA_Vol</italic>
                    <sup>d</sup>
                  </td>
                  <td>
                    <italic>0.62</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>Atrial fibrillation</italic>
                  </td>
                  <td>
                    <italic>0.77</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>LVIDd<sup>e</sup></bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>BSA<sup>f</sup></td>
                  <td>0.15</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>Gender</italic>
                  </td>
                  <td>
                    <italic>0.85</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>LVIDd</italic>
                  </td>
                  <td>
                    <italic>0.65</italic>
                    <sup>c</sup>
                  </td>
                  <td>0.67 (4/6)</td>
                  <td>0.52</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>QRS duration</italic>
                  </td>
                  <td>
                    <italic>0.69</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LVEF<sup>g</sup></td>
                  <td>0.23</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>Mutation MYH7</italic>
                  </td>
                  <td>
                    <italic>0.54</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>LVEF</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>QRS duration</td>
                  <td>0.38</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>Presence of hypercholesterolemia</italic>
                  </td>
                  <td>
                    <italic>0.54</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Syncope</td>
                  <td>0.46</td>
                  <td>0.40 (2/5)</td>
                  <td>0.49</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>Gene_Testing_Performed</italic>
                  </td>
                  <td>
                    <italic>0.69</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>NYHA</td>
                  <td>0.38</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>LA_Vol</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>LA_Vol</italic>
                  </td>
                  <td>
                    <italic>0.69</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>BSA</italic>
                  </td>
                  <td>
                    <italic>0.54</italic>
                    <sup>c</sup>
                  </td>
                  <td>0.75 (3/4)</td>
                  <td>0.48</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Age</td>
                  <td>0.15</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>Atrial fibrillation</italic>
                  </td>
                  <td>
                    <italic>0.54</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>LVIDs</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LA_d</td>
                  <td>0.38</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LVIDd</td>
                  <td>0.38</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>LA_Vol</italic>
                  </td>
                  <td>
                    <italic>0.62</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>BSA</italic>
                  </td>
                  <td>
                    <italic>0.85</italic>
                    <sup>c</sup>
                  </td>
                  <td>0.43 (3/7)</td>
                  <td>0.47</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>Mutation MYBPC3</italic>
                  </td>
                  <td>
                    <italic>0.62</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Interventricular septum (IVS)</td>
                  <td>0.38</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Family history of HCM<sup>h</sup></td>
                  <td>0.08</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>LA</bold>
                    <bold>_d</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <italic>LA_d</italic>
                  </td>
                  <td>
                    <italic>0.85</italic>
                    <sup>c</sup>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Atrial fibrillation</td>
                  <td>0.15</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>BSA</td>
                  <td>0.08</td>
                  <td>0.17 (1/6)</td>
                  <td>0.36</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>IVS</td>
                  <td>0.38</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Age</td>
                  <td>0.31</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LVEF</td>
                  <td>0.38</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table8fn1">
                <p><sup>a</sup>NYHA: New York Heart Association.</p>
              </fn>
              <fn id="table8fn2">
                <p><sup>b</sup>LA_d: left atrial diameter.</p>
              </fn>
              <fn id="table8fn3">
                <p><sup>c</sup>Names of parameters with agreement higher than 50% are italicized.</p>
              </fn>
              <fn id="table8fn4">
                <p><sup>d</sup>LA_Vol: left atrial volume.</p>
              </fn>
              <fn id="table8fn5">
                <p><sup>e</sup>LVIDd: left ventricular internal diameter at end diastole.</p>
              </fn>
              <fn id="table8fn6">
                <p><sup>f</sup>BSA: body surface area.</p>
              </fn>
              <fn id="table8fn7">
                <p><sup>g</sup>LVEF: left ventricular ejection fraction.</p>
              </fn>
              <fn id="table8fn8">
                <p><sup>i</sup>HCM: hypertrophic cardiomyopathy.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Results</title>
        <p>We presented a disease progression system for patients diagnosed with HCM that is based on predicting 6 target parameters (LA_d, LA_Vol, LVIDd, LVIDs, LVEF, and NYHA) for 10 years ahead using supervised ML models. The experiments revealed good ML performance for all targets, with the achieved predictive error lower than the error of the default predictors. The experiments also revealed that semisupervised learning and the artificial data from virtual patients helped achieve even higher predictive accuracy for all 6 targets. Finally, we validated our approach with human experts using a structured questionnaire and determined the models' favorable performance compared to performance of experts for 5 of 6 targets.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The design of the study carried several limitations, stemming from the fact that this work was based on real-world data that are expensive to obtain and are subject to noise. The first limitation of this study is that it was based only on a single medical center data set. To further validate this study, it would be beneficial to independently evaluate the models with data sets from other centers or extend the existing data set with more data. Additionally, the benefit for including more data could also be in diminishing a potential bias of our data set, which could potentially include a population distribution that is different from other medical centers and thus different ranges of recorded parameters, which we did, in fact, observe in some cases. Additionally, in the perfect but rather unrealistic scenario due to its cost, both data modalities (echo and CMR) would be available for all patients, which would allow us to use the CMR data as an additional data source for all patients. Due to the unavailability of such data at the time of the study or data that were structured differently, we leave this for our further work.</p>
        <p>Further, to prepare the data to be used for ML and obtain stable predictions, we used several preprocessing and data augmentation steps. Since we are dealing with real medical data, this opens questions of how different data transformations influence our predictions. Hence, a sensitivity study of the results would be required, as well as determining how the patient’s record time frame and predicted risk time frame influence the achieved accuracies. An additional limitation of the performed validation was that the ML results were compared to the inputs of medical experts in the structured survey instead of their free diagnoses and evaluations. Although this was required to unify the structure of human answers to enable statistical comparisons, the form of survey might introduce its own bias.</p>
        <p>The described limitations, along with our further research questions and ideas, open several ideas for future study directions. First, we will evaluate the proposed system on an independent cardiological data set (eg, the Sarcomeric Human Cardiomyopathy Registry [SHaRe]) [<xref ref-type="bibr" rid="ref54">54</xref>]. Second, as our current approach provides future predictions for 6 independent parameters, the outputs will be further combined into a single risk prediction of high/low risk, which can further improve HCM health management initiative [<xref ref-type="bibr" rid="ref32">32</xref>]. To achieve this, a combination of models' output analysis and domain experts' input would be required. Finally, further ways for improvement of predictive accuracy will be tested (additional predictive models and feature selection techniques, including deep learning), as well as determining the reasons for the experts' disagreement with some of the explanation components.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>Although ML can have limitations in medicine [<xref ref-type="bibr" rid="ref2">2</xref>], in this work, we showed the importance of using computer models in cardiology by predicting disease progression of HCM patients 10 years ahead, which could be used to prevent SCD. Additionally, the results confirmed findings in Chen et al [<xref ref-type="bibr" rid="ref44">44</xref>], Gu et al [<xref ref-type="bibr" rid="ref45">45</xref>], and Bai et al [<xref ref-type="bibr" rid="ref46">46</xref>] that additional artificial data and semisupervised learning can provide additional low-cost and low-risk data using already available medical knowledge, increasing the predictive performance. Simple explanations of predictions contribute to the trust of provided predictions and ease the decision of experts. We hope that our work will further contribute to the goal of developing constructive strategies to prevent SCD in patients with HCM, as motivated by Maron et al [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Bar graphs of parameter influence for each model used.</p>
        <media xlink:href="medinform_v10i2e30483_app1.png" xlink:title="PNG File , 257 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>A sample of the questionnaire for the first patient.</p>
        <media xlink:href="medinform_v10i2e30483_app2.pdf" xlink:title="PDF File  (Adobe PDF File), 597 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BSA</term>
          <def>
            <p>body surface area</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CMR</term>
          <def>
            <p>cardiac magnetic resonance</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">COPD</term>
          <def>
            <p>chronic obstructive pulmonary disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ECG</term>
          <def>
            <p>electrocardiogram</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">Echo</term>
          <def>
            <p>echocardiogram</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">GB</term>
          <def>
            <p>gradient boosted</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">HCM</term>
          <def>
            <p>hypertrophic cardiomyopathy</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">KNN</term>
          <def>
            <p>k-nearest neighbors</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">LA_d</term>
          <def>
            <p>left atrial diameter</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">LA_Vol</term>
          <def>
            <p>left atrial volume</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">LR</term>
          <def>
            <p>linear regression</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">LVEF</term>
          <def>
            <p>left ventricular ejection fraction LVIDd: left ventricular internal diameter at end diastole</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">LVIDs</term>
          <def>
            <p>left ventricular internal diameter at end systole</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">MAE</term>
          <def>
            <p>mean absolute error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">MVND</term>
          <def>
            <p>multivariate normal distribution</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">NN</term>
          <def>
            <p>neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">NYHA</term>
          <def>
            <p>New York Heart Association</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb20">RF</term>
          <def>
            <p>random forest</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb21">RMSE</term>
          <def>
            <p>root-mean-square error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb22">RRMSE</term>
          <def>
            <p>relative root-mean-square error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb23">SCD</term>
          <def>
            <p>sudden cardiac death</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb24">SHAP</term>
          <def>
            <p>Shapley additive explanation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb25">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This project received funding from the European Union’s Horizon 2020 research and innovation program (grant agreement no. 777204; www.silicofcm.eu). This paper reflects only the authors’ views. The European Commission is not responsible for any use that may be made of the information it contains.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cuocolo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Perillo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>De Rosa</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ugga</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Petretta</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Current applications of big data and machine learning in cardiology</article-title>
          <source>J Geriatr Cardiol</source>
          <year>2019</year>
          <month>08</month>
          <volume>16</volume>
          <issue>8</issue>
          <fpage>601</fpage>
          <lpage>607</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31555327"/>
          </comment>
          <pub-id pub-id-type="doi">10.11909/j.issn.1671-5411.2019.08.002</pub-id>
          <pub-id pub-id-type="medline">31555327</pub-id>
          <pub-id pub-id-type="pii">jgc-16-08-601</pub-id>
          <pub-id pub-id-type="pmcid">PMC6748901</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shameer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Dudley</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sengupta</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Machine learning in cardiovascular medicine: are we there yet?</article-title>
          <source>Heart</source>
          <year>2018</year>
          <month>07</month>
          <volume>104</volume>
          <issue>14</issue>
          <fpage>1156</fpage>
          <lpage>1164</lpage>
          <pub-id pub-id-type="doi">10.1136/heartjnl-2017-311198</pub-id>
          <pub-id pub-id-type="medline">29352006</pub-id>
          <pub-id pub-id-type="pii">heartjnl-2017-311198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>JR</given-names>
            </name>
            <collab>Coalition Against Major Diseases</collab>
          </person-group>
          <article-title>Machine learning for comprehensive forecasting of Alzheimer's disease progression</article-title>
          <source>Sci Rep</source>
          <year>2019</year>
          <month>09</month>
          <day>20</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>13622</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-019-49656-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-019-49656-2</pub-id>
          <pub-id pub-id-type="medline">31541187</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-019-49656-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC6754403</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Nho</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Predicting Alzheimer's disease progression using multi-modal deep learning approach</article-title>
          <source>Sci Rep</source>
          <year>2019</year>
          <month>02</month>
          <day>13</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>1952</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-018-37769-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-018-37769-z</pub-id>
          <pub-id pub-id-type="medline">30760848</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-018-37769-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC6374429</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nilashi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ibrahim</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmadi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Shahmoradi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Farahmand</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A hybrid intelligent system for the prediction of Parkinson's disease progression using machine learning techniques</article-title>
          <source>Biocybern Biomed Eng</source>
          <year>2018</year>
          <volume>38</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1016/j.bbe.2017.09.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pinto</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Oliveira</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Batista</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Pinto</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Correia</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Martins</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Teixeira</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Prediction of disease progression and outcomes in multiple sclerosis with machine learning</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <month>12</month>
          <day>03</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>21038</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-020-78212-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-020-78212-6</pub-id>
          <pub-id pub-id-type="medline">33273676</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-78212-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7713436</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Comparison and development of machine learning tools in the prediction of chronic kidney disease progression</article-title>
          <source>J Transl Med</source>
          <year>2019</year>
          <month>04</month>
          <day>11</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>119</fpage>
          <lpage>13</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://translational-medicine.biomedcentral.com/articles/10.1186/s12967-019-1860-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12967-019-1860-0</pub-id>
          <pub-id pub-id-type="medline">30971285</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12967-019-1860-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6458616</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Konerman</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Beste</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Van</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Saini</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Nallamothu</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Ioannou</surname>
              <given-names>GN</given-names>
            </name>
            <name name-style="western">
              <surname>Waljee</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>Machine learning models to predict disease progression among veterans with hepatitis C virus</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <month>1</month>
          <day>4</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>e0208141</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0208141"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0208141</pub-id>
          <pub-id pub-id-type="medline">30608929</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-18442</pub-id>
          <pub-id pub-id-type="pmcid">PMC6319806</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lyon</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mincholé</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bueno-Orovio</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Improving the clinical understanding of hypertrophic cardiomyopathy by combining patient data, machine learning and computer simulations: a case study</article-title>
          <source>Morphologie</source>
          <year>2019</year>
          <month>12</month>
          <volume>103</volume>
          <issue>343</issue>
          <fpage>169</fpage>
          <lpage>179</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1286-0115(19)30052-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.morpho.2019.09.001</pub-id>
          <pub-id pub-id-type="medline">31570308</pub-id>
          <pub-id pub-id-type="pii">S1286-0115(19)30052-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC6913520</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maron</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gardin</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Flack</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Gidding</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Kurosaki</surname>
              <given-names>TT</given-names>
            </name>
            <name name-style="western">
              <surname>Bild</surname>
              <given-names>DE</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of hypertrophic cardiomyopathy in a general population of young adults. Echocardiographic analysis of 4111 subjects in the CARDIA Study. Coronary artery risk development in (young) adults</article-title>
          <source>Circulation</source>
          <year>1995</year>
          <month>08</month>
          <day>15</day>
          <volume>92</volume>
          <issue>4</issue>
          <fpage>785</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1161/01.cir.92.4.785</pub-id>
          <pub-id pub-id-type="medline">7641357</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Olivotto</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cecchi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Poggesi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yacoub</surname>
              <given-names>MH</given-names>
            </name>
          </person-group>
          <article-title>Patterns of disease progression in hypertrophic cardiomyopathy: an individualized approach to clinical staging</article-title>
          <source>Circ Heart Fail</source>
          <year>2012</year>
          <month>07</month>
          <day>01</day>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>535</fpage>
          <lpage>46</lpage>
          <pub-id pub-id-type="doi">10.1161/CIRCHEARTFAILURE.112.967026</pub-id>
          <pub-id pub-id-type="medline">22811549</pub-id>
          <pub-id pub-id-type="pii">5/4/535</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Mahony</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jichi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Pavlou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Monserrat</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Anastasakis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rapezzi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Biagini</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gimeno</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Limongelli</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>McKenna</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Omar</surname>
              <given-names>RZ</given-names>
            </name>
            <name name-style="western">
              <surname>Elliott</surname>
              <given-names>PM</given-names>
            </name>
            <collab>Hypertrophic Cardiomyopathy Outcomes Investigators</collab>
          </person-group>
          <article-title>A novel clinical risk prediction model for sudden cardiac death in hypertrophic cardiomyopathy (HCM risk-SCD)</article-title>
          <source>Eur Heart J</source>
          <year>2014</year>
          <month>08</month>
          <day>07</day>
          <volume>35</volume>
          <issue>30</issue>
          <fpage>2010</fpage>
          <lpage>20</lpage>
          <pub-id pub-id-type="doi">10.1093/eurheartj/eht439</pub-id>
          <pub-id pub-id-type="medline">24126876</pub-id>
          <pub-id pub-id-type="pii">eht439</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andy</surname>
              <given-names>AU</given-names>
            </name>
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Adusumalli</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Groeneveld</surname>
              <given-names>PW</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Predicting cardiovascular risk using social media data: performance evaluation of machine-learning models</article-title>
          <source>JMIR Cardio</source>
          <year>2021</year>
          <month>02</month>
          <day>19</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>e24473</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cardio.jmir.org/2021/1/e24473/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24473</pub-id>
          <pub-id pub-id-type="medline">33605888</pub-id>
          <pub-id pub-id-type="pii">v5i1e24473</pub-id>
          <pub-id pub-id-type="pmcid">PMC8411430</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to interpreting model predictions</article-title>
          <year>2017</year>
          <month>12</month>
          <conf-name>Proceedings of the 31st International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>Dec 4, 2017</conf-date>
          <conf-loc>Long Beach, CA, USA</conf-loc>
          <fpage>4768</fpage>
          <lpage>4777</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Magoulas</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Prentza</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Machine learning in medical applications</article-title>
          <source>Lecture Notes in Computer Science</source>
          <year>2001</year>
          <month>9</month>
          <day>20</day>
          <publisher-loc>Berlin, Heidelberg</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>300</fpage>
          <lpage>307</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Sontag</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Unsupervised learning of disease progression models</article-title>
          <year>2014</year>
          <conf-name>Proceedings of the 20th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>Aug 2014</conf-date>
          <conf-loc>New York, NY, USA</conf-loc>
          <fpage>85</fpage>
          <lpage>94</lpage>
          <pub-id pub-id-type="doi">10.1145/2623330.2623754</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Juarez-Orozco</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez-Manzanera</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Storti</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Knuuti</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Machine learning in the evaluation of myocardial ischemia through nuclear cardiology</article-title>
          <source>Curr Cardiovasc Imaging Rep</source>
          <year>2019</year>
          <month>2</month>
          <day>9</day>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>1</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1007/s12410-019-9480-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sardar</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Abbott</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Kundu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Aronow</surname>
              <given-names>HD</given-names>
            </name>
            <name name-style="western">
              <surname>Granada</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Giri</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Impact of artificial intelligence on interventional cardiology: from decision-making aid to advanced interventional procedure assistance</article-title>
          <source>JACC Cardiovasc Interv</source>
          <year>2019</year>
          <month>07</month>
          <day>22</day>
          <volume>12</volume>
          <issue>14</issue>
          <fpage>1293</fpage>
          <lpage>1303</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1936-8798(19)31095-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jcin.2019.04.048</pub-id>
          <pub-id pub-id-type="medline">31320024</pub-id>
          <pub-id pub-id-type="pii">S1936-8798(19)31095-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elul</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenberg</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Schuster</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bronstein</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Yaniv</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Meeting the unmet needs of clinicians from AI systems showcased for cardiology with deep-learning-based ECG analysis</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2021</year>
          <month>06</month>
          <day>15</day>
          <volume>118</volume>
          <issue>24</issue>
          <fpage>e2020620118</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&#38;pmid=34099565"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.2020620118</pub-id>
          <pub-id pub-id-type="medline">34099565</pub-id>
          <pub-id pub-id-type="pii">2020620118</pub-id>
          <pub-id pub-id-type="pmcid">PMC8214673</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Kawczynski</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Trivedi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Harnish</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jenkins</surname>
              <given-names>NW</given-names>
            </name>
            <name name-style="western">
              <surname>Lituiev</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Copeland</surname>
              <given-names>TP</given-names>
            </name>
            <name name-style="western">
              <surname>Aboian</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Mari Aparici</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Behr</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Flavell</surname>
              <given-names>RR</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zalocusky</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Nardo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Seo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hawkins</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez Pampaloni</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hadley</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Franc</surname>
              <given-names>BL</given-names>
            </name>
          </person-group>
          <article-title>A deep learning model to predict a diagnosis of Alzheimer disease by using F-FDG PET of the brain</article-title>
          <source>Radiology</source>
          <year>2019</year>
          <month>02</month>
          <volume>290</volume>
          <issue>2</issue>
          <fpage>456</fpage>
          <lpage>464</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30398430"/>
          </comment>
          <pub-id pub-id-type="doi">10.1148/radiol.2018180958</pub-id>
          <pub-id pub-id-type="medline">30398430</pub-id>
          <pub-id pub-id-type="pmcid">PMC6358051</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Seah</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kitchen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gaillard</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Dixon</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Chest radiographs in congestive heart failure: visualizing neural network learning</article-title>
          <source>Radiology</source>
          <year>2019</year>
          <month>02</month>
          <volume>290</volume>
          <issue>2</issue>
          <fpage>514</fpage>
          <lpage>522</lpage>
          <pub-id pub-id-type="doi">10.1148/radiol.2018180887</pub-id>
          <pub-id pub-id-type="medline">30398431</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ohta</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yunaga</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kitao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fukuda</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ogawa</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Detection and classification of myocardial delayed enhancement patterns on MR images with deep neural networks: a feasibility study</article-title>
          <source>Radiol Artif Intell</source>
          <year>2019</year>
          <month>05</month>
          <volume>1</volume>
          <issue>3</issue>
          <fpage>e180061</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33937791"/>
          </comment>
          <pub-id pub-id-type="doi">10.1148/ryai.2019180061</pub-id>
          <pub-id pub-id-type="medline">33937791</pub-id>
          <pub-id pub-id-type="pmcid">PMC8017383</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Attia</surname>
              <given-names>ZI</given-names>
            </name>
            <name name-style="western">
              <surname>Kapa</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lopez-Jimenez</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>McKie</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Ladewig</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Satam</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Pellikka</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Enriquez-Sarano</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Noseworthy</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Munger</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Asirvatham</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Carter</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>Screening for cardiac contractile dysfunction using an artificial intelligence-enabled electrocardiogram</article-title>
          <source>Nat Med</source>
          <year>2019</year>
          <month>01</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>70</fpage>
          <lpage>74</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-018-0240-2</pub-id>
          <pub-id pub-id-type="medline">30617318</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-018-0240-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>An algorithm based on deep learning for predicting in‐hospital cardiac arrest</article-title>
          <source>JAHA</source>
          <year>2018</year>
          <month>07</month>
          <day>03</day>
          <volume>7</volume>
          <issue>13</issue>
          <fpage>e008678</fpage>
          <pub-id pub-id-type="doi">10.1161/jaha.118.008678</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adler</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Voors</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Macheret</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Braun</surname>
              <given-names>OO</given-names>
            </name>
            <name name-style="western">
              <surname>Urey</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Sama</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Tadel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Campagnari</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Greenberg</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Yagil</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Improving risk prediction in heart failure using machine learning</article-title>
          <source>Eur J Heart Fail</source>
          <year>2020</year>
          <month>01</month>
          <day>12</day>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>139</fpage>
          <lpage>147</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/ejhf.1628"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/ejhf.1628</pub-id>
          <pub-id pub-id-type="medline">31721391</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Daghistani</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Elshawi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sakr</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Thwayee</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Mallah</surname>
              <given-names>MH</given-names>
            </name>
          </person-group>
          <article-title>Predictors of in-hospital length of stay among cardiac patients: a machine learning approach</article-title>
          <source>Int J Cardiol</source>
          <year>2019</year>
          <month>08</month>
          <day>01</day>
          <volume>288</volume>
          <fpage>140</fpage>
          <lpage>147</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijcard.2019.01.046</pub-id>
          <pub-id pub-id-type="medline">30685103</pub-id>
          <pub-id pub-id-type="pii">S0167-5273(18)34602-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gjoreski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gradišek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gams</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Simjanoska</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Peterlin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Poglajen</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Chronic heart failure detection from heart sounds using a stack of machine-learning classifiers</article-title>
          <year>2017</year>
          <month>8</month>
          <day>21</day>
          <conf-name>13th International Conference on Intelligent Environments</conf-name>
          <conf-date>2017</conf-date>
          <conf-loc>Seoul, South Korea</conf-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>14</fpage>
          <pub-id pub-id-type="doi">10.1109/ie.2017.19</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oguz</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sen</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>O'Donnell</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gibbons</surname>
              <given-names>GH</given-names>
            </name>
          </person-group>
          <article-title>Genotype-driven identification of a molecular network predictive of advanced coronary calcium in ClinSeq® and Framingham Heart Study cohorts</article-title>
          <source>BMC Syst Biol</source>
          <year>2017</year>
          <month>10</month>
          <day>26</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>99</fpage>
          <lpage>14</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcsystbiol.biomedcentral.com/articles/10.1186/s12918-017-0474-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12918-017-0474-5</pub-id>
          <pub-id pub-id-type="medline">29073909</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12918-017-0474-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC5659034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rowin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Maron</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The role of cardiac MRI in the diagnosis and risk stratification of hypertrophic cardiomyopathy</article-title>
          <source>Arrhythmia Electrophysiol Rev Internet Radcliffe Cardiology Dec</source>
          <year>2016</year>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.15420/aer.2016:13:3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hoey</surname>
              <given-names>ETD</given-names>
            </name>
            <name name-style="western">
              <surname>Teoh</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ganeshan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Simpson</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Watkin</surname>
              <given-names>RW</given-names>
            </name>
          </person-group>
          <article-title>The emerging role of cardiovascular MRI for risk stratification in hypertrophic cardiomyopathy</article-title>
          <source>Clin Radiol</source>
          <year>2014</year>
          <month>03</month>
          <volume>69</volume>
          <issue>3</issue>
          <fpage>221</fpage>
          <lpage>30</lpage>
          <pub-id pub-id-type="doi">10.1016/j.crad.2013.11.012</pub-id>
          <pub-id pub-id-type="medline">24412355</pub-id>
          <pub-id pub-id-type="pii">S0009-9260(13)00543-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hiemstra</surname>
              <given-names>YL</given-names>
            </name>
            <name name-style="western">
              <surname>Debonnaire</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bootsma</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schalij</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bax</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Delgado</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Marsan</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and prognostic implications of right ventricular dysfunction in patients with hypertrophic cardiomyopathy</article-title>
          <source>Am J Cardiol</source>
          <year>2019</year>
          <month>08</month>
          <day>15</day>
          <volume>124</volume>
          <issue>4</issue>
          <fpage>604</fpage>
          <lpage>612</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amjcard.2019.05.021</pub-id>
          <pub-id pub-id-type="medline">31204037</pub-id>
          <pub-id pub-id-type="pii">S0002-9149(19)30588-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Just</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <source>Understanding Risk Stratification, Comorbidities, and the Future of Healthcare</source>
          <year>2014</year>
          <access-date>2015-06-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.slideshare.net/healthcatalyst1/understanding-risk-stratification-comorbidities-and-the-future-of-healthcare">https://www.slideshare.net/healthcatalyst1/understanding-risk-stratification-comorbidities-and-the-future-of-healthcare</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hess</surname>
              <given-names>OM</given-names>
            </name>
          </person-group>
          <article-title>Risk stratification in hypertrophic cardiomyopathy</article-title>
          <source>J Am Coll Cardiol</source>
          <year>2003</year>
          <month>09</month>
          <volume>42</volume>
          <issue>5</issue>
          <fpage>880</fpage>
          <lpage>881</lpage>
          <pub-id pub-id-type="doi">10.1016/s0735-1097(03)00838-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Steriotis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Risk stratification in hypertrophic cardiomyopathy</article-title>
          <source>Eur Cardiol</source>
          <year>2015</year>
          <month>07</month>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>31</fpage>
          <lpage>36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30310420"/>
          </comment>
          <pub-id pub-id-type="doi">10.15420/ecr.2015.10.01.31</pub-id>
          <pub-id pub-id-type="medline">30310420</pub-id>
          <pub-id pub-id-type="pmcid">PMC6159455</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maron</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rowin</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Casey</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Haas</surname>
              <given-names>TS</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Udelson</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Garberich</surname>
              <given-names>RF</given-names>
            </name>
            <name name-style="western">
              <surname>Lesser</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Appelbaum</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Maron</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Risk stratification and outcome of patients with hypertrophic cardiomyopathy ≥60 years of age</article-title>
          <source>Circulation</source>
          <year>2013</year>
          <month>02</month>
          <day>05</day>
          <volume>127</volume>
          <issue>5</issue>
          <fpage>585</fpage>
          <lpage>593</lpage>
          <pub-id pub-id-type="doi">10.1161/circulationaha.112.136085</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maron</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Rowin</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wessler</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Mooney</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fatima</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Koethe</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Romashko</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Link</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Maron</surname>
              <given-names>BJ</given-names>
            </name>
          </person-group>
          <article-title>Enhanced American College of Cardiology/American Heart Association strategy for prevention of sudden cardiac death in high-risk patients with hypertrophic cardiomyopathy</article-title>
          <source>JAMA Cardiol</source>
          <year>2019</year>
          <month>07</month>
          <day>01</day>
          <volume>4</volume>
          <issue>7</issue>
          <fpage>644</fpage>
          <lpage>657</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31116360"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamacardio.2019.1391</pub-id>
          <pub-id pub-id-type="medline">31116360</pub-id>
          <pub-id pub-id-type="pii">2733139</pub-id>
          <pub-id pub-id-type="pmcid">PMC6537832</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gersh</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Maron</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bonow</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dearani</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fifer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Link</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Naidu</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Nishimura</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Ommen</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Rakowski</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Seidman</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Towbin</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Udelson</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Yancy</surname>
              <given-names>CW</given-names>
            </name>
            <collab>American College of Cardiology Foundation/American Heart Association Task Force on Practice Guidelines</collab>
            <collab>American Association for Thoracic Surgery</collab>
            <collab>American Society of Echocardiography</collab>
            <collab>American Society of Nuclear Cardiology</collab>
            <collab>Heart Failure Society of America</collab>
            <collab>Heart Rhythm Society</collab>
            <collab>Society for Cardiovascular AngiographyInterventions</collab>
            <collab>Society of Thoracic Surgeons</collab>
          </person-group>
          <article-title>2011 ACCF/AHA guideline for the diagnosis and treatment of hypertrophic cardiomyopathy: a report of the American College of Cardiology Foundation/American Heart Association Task Force on Practice Guidelines</article-title>
          <source>Circulation</source>
          <year>2011</year>
          <month>12</month>
          <day>13</day>
          <volume>124</volume>
          <issue>24</issue>
          <fpage>e783</fpage>
          <lpage>831</lpage>
          <pub-id pub-id-type="doi">10.1161/CIR.0b013e318223e2bd</pub-id>
          <pub-id pub-id-type="medline">22068434</pub-id>
          <pub-id pub-id-type="pii">CIR.0b013e318223e2bd</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Robnik-Šikonja</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kononenko</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>An adaptation of Relief for attribute estimation in regression</article-title>
          <year>1997</year>
          <conf-name>Proceedings of the Fourteenth International Conference on Machine Learning (ICML) 1997</conf-name>
          <conf-date>1997</conf-date>
          <conf-loc>Nashville, TN, USA</conf-loc>
          <fpage>296</fpage>
          <lpage>304</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Flaxman</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Vahdatpour</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>James</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>CJ</given-names>
            </name>
            <collab>Population Health Metrics Research Consortium (PHMRC)</collab>
          </person-group>
          <article-title>Random forests for verbal autopsy analysis: multisite validation study using clinical diagnostic gold standards</article-title>
          <source>Popul Health Metr</source>
          <year>2011</year>
          <month>08</month>
          <day>04</day>
          <volume>9</volume>
          <fpage>29</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pophealthmetrics.biomedcentral.com/articles/10.1186/1478-7954-9-29"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1478-7954-9-29</pub-id>
          <pub-id pub-id-type="medline">21816105</pub-id>
          <pub-id pub-id-type="pii">1478-7954-9-29</pub-id>
          <pub-id pub-id-type="pmcid">PMC3160922</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Malley</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Kruppa</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dasgupta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Malley</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Ziegler</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Probability machines: consistent probability estimation using nonparametric learning machines</article-title>
          <source>Methods Inf Med</source>
          <year>2012</year>
          <volume>51</volume>
          <issue>1</issue>
          <fpage>74</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21915433"/>
          </comment>
          <pub-id pub-id-type="doi">10.3414/ME00-01-0052</pub-id>
          <pub-id pub-id-type="medline">21915433</pub-id>
          <pub-id pub-id-type="pii">00-01-0052</pub-id>
          <pub-id pub-id-type="pmcid">PMC3250568</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abraham</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Eickenberg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gervais</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mueller</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kossaifi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for neuroimaging with scikit-learn</article-title>
          <source>Front Neuroinform</source>
          <year>2014</year>
          <month>2</month>
          <day>21</day>
          <volume>8</volume>
          <fpage>14</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fninf.2014.00014"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fninf.2014.00014</pub-id>
          <pub-id pub-id-type="medline">24600388</pub-id>
          <pub-id pub-id-type="pmcid">PMC3930868</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>XGBoost: a scalable tree boosting system</article-title>
          <year>2016</year>
          <conf-name>Proceedings of the 22th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining KDD '16</conf-name>
          <conf-date>Aug 13, 2016</conf-date>
          <conf-loc>San Francisco, CA, USA</conf-loc>
          <publisher-loc>USA</publisher-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <fpage>785</fpage>
          <lpage>794</lpage>
          <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Malley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bursztein</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Long</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chollet</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Invernizzi</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <source>keras-team/keras-tuner: Hyperparameter Tuning for Humans</source>
          <access-date>2021-03-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/keras-team/keras-tuner">https://github.com/keras-team/keras-tuner</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bortsova</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Juárez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>van</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>de</surname>
              <given-names>BM</given-names>
            </name>
          </person-group>
          <article-title>Multi-task attention-based semi-supervised learning for medical image segmentation</article-title>
          <source>Lect Notes Comput Sci</source>
          <year>2019</year>
          <fpage>457</fpage>
          <lpage>465</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-32248-9_51</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>You</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Harada</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Semi-supervised learning in medical images through graph-embedded random forest</article-title>
          <source>Front Neuroinform</source>
          <year>2020</year>
          <month>11</month>
          <day>10</day>
          <volume>14</volume>
          <fpage>601829</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fninf.2020.601829"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fninf.2020.601829</pub-id>
          <pub-id pub-id-type="medline">33240071</pub-id>
          <pub-id pub-id-type="pmcid">PMC7683389</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Oktay</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Sinclair</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Suzuki</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rajchl</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tarroni</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Semi-supervised learning for network-based cardiac MR image segmentation</article-title>
          <source>Lecture Notes in Computer Science</source>
          <year>2017</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>253</fpage>
          <lpage>260</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Viceconti</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Henney</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Morley-Fletcher</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>In silico clinical trials: how computer simulation will transform the biomedical industry</article-title>
          <source>Int J Clin Trials</source>
          <year>2016</year>
          <month>05</month>
          <day>09</day>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>37</fpage>
          <pub-id pub-id-type="doi">10.18203/2349-3259.ijct20161408</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Niederer</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Lumens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Trayanova</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Computational models in cardiology</article-title>
          <source>Nat Rev Cardiol</source>
          <year>2019</year>
          <month>02</month>
          <volume>16</volume>
          <issue>2</issue>
          <fpage>100</fpage>
          <lpage>111</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30361497"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41569-018-0104-y</pub-id>
          <pub-id pub-id-type="medline">30361497</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41569-018-0104-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC6556062</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tannenbaum</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Holford</surname>
              <given-names>NHG</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Peck</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Mould</surname>
              <given-names>DR</given-names>
            </name>
          </person-group>
          <article-title>Simulation of correlated continuous and categorical variables using a single multivariate distribution</article-title>
          <source>J Pharmacokinet Pharmacodyn</source>
          <year>2006</year>
          <month>12</month>
          <volume>33</volume>
          <issue>6</issue>
          <fpage>773</fpage>
          <lpage>94</lpage>
          <pub-id pub-id-type="doi">10.1007/s10928-006-9033-1</pub-id>
          <pub-id pub-id-type="medline">17053984</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Robnik Šikonja</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Dataset comparison workflows</article-title>
          <source>IJDS</source>
          <year>2018</year>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>126</fpage>
          <lpage>145</lpage>
          <pub-id pub-id-type="doi">10.1504/ijds.2018.10013385</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bøtcher</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Dethlefsen</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>DEAL: a package for learning Bayesian networks</article-title>
          <source>J Stat Softw</source>
          <year>2003</year>
          <publisher-loc>Aalborg University</publisher-loc>
          <publisher-name>Department of Mathematical Sciences</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>D'Agostino</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Stephens</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Goodness-of-Fit Techniques</source>
          <year>1986</year>
          <publisher-loc>New York, NY, USA</publisher-loc>
          <publisher-name>Marcel Dekker</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Robnik-Šikonja</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bohanec</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Perturbation-Based Explanations of Prediction Models</source>
          <year>2018</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>159</fpage>
          <lpage>175</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="web">
          <source>SHaRe</source>
          <access-date>2021-05-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://theshareregistry.org/home/patient">https://theshareregistry.org/home/patient</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
