<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e73353</article-id><article-id pub-id-type="doi">10.2196/73353</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Cardiorenal Interorgan Assessment via a Novel Clustering Method Using Dynamic Time Warping on Electrocardiogram: Model Development and Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Zhao</surname><given-names>Sally</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Ye</surname><given-names>Zhan</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Adhin</surname><given-names>Bhavna</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Vuori</surname><given-names>Matti</given-names></name><degrees>LM</degrees><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Laukkanen</surname><given-names>Jari</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff6">6</xref><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><collab>FinnGen</collab><xref ref-type="aff" rid="aff8">8</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Fisch</surname><given-names>Sudeshna</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Pfizer (United States)</institution><addr-line>New York</addr-line><country>United States</country></aff><aff id="aff2"><institution>Pfizer (United States)</institution><addr-line>1 Portland St</addr-line><addr-line>Boston</addr-line><addr-line>MA</addr-line><country>United States</country></aff><aff id="aff3"><institution>Pfizer (United States)</institution><addr-line>Austin</addr-line><addr-line>TX</addr-line><country>United States</country></aff><aff id="aff4"><institution>Turku University Hospital</institution><addr-line>Turku</addr-line><country>Finland</country></aff><aff id="aff5"><institution>Institute for Molecular Medicine Finland</institution><addr-line>Helsinki</addr-line><country>Finland</country></aff><aff id="aff6"><institution>Institute of Clinical Medicine, University of Eastern Finland</institution><addr-line>Kuopio</addr-line><country>Finland</country></aff><aff id="aff7"><institution>Department of Medicine, Wellbeing Services County of Central Finland</institution><addr-line>Jyv&#x00E4;skyl&#x00E4;</addr-line><country>Finland</country></aff><aff id="aff8"><institution>University of Helsinki</institution><addr-line>Helsinki</addr-line><country>Finland</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Kopeva</surname><given-names>K</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Elechi</surname><given-names>Kelechi</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Misra</surname><given-names>Neeladri</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Madugula</surname><given-names>Sita Sirisha</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Zhan Ye, PhD, Pfizer (United States), 1 Portland St, Boston, MA, United States, 1 6175513000; <email>zhan.ye@pfizer.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>12</day><month>8</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e73353</elocation-id><history><date date-type="received"><day>03</day><month>03</month><year>2025</year></date><date date-type="rev-recd"><day>30</day><month>05</month><year>2025</year></date><date date-type="accepted"><day>04</day><month>06</month><year>2025</year></date></history><copyright-statement>&#x00A9; Sally Zhao, Zhan Ye, Bhavna Adhin, Matti Vuori, Jari Laukkanen, FinnGen, Sudeshna Fisch. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 12.8.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e73353"/><abstract><sec><title>Background</title><p>The heart and kidneys have vital functions in the human body that reciprocally influence each other physiologically. Pathological changes in 1 organ can damage the other. Epidemiologic studies show that greater than 50% of patients with heart failure (HF) have preserved ejection fraction (HFpEF). Additionally, 1 in 6 patients identified as having chronic kidney disease (CKD) also has HF. Thus, it is important to be able to predict and identify the cardiorenal relationship between HFpEF and CKD.</p></sec><sec><title>Objective</title><p>Creating an electrocardiogram (ECG)-enabled model that stratifies suspected patients with HFpEF would help identify CKD-enriched HFpEF clusters and phenogroups. Simultaneously, a minimal set of significant ECG features derived from the stratification model would aid precision medicine and practical diagnoses due to being more accessible and widely readable than a large set of clinical inputs. Furthermore, the validation of the existing cardiorenal relationship using this ECG-enabled model may lead to better biological understanding.</p></sec><sec sec-type="methods"><title>Methods</title><p>Using unsupervised clustering on all extractable ECG features from FinnGen, patients with an indication of HFpEF (filtered by left ventricular ejection fraction [LVEF] values &#x2265;50% and N-terminal pro B-type natriuretic peptide [NT-proBNP] values &#x003E;450 pg/mL) were categorized into different phenogroups and analyzed for CKD risk. After isolating significant predictive ECG features, unsupervised clustering and risk analysis were performed again to demonstrate the efficacy of using a minimal set of features for phenogrouping. These clusters were then compared to clusters formed using dynamic time warping (DTW) on raw ECG time series electrical signals. Afterward, these clusters were analyzed for CKD enrichment.</p></sec><sec sec-type="results"><title>Results</title><p>The PR interval and QRS duration stood out as significant features and were used as the minimal feature set. After generating and comparing clusters (k-means with all extracted ECG features, k-means with a minimal feature set, and DTW with full lead II ECG waveform), the DTW-generated clusters were most stable. ANOVA analysis also showed that several HFpEF clusters exhibited a deviation of CKD risk from baseline, allowing for further trajectory analysis. Specifically, the creatinine levels (a proxy for CKD) of several DTW-created clusters showed significant differences from the average. Based on the Jaccard score, the DTW clusters also showed the greatest alignment to baseline comparison clusters created by clustering on creatinine. In comparison, the other 2 sets of clusters (created by all extracted ECG features and the minimal set) performed similarly.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This project validates both the known cardiorenal relationship between HFpEF and CKD and the importance of the PR interval and QRS duration. After exploring the use of ECG data for patient clustering and stratification, DTW clustering with lead II waveforms resulted in the most clinically meaningful clusters in the context of HFpEF and CKD. This methodology may prove useful in exploring ECG clustering applications outside of HFpEF as well.</p></sec></abstract><kwd-group><kwd>data analysis</kwd><kwd>clustering</kwd><kwd>electrocardiogram</kwd><kwd>heart failure</kwd><kwd>chronic renal insufficiency</kwd><kwd>ECG</kwd><kwd>cardiorenal</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>This paper examines the relationship between a specific subtype of heart failure (HF), heart failure with preserved ejection fraction (HFpEF), and chronic kidney disease (CKD) marked by progressive renal failure [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>], emphasizing the pathophysiological connections. It explores the potential use of technology in trials and clinical management by leveraging simple and widely accessible clinical tools such as electrocardiograms (ECGs) to predict the underlying risk in subgroups and to enable earlier and more precise interventions. Such interventions can improve patient outcomes for chronic diseases of cardiovascular or overlapping renal origin [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref6">6</xref>].</p></sec><sec id="s1-2"><title>Biological Rationale</title><p>HF and renal failure are 2 interrelated conditions that often coexist, significantly impacting patient outcomes [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. The intricate and bidirectional relationship between the heart and kidneys illustrated in <xref ref-type="fig" rid="figure1">Figure 1</xref>, often referred to as the cardiorenal axis, underscores the significant unmet need to understand how dysfunction in 1 organ can precipitate or exacerbate dysfunction in the other, so that patients at risk for progression can be precisely diagnosed for earlier intervention before full onset of disease, thus improving the odds of better patient outcome [<xref ref-type="bibr" rid="ref10">10</xref>].</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Illustration of the cardiorenal relationship and functional mediators.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig01.png"/></fig><p>HF, which is marked by the heart&#x2019;s inability to pump blood effectively, initiates a series of physiological changes that can negatively impact renal function. Reduced cardiac output in HF leads to decreased renal perfusion, triggering compensatory mechanisms such as the activation of the renin-angiotensin-aldosterone system and sympathetic nervous system [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>].</p><p>Although these mechanisms initially aim to preserve renal function and maintain blood pressure, their chronic activation can produce adverse effects, including increased sodium and water retention, further worsening heart failure symptoms and contributing to renal impairment [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. HFpEF is characterized by the heart&#x2019;s inability to relax (diastolic defect) and fill properly, leading to heart failure symptoms despite a normal ejection fraction (systolic function).</p><p>Conversely, renal failure can significantly affect cardiac function. The kidneys regulate fluid and electrolyte balance, blood pressure, and the elimination of metabolic waste products. When renal function declines, fluid overload, electrolyte imbalances, and the accumulation of uremic toxins can occur, adding strain on the heart. This may lead to worsening HF, creating a cycle of deteriorating cardiac and renal function. This bidirectional nature of the heart-kidney interaction underscores the complexity of managing patients with both HF and renal failure. The ability to better predict risk in these vulnerable cohorts would be beneficial for disease understanding and clinical trial recruitment.</p></sec><sec id="s1-3"><title>ECG for Clustering</title><p>Recent advancements in artificial intelligence and machine learning have shown potential in predicting and managing the risks associated with cardiorenal syndrome. Artificial intelligence&#x2013;enabled models, for example, using ECG and biomarkers, have demonstrated promise in clinical care settings [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>].</p><p>An additional use of such an ECG model in drug development could be to identify patients with HFpEF who may demonstrate a potential risk profile for worsening kidney function based on a screening ECG. Such patients may demonstrate other comorbidities such as hypertension, diabetes, or obesity, as stated earlier. This underlying and hidden risk can be revealed early for an improved understanding of the associated risks with renally cleared cardiovascular drugs. The cardiac-specific electric signals provide significant discriminatory power for endophenotyping within the broader HFpEF spectrum [<xref ref-type="bibr" rid="ref17">17</xref>]. By leveraging machine learning-based unsupervised cluster analysis, this study aims to phenomap patients with HFpEF, enhancing the understanding and prediction of cardiorenal risk through a generalizable and interpretable ECG-based machine learning model.</p><p>Evaluating the importance of ECG features for unsupervised clustering can be difficult. A lot of tabular health care data, including the extracted ECG features, are highly correlated, which may lead to poor clustering results in practice. This also makes feature selection through Lasso very difficult. Reducing dimensionality often makes interpretability difficult as well, which is especially an issue for health care research. Thus, finding an unsupervised method that clusters high-dimensional correlated data through feature selection rather than dimension reduction would be very helpful [<xref ref-type="bibr" rid="ref18">18</xref>].</p></sec><sec id="s1-4"><title>Dynamic Time Warping With ECG</title><p>Dynamic time warping (DTW) measures the similarity between 2 temporal sequences and, thus, can be used as a metric for clustering temporal sequences. By creating a nonlinear alignment of time sequences that are of different lengths or exhibit time shift, it can calculate the Euclidean distance between points of the 2 warped sequences. DTW has been frequently used for longitudinal and trajectory analysis, including in health care settings [<xref ref-type="bibr" rid="ref19">19</xref>]. Due to the temporal nature of ECGs, DTW has been used to classify ECG frames and has been shown to be effective in finding nonlinear clusters of ECGs [<xref ref-type="bibr" rid="ref20">20</xref>]. Previous literature and studies for DTW ECG clustering use the lead II recording wavelengths due to the lead II wavelength being generally considered the best view of the electrical signals because of the electrode&#x2019;s placement [<xref ref-type="bibr" rid="ref19">19</xref>].</p><p>ECGs are particularly appropriate for this combination of DTW-supported unsupervised clustering and feature analysis. First, the assumption that patients themselves, rather than the extracted ECG values, are independent and identically distributed is much easier to meet. This may make unsupervised clustering results more promising than on extracted ECG data (which would be correlated tabular data). By treating each ECG record as a singular data point, we can perform DTW on the ECG as a time series. DTW is a technique that calculates the optimal match between given sequences (it can be thought of as clustering curves via distance rather than individual data points). This way, different clusters of ECG records can be formed and then analyzed for disease endpoint incidence, cluster stability, and other performance metrics.</p><p>Many studies focus on the relationship between HFpEF and electrocardiographic (ECG) features, but our work attempts to explore the cross-organ interactions between the heart and kidney in HFpEF by using an algorithm that uses specific features within ECG features as novel predictors of cardiorenal risk. Small changes in the electroconductance system of the heart can have a big impact on the hemodynamic load on the heart, exacerbating the load, and over time, affecting volume overload [<xref ref-type="bibr" rid="ref10">10</xref>] on the kidneys. However, such small changes in ECG, which may appear early, may not always be clinically apparent and can often be missed. In patients with HFpEF, clinical phenotype can be associated with diabetes, hypertension, and obesity [<xref ref-type="bibr" rid="ref21">21</xref>]. Using an ECG model to identify nonobvious patterns in the electrical signals of the heart captured through a standard ECG (12 leads) can serve as indicators for left ventricular dysfunction associated with HFpEF and can potentially also identify potential signals for renal risk in a subset of patients. This study seeks to validate the established cardiorenal relationship through ECG data analysis and investigate a novel approach for clustering in HFpEF subgroups using ECG data.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethical Considerations</title><p>The real-world electronic health data used from the FinnGen database, provided for analysis, were already anonymized by FinnGen. The ethics status, data collection process, consent process, and approvals can be seen in the original study [<xref ref-type="bibr" rid="ref22">22</xref>]. This study&#x2019;s data analysis was approved by the FinnGen Committee. Due to this, there was no need to seek further ethics board approval.</p></sec><sec id="s2-2"><title>Dataset Description</title><p>The FinnGen study is a large-scale genomics initiative that has analyzed over 500,000 Finnish biobank samples and correlated genetic variation with health data to understand disease mechanisms and predispositions. The project is a collaboration between research organizations and biobanks within Finland and international industry partners [<xref ref-type="bibr" rid="ref22">22</xref>]. This public-private partnership aggregates data from 9 different Finnish biobanks, research institutes, university hospitals, and 13 international pharmaceutical partners along with the Finnish Biobank Cooperative. Sample collection and data releases began in 2017, and the main phase of sample collection ended with FinnGen2 in 2023.</p><p>The Expansion Area 3 (EA3) studies aim to collect data on diseases that may not be present within existing FinnGen registries. Among these data is the EA3 Heart Failure Study cohort, which compiles relevant cardiovascular data from 4&#x2010;6 participating hospital biobanks. The study contains ECG files, ejection fraction values (40,809 individuals), and laboratory measurements (40,024 individuals) with B-type natriuretic peptide (BNP), proBNP, and creatinine values. Since the study is aggregated from several different existing biobanks, not all individuals have the same laboratory measurements. This project used the EA3 Heart Failure study, individuals with ECG, ejection fraction, and laboratories with creatinine and proBNP values all present.</p><p>The methods for extracting relevant features are changing and evolving over time [<xref ref-type="bibr" rid="ref23">23</xref>], but the idea remains the same. The ECG follows a characteristic PQRST wave that occurs in a periodic pattern. Each peak, trough, or section of this wave represents electrical signals of the heart and can be evaluated for further meaning. Clinicians can look at the ECG visually for meaning, but signal processing techniques can also retrieve the mathematical values from the waves themselves. Since there are multiple electrodes for measuring the ECG, this is usually taken from lead II signals (<xref ref-type="fig" rid="figure2">Figure 2</xref>) [<xref ref-type="bibr" rid="ref24">24</xref>] or aggregated.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>A sample lead II ECG wave. ECG: electrocardiogram.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig02.png"/></fig></sec><sec id="s2-3"><title>Data Preprocessing</title><p>The dataset was restricted to the population with HFpEF (<xref ref-type="table" rid="table1">Table 1</xref>). This was determined by selecting individuals with ejection fraction values greater than or equal to 50 and exhibiting HF at that time (<xref ref-type="fig" rid="figure3">Figure 3</xref>). All selected individuals were verified to have HF diagnoses (either I9 HF or I9 HF NS). Only ECGs recorded within a 6-month period of the heart failure diagnosis or laboratory indicative of HF were used in this study. Creatinine values were used as a proxy for the presence of CKD. The EA3 HF Cohort contained 1,626,275 laboratory records for 40,024 unique individuals. Among these, there were 7170 complete ECGs (extracted ECG values and raw ECG signals) and creatinine laboratory records for 3864 unique individuals with HFpEF (<xref ref-type="fig" rid="figure3">Figure 3</xref>). The raw lead II ECG signals each contained 5000 points of data and were taken from individual ECG files within the EA3 HF cohort. These signals were directly input into the DTW algorithm. It was these ECG and laboratory records that were used for clustering and analysis (<xref ref-type="fig" rid="figure4">Figure 4</xref>). Specifically, the data groups to be clustered included extracted ECG values, a minimal set of extracted ECG values, and raw lead II signals.</p><p>Clusters created through hierarchical clustering on creatinine served as a baseline for CKD risk, against which the ECG-enabled clusters were compared. This comparison aimed to evaluate the effectiveness of ECG-enabled clusters in stratifying patients with CKD risk within the context of HFpEF.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>A characteristics average table to give a better understanding of the clustering cohort. This cohort is comprised of individuals who have characteristics that indicate HFpEF (LVEF&#x2265;50% and NT-proBNP&#x003E;450 pg/mL).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Clustering cohort baseline characteristics</td><td align="left" valign="top">Values</td></tr></thead><tbody><tr><td align="left" valign="top">Age (years), mean (SD)</td><td align="left" valign="top">71.16 (11.32)</td></tr><tr><td align="left" valign="top">Women, n (%)</td><td align="left" valign="top">3478 (48.5)</td></tr><tr><td align="left" valign="top">BMI (kg/m<sup>2</sup>), %</td><td align="left" valign="top">28.4</td></tr><tr><td align="left" valign="top">NT-proBNP (pg/mL)</td><td align="left" valign="top">2018.1</td></tr><tr><td align="left" valign="top">LVEF<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> (%)</td><td align="left" valign="top">60.25</td></tr><tr><td align="left" valign="top">Creatinine (&#x00B5;mol/L)</td><td align="left" valign="top">103.02</td></tr><tr><td align="left" valign="top">Height (cm)</td><td align="left" valign="top">170.3</td></tr><tr><td align="left" valign="top">Weight (kg)</td><td align="left" valign="top">82.7</td></tr><tr><td align="left" valign="top">Current smoker, n (%)</td><td align="left" valign="top">882 (12.3)</td></tr><tr><td align="left" valign="top">Chronic kidney disease, n (%)</td><td align="left" valign="top">115 (1.6)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>LVEF: left ventricular ejection fraction.</p></fn><fn id="table1fn2"><p><sup>b</sup>NT-proBNP: N-terminal pro B-type natriuretic peptide.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>An illustration of the data processing flow and the sources of the dataset. CKD: chronic kidney disease; ECG: electrocardiogram; Expansion Area 3; HFpEF: heart failure with preserved ejection fraction.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig03.png"/></fig><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>An illustration of the methodology workflow. FinnGen ECG and laboratory records are used to create different sets of clusters: Creatinine clusters (hierarchical clusters based off creatinine labs to be used as a baseline indication for CKD), ECG feature clusters (clusters created using all extracted ECG features), PR-QRS clusters (clusters created using top variables determined to be significant in predicting CKD in HFpEF), and DTW clusters (clusters created using DTW on the raw ECG time series). For each set of clusters, 5 groups were formed. CKD: chronic kidney disease; DTW: dynamic time warping; ECG: electrocardiogram; HFpEF: heart failure with preserved ejection fraction.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig04.png"/></fig></sec><sec id="s2-4"><title>Statistical Analysis</title><p>Univariate analysis was first performed for exploratory purposes. Distributions and averages of the extracted ECG values (ie, ventricular rate, PR interval, QRS duration, QT corrected, P axis, R axis, T axis, QRS count, Q onset, Q offset, P onset, P offset, T offset, atrial rate, and QT interval) were calculated. A 1-tailed <italic>t</italic> test was conducted for all extracted ECG variables to determine if there was a significant difference between patients with non-CKD and CKD HFpEF ECG values. It was shown that all extracted features were indeed significantly different with a significance level of .05 (<xref ref-type="fig" rid="figure5">Figure 5</xref>). Survival analysis was also conducted using a Cox proportional hazard model and a Kaplan-Meier curve.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Distribution of significant extracted ECG values (QRS Duration and PR Interval) between patients who are CKD-positive and CKD-negative. CKD: chronic kidney disease; ECG: electrocardiogram; HF: heart failure; HFpEF: heart failure with preserved ejection fraction.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig05.png"/></fig><p>Multivariate analysis of the extracted features was also conducted. It must be noted that the method may not be wholly accurate because  the correlation between the extracted features is derived from the ECG waveform itself and can have some overlap (<xref ref-type="fig" rid="figure6">Figure 6</xref>). It must be noted that the method may not be wholly accurate because of the correlation between the extracted features. Additionally, these features lose some information in terms of the time component. However, it provides good exploratory insight into which combination of features would perform well for both CKD prediction and patient phenotyping.</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>A heatmap showing the correlation between extracted ECG features. ECG: electrocardiogram.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig06.png"/></fig></sec><sec id="s2-5"><title>Determining the Number of Clusters</title><p>To determine the number of clusters created, elbow curves (<xref ref-type="fig" rid="figure7">Figure 7</xref>) were created and analyzed to determine which number of clusters would be optimal. As both elbow charts exhibit diminishing returns at around the 5-cluster mark, it was determined that 5 clusters would be generated and compared.</p><fig position="float" id="figure7"><label>Figure 7.</label><caption><p>Elbow curves for extracted feature and DTW hierarchical clustering. This was used to determine the optimal number of clusters (t=5). The number of clusters was determined using these elbow charts and by seeing where the reduction in inertia or cut threshold has diminishing returns. DTW: dynamic time warping. WCSS: within-cluster sum of squares.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig07.png"/></fig></sec><sec id="s2-6"><title>Extracted Feature Clustering</title><p>Several methods were used, including principal component analysis (PCA), significance, and Lasso feature selection. Relevant hyperparameters (eg, &#x03B1; for Lasso dropout) were tuned iteratively to find the top 5 (5 is predefined) features. For PCA, 50 simulations were run for stability and robustness purposes. In every simulation, the FinnGen data were randomly sampled (training=0.8, 80% from all data) and PCA was conducted on this random sample to select the top 5 ranked features. The top 5 features in order are: ventricular rate, PR interval, QRS duration, QT corrected, and P axis. As for Lasso regression, the top features were QRS duration, QT interval, R axis, QT corrected, and PR interval. In terms of significance, the top features were ventricular rate, PR interval, QRS duration, QT corrected, and P axis, with the average explained variance reported in <xref ref-type="table" rid="table2">Table 2</xref> on the top features identified from multiple methods. From this exploration, we can see that the PR interval and QRS duration were always selected as top features.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>A table ranking component (electrocardiogram variable) importance by average explained variance. PR interval and QRS duration are among the top 3 extracted variables. Ventricular rate was not chosen because it was not selected among the top 5 features during Lasso regression.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">PCA<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> component</td><td align="left" valign="top">ECG<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> variable</td><td align="left" valign="top">Average explained variance</td></tr></thead><tbody><tr><td align="char" char="." valign="top">0</td><td align="left" valign="top">Ventricular rate</td><td align="left" valign="top">0.276</td></tr><tr><td align="char" char="." valign="top">1</td><td align="left" valign="top">PR interval</td><td align="left" valign="top">0.251</td></tr><tr><td align="char" char="." valign="top">2</td><td align="left" valign="top">QRS duration</td><td align="left" valign="top">0.156</td></tr><tr><td align="char" char="." valign="top">3</td><td align="left" valign="top">QT corrected</td><td align="left" valign="top">0.122</td></tr><tr><td align="char" char="." valign="top">4</td><td align="left" valign="top">P axis</td><td align="left" valign="top">0.091</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>PCA: principal component analysis.</p></fn><fn id="table2fn2"><p><sup>b</sup>ECG: electrocardiogram.</p></fn></table-wrap-foot></table-wrap><p>However, despite bootstrapping for stability and generalizability, the clusters formed from PR interval and QRS duration had low stability and consensus, despite performing better than clustering on all features. This is probably due to the correlated nature of the extracted ECG features. Thus, hierarchical clustering using DTW distance calculations was also performed to consider the correlation.</p></sec><sec id="s2-7"><title>DTW Clustering</title><p>The ECG lead II data were split into a training, validation, and test sets, each with 500 different unique individuals. Every patient&#x2019;s lead II data included 5000 signals. These were then clustered using hierarchical clustering with the Ward method. The Ward method was chosen because it is close in functionality to k-means, which makes it intuitive and interpretable. However, it also performs better than k-means on uncovering clusters of uneven size and irregular non-spherical clusters. Exploratory analysis has shown the clusters to be uneven and not guaranteed to be regular, which makes the Ward method a good fit.</p><p>DTW was used to determine the similarity between two time series. In this case, the time series would be the lead II ECG signals. This was done by calculating the Euclidean distance between each point after finding the best alignment of the 2 sequences (<xref ref-type="fig" rid="figure8">Figure 8</xref>). In order to find the best alignment or shift, the distance between pairs of points is compared, and the minimum distance is taken. This is done for the entirety of the 2 sequences. After creating a matrix representation for the costs associated with each alignment, the algorithm returns the minimum cost&#x2014;that is, the minimum distance between aligned time series. For the regular ECGs, little shift was needed to occur. No normalization techniques were applied to the ECG lead II records. For faster processing speeds, the code was parallelized using the Python (Python Software Foundation) multiprocessing module.</p><p>Afterward, creatinine values were associated with every ECG, and the average creatinine value was calculated for every cluster. The average creatinine value of the population with HFpEF was 101.51 umol/l. Additionally, all clusters were validated through bootstrapping the data. Multiple subsets of 500 were created and clustered. This was performed to measure the stability and generalizability of the various clusters. Since the k-means and hierarchical algorithms are not consistent and exact in their results every time, this was necessary to ensure that the observed clusters (and their associated creatinine values) remained stable.</p><fig position="float" id="figure8"><label>Figure 8.</label><caption><p>Pseudocode demonstrating the flow of the DTW algorithm and the generation of the matrix used for determining similarity between two separate time series. DTW: dynamic time warping.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig08.png"/></fig></sec><sec id="s2-8"><title>Creatinine Clusters</title><p>Since all clusters were created in an unsupervised manner, there was no true baseline to compare the cluster labels to. Thus, the 5 clusters formed by hierarchical clustering on the creatinine laboratory values were created as a stand-in. Being a waste product from muscle and protein breakdown, creatinine levels can serve as an estimation of kidney function and a metric for CKD. Thus, comparing the extracted ECG value and DTW-formed clusters to these creatinine-based clusters can demonstrate the former&#x2019;s capabilities in demonstrating creatinine enrichment and, subsequently, CKD enrichment.</p><p>Cluster stability was measured using the silhouette score [<xref ref-type="bibr" rid="ref25">25</xref>], co-cluster occurrence (Jaccard score), and Rand index [<xref ref-type="bibr" rid="ref26">26</xref>]. For the hierarchical clustering on the DTW-determined distance, the Jaccard index was determined to be a more relevant metric than the silhouette score. Compared to naively clustering on extracted features, the clusters were shown to be more stable.</p><p>Average features were calculated for every ECG cluster. ANOVA (<xref ref-type="table" rid="table3">Table 3</xref>) was conducted to determine any significant extracted feature difference between the clusters.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>ANOVA test on all extracted ECG<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> values between the 5 clusters identified in the ECG feature clusters.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">ECG variable</td><td align="left" valign="bottom"><italic>F</italic> test (<italic>df</italic>)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Ventricular rate</td><td align="left" valign="top">46.945 (4, 495)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">PR interval</td><td align="left" valign="top">2.466 (4, 495)</td><td align="left" valign="top">.062</td></tr><tr><td align="left" valign="top">QRS duration</td><td align="left" valign="top">42.311 (4, 495)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">QT corrected</td><td align="left" valign="top">14.901 (4, 495)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">P axis</td><td align="left" valign="top">.498 (4, 495)</td><td align="left" valign="top">.684</td></tr><tr><td align="left" valign="top">R axis</td><td align="left" valign="top">61.873 (4, 495)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">T axis</td><td align="left" valign="top">.226 (4, 495)</td><td align="left" valign="top">.878</td></tr><tr><td align="left" valign="top">QRS count</td><td align="left" valign="top">47.793 (4, 495)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Q onset</td><td align="left" valign="top">15.444 (4, 495)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Q offset</td><td align="left" valign="top">28.054 (4, 495)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">P onset</td><td align="left" valign="top">5.614 (4, 495)</td><td align="left" valign="top">.001</td></tr><tr><td align="left" valign="top">P offset</td><td align="left" valign="top">3.295 (4, 495)</td><td align="left" valign="top">.020</td></tr><tr><td align="left" valign="top">T offset</td><td align="left" valign="top">28.427 (4, 495)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Atrial rate</td><td align="left" valign="top">14.475 (4, 495)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">QT interval</td><td align="left" valign="top">29.769 (4, 495)</td><td align="left" valign="top">&#x003C;.001</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>ECG: electrocardiogram.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Clustering on Extracted ECG Features</title><p>The top 2 features determined are QRS duration and PR interval. Both of these features were unique among the top 5 ranked features in every method used (significance, Lasso, and PCA).</p><p>Although there is a difference between CKD incidence when clustering on all available ECG features compared to clustering on the significant ECG features (PR interval and QRS duration), the difference may be too small to be clinically significant.</p></sec><sec id="s3-2"><title>Clustering With DTW</title><p>Regardless of how many clusters the parameter is set for with hierarchical clustering, clustering with DTW consistently yielded approximately 5 groups (<xref ref-type="fig" rid="figure9">Figure 9</xref>). This phenomenon could be seen in both the testing and validation sets, and also when bootstrapping.</p><fig position="float" id="figure9"><label>Figure 9.</label><caption><p>Hierarchical clustering on the validation set. It can be seen that approximately 5 clusters form which match up to the number of clusters estimated using the elbow method on the extracted ECG values. Due to the number of time series that were clustered, there were too many labels to list individually. ECG: electrocardiogram.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig09.png"/></fig><p><xref ref-type="fig" rid="figure10">Figure 10</xref> shows that there were creatinine differences among DTW clusters. Additionally, all extracted ECG features with the exception of P axis, T axis, and PR interval were shown to be statistically significant from cluster to cluster (<xref ref-type="table" rid="table3">Table 3</xref>). This indicates that the clusters did measurably separate the ECG time series, not just by time series shape but also by the relevant values or sections that would be extracted from the series.</p><p>Based on the Jaccard Score, the DTW-created clusters are most similar to the creatinine-based clusters (<xref ref-type="fig" rid="figure11">Figure 11</xref>). This indicates that it is a better stand-in for CKD enrichment than clustering solely on ECG extracted features.</p><fig position="float" id="figure10"><label>Figure 10.</label><caption><p>Creatinine value distribution among the 5 clusters identified in dynamic time warping clusters.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig10.png"/></fig><fig position="float" id="figure11"><label>Figure 11.</label><caption><p>Jaccard score heatmap that compares the clusters&#x2019; similarities to each other. DTW: dynamic time warping; ECG: electrocardiogram.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e73353_fig11.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>From the results, the PR interval and QRS duration are shown to be the extracted ECG variables most associated with CKD in the HFpEF cohort. This follows the biological rationale as the PR interval and QRS complex are 2 important features of an ECG signal that capture both time and spatial dynamics of a cardiac cycle. Each aspect of the selected ECG features can provide valuable information about the heart&#x2019;s function. Since the heart pumps blood systemically and into the lungs and kidneys, the electric signals may also inform about any altered hemodynamics in the latter organs [<xref ref-type="bibr" rid="ref27">27</xref>].</p><p>The PR interval represents the time it takes for the electrical impulse to travel from the sinoatrial node, through the atria, to the ventricles. A prolonged PR interval may indicate a delay in the conduction of the electrical impulse, which can be caused by various conditions and is often suggestive of atrial abnormalities (eg, atrial volume and strain). The atrial changes can, in turn, affect subsequent changes in the ventricular contraction phase [<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>The QRS complex represents the depolarization of the ventricles, which triggers the contraction of the ventricles and the pumping of blood out of the heart into systemic circulation. The duration of the QRS complex is an important indicator of the heart&#x2019;s function, and a prolongation may indicate a delay in the conduction of the electrical impulse through the ventricles, which can be caused by various conditions, including bundle branch blocks, ventricular hypertrophy, or myocardial infarction [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. There is evidence to suggest that abnormalities in the PR interval and QRS duration may be associated with an increased risk of kidney disease in patients with HFpEF [<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>To make the connection from the heart to the kidney as shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>, it is important to note that these 2 time intervals reflect the heart&#x2019;s electrical conductance system and are intricately linked to cardiac relaxation, also known as diastole. During diastole, the heart fills with blood after the contraction of the ventricles, and this relaxation phase is important for maintaining adequate blood flow to the whole body, a capacity that is often lost in some patients with HFpEF.</p><p>ANOVA analysis shows significant differences between the creatinine levels of the 5 clusters generated by DTW. Not all the clusters&#x2019; creatinine levels differ significantly, but clusters 1 and 2 (<xref ref-type="fig" rid="figure10">Figure 10</xref>) do exhibit statistically significant differences. This means that DTW-enabled clustering was capable of stratifying patients with HFpEF with differing creatinine levels and thus differing CKD risk levels.</p><p>Despite the supported relationship between PR interval and QRS duration with CKD in HFpEF, the PR-QRS clusters did not demonstrate much similarity with the established creatinine clusters. Additionally, these PR-QRS clusters demonstrated low stability and less pronounced CKD incidence rates among the individual clusters. However, the PR-QRS clusters&#x2019; Jaccard similarity with the creatinine scores (0.09) and silhouette scores was similar to that of the ECG Feature clusters&#x2019; Jaccard similarity (0.11) with the creatinine scores and silhouette scores. This indicates that clustering on PR-QRS performs similarly to clustering on all extracted ECG features&#x2014;further demonstrating that a relationship exists between PR interval and QRS duration with CKD in HFpEF. Nevertheless, due to the cluster instability and low Jaccard similarity with the creatinine baseline, it could not be used to inform clinical decisions.</p><p>DTW clusters performed much better than the PR-QRS clusters and ECG feature clusters in terms of Jaccard similarity (0.37) to the established creatinine baseline. Although the cluster groupings were not perfectly equivalent, the similarity demonstrates the potential application of using DTW for ECG clustering. This is intuitively expected due to the DTW being able to fully use the entire ECG signal. Previous literature has also supported the clustering capabilities of DTW for ECG and other signal-based records.</p><p>However, the specific reason why DTW performed better remains to be seen. Knowing the difference between the information DTW clustering captures compared to the information extracted ECG features clustering captures would be helpful. This could be used for better understanding of the statistical aspects of DTW application for clustering, as well as the cardiorenal relationship between HFpEF and CKD in this case. DTW&#x2019;s better performance implies that the full lead II waveform contains more data than the extracted ECG features&#x2014;minimal set or otherwise. This means that solely using extracted ECG features when working with ECG data analysis may lead to some loss of context.</p></sec><sec id="s4-2"><title>Limitations</title><p>There were certain limitations to the dataset, most notably with regard to its demographics. As the FinnGen study aggregates data from Finnish biobanks, the population is overwhelmingly Finnish and lacks heterogeneity that may pose a challenge to generalizability to other populations. Certain patients were also overrepresented in the dataset. The average patient with HFpEF had 5 ECGs spaced over a 1-year period. However, there were patients who had many ECG records (greater than 5) and patients with only a few ECG records. The FinnGen EA3 Heart Failure cohort is also not representative of all HF or patients with HFpEF. This means that extrapolating this project&#x2019;s results to the wider population may not yield good results. There are disease differences between FinnGen and the external population&#x2014;the renal and cardiovascular outcomes may not perform well.</p><p>Additionally, although all data were sourced from the FinnGen EA3 Heart Failure cohort, the cohort itself is comprised of several different biobanks, and each biobank provides differing amounts of data. ECG data were only available from the Central Finland Biobank. This meant that, while some patients had characteristics that indicated HFpEF, they could not be included in this study since they lacked ECG data. This data limitation introduces bias as it means all individual data is effectively from the Central Finland Biobank.</p><p>HFpEF itself is also difficult to diagnose, and the current diagnosis is multifaceted, with many clinical parameters. Due to a lack of diagnosis codes in the FinnGen EA3 Heart Failure cohort, clinical diagnosis of HFpEF could not be obtained. We used the FinnGen R12 cohort to confirm that the selected dataset had HF diagnostic codes (either I9 Heart Failure or I9 Heart Failure NS). Thus, using this in combination with the LVEF and NT-proBNP values (some of the main parameters for HFpEF), the selected individuals are indicated for HFpEF. Although this selected cohort may not be purely composed of clinically diagnosed patients with HFpEF, there could have also been  a greater likelihood of finding an enrichment for patients with HFpEF. Furthermore, as the biological rationale behind the hypothesis is on the cardiorenal associations between the heart and kidneys, it is the specific heart features (ie, hypercontractility and failure) that are most relevant rather than a clinical diagnosis. The relationship between the heart and kidneys is already known to exist, so this cohort serves as a sort of positive control.</p><p>Due to the lack of diagnosis codes in the EA3 Heart Failure Cohort, CKD was also difficult to label. Even with diagnosis codes, it is entirely possible that this subset may be underdiagnosed. Creatinine laboratory records provided in the EA3 Heart Failure Cohort were used as proxies for CKD. Estimated glomerular filtration rate could have also been used, but these data were not as complete as the creatinine records and would have severely limited the cohort.</p><p>There are also confounding factors, such as medications or co-morbidities, that may affect both ECG readings and creatinine levels. Unfortunately, the lack of medications and co-morbidities from the dataset is a limitation that can be rectified in the future through validation on an external dataset such as the FinnGen R12 Cohort.</p><p>In addition, DTW also has its own limitations. Although it does consider the entire ECG signal, it reduces it down to a singular similarity metric (ie, distance) that may be reductive. Additionally, it is very computationally intensive and sensitive to noise. Extracted ECG values are not as sensitive to noise.</p><p>The main challenge with DTW was the time needed for calculations&#x2014;it took a long time for every calculation. Since the distance needed to be calculated for every possible time series pair (of which there were 14,000 due to an average of 5 ECGs per patient), this was very time-consuming. Since all analysis took place within the FinnGen sandbox, which is a closed environment, not all packages were available. This included the conventional packages for DTW calculations. This was further parallelized using Python&#x2019;s multiprocessing library for efficiency&#x2019;s sake.</p></sec><sec id="s4-3"><title>Future Directions</title><p>Applying ECG clustering with DTW to other disease areas for similar cluster enrichment analysis may be fruitful. Previous literature has demonstrated the capabilities of ECG for risk prediction in both cardiovascular and non-cardiovascular disease areas. Analyzing the differences in cluster enrichment analysis with DTW and classic supervised risk prediction approaches may be informative.</p><p>Further work could also segment the ECG time signals. In doing so, each area could be examined for its contribution to the DTW-determined signal similarity or distance. This way, the parts of the ECG that most affect the DTW distance could be identified and determined. However, this method would be very computationally intensive&#x2014;even more so than the current approach, which requires calculations for every pairwise ECG combination. Additionally, the FinnGen sandbox that houses the EA3 Heart Failure study only allows select Python packages to be installed and used (eg, the most popular and well-known ones such as <italic>pandas</italic>, <italic>numpy</italic>, <italic>matplotlib</italic>, <italic>scikit-learn</italic>, and more). DTW-related packages such as <italic>fastdtw</italic>, <italic>dtaidistance</italic>, or <italic>tslearn</italic> are not available on the server and must be manually coded and parallelized. This work would also need to be done for any signal segmentation DTW analysis.</p><p>Other future work involves incorporating DTW distance as a representation into autoencoders. Previous literature in both ECG and non-ECG areas has shown autoencoders to be accurate for disease trajectory and risk assessment. Incorporating not just the extracted ECG signals into autoencoders, but perhaps also a DTW score can be helpful.</p><p>Additionally, this study did not consider all comorbidities that are known to be associated with HFpEF [<xref ref-type="bibr" rid="ref1">1</xref>], nor did it account for associated changes due to medication use in the selected cohort, for example, blood pressure control. As such, the study has limited its scope to cardiac-specific criteria and specific analytes (eg, creatinine in its methodology to understand the direct cardiorenal association). In the future, we may want to understand the potential synergies and constraints derived from adding more features, which may improve the accuracy of the prediction. In particular, we may want to evaluate the combinatorial effect of underlying physiology, medication, preexisting diseases, urinary and blood-based metabolic and protein biomarkers, and genetics that may interact with each other and our selected features. While lack of various associated clinical data may be a limitation of this study, we propose that our approach minimizes noncardiac effects that may often mask the true association between organs, for example, changes in blood pressure or pulmonary changes that may also be seen in HFpEF that have shown as a phenogroup in earlier studies [<xref ref-type="bibr" rid="ref17">17</xref>], do not stand in conflict with our methodology. As we validate our study using other public datasets, for example, the UK Biobank, we would consider expanding the scope of the analysis.</p><p>As for practical adoption for clinical practice, the model itself is currently exploratory. The DTW-enabled clusters do show promise for patient stratification and exhibit statistically significant results in the context of HFpEF and CKD, but the associations may not be strong enough to be clinically relevant. However, the model does further validate the cardiorenal relationship and also shows ECG data to be particularly useful for phenogrouping. It showcases the relationship in a well-established cohort with good clinical phenotyping and ECG data. Specifically, the full lead II waveform is most beneficial for detecting CKD risk in patients with HFpEF&#x2014;more so than any single or set of extracted ECG variables. Relying on extracted ECG variables may not give the full picture. With this information in mind, health care providers can be more aware during clinical practice. In a research setting, this information about ECG data extraction is important as it shows that not using the full waveform could lead to loss of data. The model built will be useful in expanding research beyond the relationship between ECG from patients with HFpEF to other interesting clinical phenotypes as well.</p></sec><sec id="s4-4"><title>Conclusions</title><p>From the results, the PR interval and QRS duration are shown to be the extracted ECG variables most associated with CKD in the HFpEF cohort. This follows the biological rationale as the PR interval and QRS complex are 2 important features of an ECG signal that capture both time and spatial dynamics of a cardiac cycle. The DTW application for ECG clustering would also be fruitful to explore.</p></sec></sec></body><back><ack><p>The authors would like to thank Sabrina Hsueh, Asa Hedman, Craig Hyde, and the FinnGen team for their careful review of the manuscript and for their support for this study. The authors would also like to acknowledge the participants and investigators of the FinnGen study. This research was funded by Pfizer, Inc.</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available in the FinnGen EA3 Heart Failure repository [<xref ref-type="bibr" rid="ref22">22</xref>].The data were publicly made available by FinnGen. Based on National and European regulations, access to individual-level sensitive health data must be approved by national authorities for specific research projects and for specifically listed and approved researchers. The health data described here was generated and provided by the National Health Register Authorities (Finnish Institute of Health and Welfare, Statistics Finland, KELA, Digital and Population Data Services Agency) and approved, either by the individual authorities or by the Finnish Data Authority, Findata, for use in the FinnGen project. Therefore, we, the authors of this paper, are not in a position to grant access to individual-level data to others. However, any researcher can apply for the health register data from the Finnish Data Authority Findata and for individual-level genotype data from Finnish biobanks via the Fingenious portal hosted by the Finnish Biobank Cooperative FINBB.</p></sec></notes><fn-group><fn fn-type="con"><p>SF conceptualized the study design and provided the initial hypothesis based off the existing known cardiorenal relationship. Both SZ and ZY conducted the statistical analysis. SZ conducted all the analyses within the FinnGen sandbox and provided the figures while ZY helped inform design and validation. BA was responsible for the data informatics parts and also overlooked the manuscript editing as a medical writer. SZ, ZY, SF, and BA all wrote and prepared the initial manuscript draft. MV and JL supported the FinnGen data collection. Additionally, MV provided key medical insights and provided the ECG data in the FinnGen EA3 Heart Failure repository.</p></fn><fn fn-type="conflict"><p>SF, ZY, and BA are employees and shareholders of Pfizer, Inc. SZ was an intern at Pfizer Inc. at the time of the work and a full-time student at Columbia University.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CKD</term><def><p>chronic kidney disease</p></def></def-item><def-item><term id="abb2">DTW</term><def><p>dynamic time warping</p></def></def-item><def-item><term id="abb3">EA3</term><def><p>Expansion Area 3</p></def></def-item><def-item><term id="abb4">ECG</term><def><p>electrocardiogram</p></def></def-item><def-item><term id="abb5">HF</term><def><p>heart failure</p></def></def-item><def-item><term id="abb6">HFpEF</term><def><p>heart failure with preserved ejection fraction</p></def></def-item><def-item><term id="abb7">PCA</term><def><p>principal component analysis</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Oktay</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>SJ</given-names> </name></person-group><article-title>Diagnosis and management of heart failure with preserved ejection fraction: 10 key lessons</article-title><source>Curr Cardiol Rev</source><year>2015</year><volume>11</volume><issue>1</issue><fpage>42</fpage><lpage>52</lpage><pub-id pub-id-type="doi">10.2174/1573403x09666131117131217</pub-id><pub-id pub-id-type="medline">24251461</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vallon</surname><given-names>V</given-names> </name><name name-style="western"><surname>Verma</surname><given-names>S</given-names> </name></person-group><article-title>Effects of SGLT2 inhibitors on kidney and cardiovascular function</article-title><source>Annu Rev Physiol</source><year>2021</year><month>02</month><day>10</day><volume>83</volume><issue>1</issue><fpage>503</fpage><lpage>528</lpage><pub-id pub-id-type="doi">10.1146/annurev-physiol-031620-095920</pub-id><pub-id pub-id-type="medline">33197224</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Parikh</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Sharma</surname><given-names>K</given-names> </name><name name-style="western"><surname>Fiuzat</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Heart failure with preserved ejection fraction expert panel report: current controversies and implications for clinical trials</article-title><source>JACC: Hear Fail</source><year>2018</year><volume>6</volume><issue>8</issue><fpage>619</fpage><lpage>632</lpage><pub-id pub-id-type="doi">10.1016/j.jchf.2018.06.008</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gadaleta</surname><given-names>M</given-names> </name><name name-style="western"><surname>Harrington</surname><given-names>P</given-names> </name><name name-style="western"><surname>Barnhill</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Prediction of atrial fibrillation from at-home single-lead ECG signals without arrhythmias</article-title><source>NPJ Digit Med</source><year>2023</year><month>12</month><day>12</day><volume>6</volume><issue>1</issue><fpage>229</fpage><pub-id pub-id-type="doi">10.1038/s41746-023-00966-w</pub-id><pub-id pub-id-type="medline">38087028</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mc Causland</surname><given-names>FR</given-names> </name><name name-style="western"><surname>Lefkowitz</surname><given-names>MP</given-names> </name><name name-style="western"><surname>Claggett</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Angiotensin-neprilysin inhibition and renal outcomes in heart failure with preserved ejection fraction</article-title><source>Circulation</source><year>2020</year><month>09</month><day>29</day><volume>142</volume><issue>13</issue><fpage>1236</fpage><lpage>1245</lpage><pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.120.047643</pub-id><pub-id pub-id-type="medline">32845715</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Al Younis</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Hadjileontiadis</surname><given-names>LJ</given-names> </name><name name-style="western"><surname>Khandoker</surname><given-names>AH</given-names> </name><etal/></person-group><article-title>Prediction of heart failure patients with distinct left ventricular ejection fraction levels using circadian ECG features and machine learning</article-title><source>PLOS ONE</source><year>2024</year><volume>19</volume><issue>5</issue><fpage>e0302639</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0302639</pub-id><pub-id pub-id-type="medline">38739639</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Triposkiadis</surname><given-names>F</given-names> </name><name name-style="western"><surname>Giamouzis</surname><given-names>G</given-names> </name><name name-style="western"><surname>Parissis</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Reframing the association and significance of co&#x2010;morbidities in heart failure</article-title><source>European J Heart Fail</source><year>2016</year><month>07</month><volume>18</volume><issue>7</issue><fpage>744</fpage><lpage>758</lpage><pub-id pub-id-type="doi">10.1002/ejhf.600</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Szlagor</surname><given-names>M</given-names> </name><name name-style="western"><surname>Dybiec</surname><given-names>J</given-names> </name><name name-style="western"><surname>M&#x0142;ynarska</surname><given-names>E</given-names> </name><name name-style="western"><surname>Rysz</surname><given-names>J</given-names> </name><name name-style="western"><surname>Franczyk</surname><given-names>B</given-names> </name></person-group><article-title>Chronic kidney disease as a comorbidity in heart failure</article-title><source>Int J Mol Sci</source><year>2023</year><month>02</month><day>3</day><volume>24</volume><issue>3</issue><fpage>2988</fpage><pub-id pub-id-type="doi">10.3390/ijms24032988</pub-id><pub-id pub-id-type="medline">36769308</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gabbin</surname><given-names>B</given-names> </name><name name-style="western"><surname>Meraviglia</surname><given-names>V</given-names> </name><name name-style="western"><surname>Mummery</surname><given-names>CL</given-names> </name><etal/></person-group><article-title>Toward human models of cardiorenal syndrome in vitro</article-title><source>Front Cardiovasc Med</source><year>2022</year><volume>9</volume><fpage>889553</fpage><pub-id pub-id-type="doi">10.3389/fcvm.2022.889553</pub-id><pub-id pub-id-type="medline">35694669</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McCullough</surname><given-names>PA</given-names> </name><name name-style="western"><surname>Amin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pantalone</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Ronco</surname><given-names>C</given-names> </name></person-group><article-title>Cardiorenal nexus: a review with focus on combined chronic heart and kidney failure, and insights from recent clinical trials</article-title><source>J Am Heart Assoc</source><year>2022</year><month>06</month><day>7</day><volume>11</volume><issue>11</issue><fpage>e024139</fpage><pub-id pub-id-type="doi">10.1161/JAHA.121.024139</pub-id><pub-id pub-id-type="medline">35616212</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jung</surname><given-names>S</given-names> </name><name name-style="western"><surname>Bosch</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kolwelter</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Renal and intraglomerular haemodynamics in chronic heart failure with preserved and reduced ejection fraction</article-title><source>ESC Heart Fail</source><year>2021</year><month>04</month><volume>8</volume><issue>2</issue><fpage>1562</fpage><lpage>1570</lpage><pub-id pub-id-type="doi">10.1002/ehf2.13257</pub-id><pub-id pub-id-type="medline">33559346</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Srivaratharajah</surname><given-names>K</given-names> </name><name name-style="western"><surname>Coutinho</surname><given-names>T</given-names> </name><name name-style="western"><surname>deKemp</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Reduced myocardial flow in heart failure patients with preserved ejection fraction</article-title><source>Circ Heart Fail</source><year>2016</year><month>07</month><volume>9</volume><issue>7</issue><fpage>e002562</fpage><pub-id pub-id-type="doi">10.1161/CIRCHEARTFAILURE.115.002562</pub-id><pub-id pub-id-type="medline">27413034</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Okita</surname><given-names>J</given-names> </name><name name-style="western"><surname>Nakata</surname><given-names>T</given-names> </name><name name-style="western"><surname>Uchida</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Development and validation of a machine learning model to predict time to renal replacement therapy in patients with chronic kidney disease</article-title><source>BMC Nephrol</source><year>2024</year><month>03</month><day>16</day><volume>25</volume><issue>1</issue><fpage>101</fpage><pub-id pub-id-type="doi">10.1186/s12882-024-03527-9</pub-id><pub-id pub-id-type="medline">38493099</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Buglioni</surname><given-names>A</given-names> </name><name name-style="western"><surname>Burnett</surname><given-names>JC</given-names> </name></person-group><article-title>Pathophysiology and the cardiorenal connection in heart failure. Circulating hormones: biomarkers or mediators</article-title><source>Clin Chim Acta</source><year>2015</year><month>03</month><day>30</day><volume>443</volume><issue>3&#x2013;8</issue><fpage>3</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1016/j.cca.2014.10.027</pub-id><pub-id pub-id-type="medline">25445413</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chousou</surname><given-names>PA</given-names> </name><name name-style="western"><surname>Chattopadhyay</surname><given-names>R</given-names> </name><name name-style="western"><surname>Tsampasian</surname><given-names>V</given-names> </name><name name-style="western"><surname>Vassiliou</surname><given-names>VS</given-names> </name><name name-style="western"><surname>Pugh</surname><given-names>PJ</given-names> </name></person-group><article-title>Electrocardiographic predictors of atrial fibrillation</article-title><source>Med Sci (Basel)</source><year>2023</year><month>04</month><day>7</day><volume>11</volume><issue>2</issue><fpage>30</fpage><pub-id pub-id-type="doi">10.3390/medsci11020030</pub-id><pub-id pub-id-type="medline">37092499</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kitzman</surname><given-names>DW</given-names> </name><name name-style="western"><surname>Upadhya</surname><given-names>B</given-names> </name><name name-style="western"><surname>Felker</surname><given-names>GM</given-names> </name></person-group><article-title>A biomarker approach to understanding HFpEF</article-title><source>J Am Coll Cardiol</source><year>2020</year><month>03</month><day>24</day><volume>75</volume><issue>11</issue><fpage>1296</fpage><lpage>1298</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2020.01.020</pub-id><pub-id pub-id-type="medline">32192655</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hedman</surname><given-names>&#x00C5;K</given-names> </name><name name-style="western"><surname>Hage</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sharma</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Identification of novel pheno-groups in heart failure with preserved ejection fraction using machine learning</article-title><source>Heart</source><year>2020</year><month>03</month><volume>106</volume><issue>5</issue><fpage>342</fpage><lpage>349</lpage><pub-id pub-id-type="doi">10.1136/heartjnl-2019-315481</pub-id><pub-id pub-id-type="medline">31911501</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aguiar</surname><given-names>H</given-names> </name><name name-style="western"><surname>Santos</surname><given-names>M</given-names> </name><name name-style="western"><surname>Watkinson</surname><given-names>P</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>T</given-names> </name></person-group><article-title>Learning of cluster-based feature importance for electronic health record time-series</article-title><source>Proc Mach Learn Res</source><year>2022</year><access-date>2025-07-30</access-date><volume>162</volume><fpage>161</fpage><lpage>179</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://proceedings.mlr.press/v162/aguiar22a.html">https://proceedings.mlr.press/v162/aguiar22a.html</ext-link></comment></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shorten</surname><given-names>GP</given-names> </name><name name-style="western"><surname>Burke</surname><given-names>MJ</given-names> </name></person-group><article-title>Use of dynamic time warping for accurate ECG signal timing characterization</article-title><source>J Med Eng Technol</source><year>2014</year><month>05</month><volume>38</volume><issue>4</issue><fpage>188</fpage><lpage>201</lpage><pub-id pub-id-type="doi">10.3109/03091902.2014.902514</pub-id><pub-id pub-id-type="medline">24758391</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Kinsner</surname><given-names>W</given-names> </name></person-group><article-title>ECG frame classification using dynamic time warping</article-title><conf-name>IEEE CCECE2002 Canadian Conference on Electrical and Computer Engineering</conf-name><conf-date>May 12-15, 2002</conf-date><conf-loc>Winnipeg, Man, Canada</conf-loc><fpage>1105</fpage><lpage>1110</lpage><pub-id pub-id-type="doi">10.1109/CCECE.2002.1013101</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Borlaug</surname><given-names>BA</given-names> </name></person-group><article-title>Evaluation and management of heart failure with preserved ejection fraction</article-title><source>Nat Rev Cardiol</source><year>2020</year><month>09</month><volume>17</volume><issue>9</issue><fpage>559</fpage><lpage>573</lpage><pub-id pub-id-type="doi">10.1038/s41569-020-0363-2</pub-id><pub-id pub-id-type="medline">32231333</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kurki</surname><given-names>MI</given-names> </name><name name-style="western"><surname>Karjalainen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Palta</surname><given-names>P</given-names> </name><etal/></person-group><article-title>FinnGen provides genetic insights from a well-phenotyped isolated population</article-title><source>Nature New Biol</source><year>2023</year><month>01</month><volume>613</volume><issue>7944</issue><fpage>508</fpage><lpage>518</lpage><pub-id pub-id-type="doi">10.1038/s41586-022-05473-8</pub-id><pub-id pub-id-type="medline">36653562</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Singh</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Krishnan</surname><given-names>S</given-names> </name></person-group><article-title>ECG signal feature extraction trends in methods and applications</article-title><source>Biomed Eng Online</source><year>2023</year><month>03</month><day>8</day><volume>22</volume><issue>1</issue><fpage>22</fpage><pub-id pub-id-type="doi">10.1186/s12938-023-01075-1</pub-id><pub-id pub-id-type="medline">36890566</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stor&#x00E5;s</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Andersen</surname><given-names>OE</given-names> </name><name name-style="western"><surname>Lockhart</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Usefulness of heat map explanations for deep-learning&#x2013;based electrocardiogram analysis</article-title><source>Diagnostics (Basel)</source><year>2023</year><month>07</month><day>11</day><volume>13</volume><issue>14</issue><fpage>2345</fpage><pub-id pub-id-type="doi">10.3390/diagnostics13142345</pub-id><pub-id pub-id-type="medline">37510089</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rousseeuw</surname><given-names>PJ</given-names> </name></person-group><article-title>Silhouettes: A graphical aid to the interpretation and validation of cluster analysis</article-title><source>J Comput Appl Math</source><year>1987</year><month>11</month><volume>20</volume><fpage>53</fpage><lpage>65</lpage><pub-id pub-id-type="doi">10.1016/0377-0427(87)90125-7</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rand</surname><given-names>WM</given-names> </name></person-group><article-title>Objective criteria for the evaluation of clustering methods</article-title><source>J Am Stat Assoc</source><year>1971</year><month>12</month><volume>66</volume><issue>336</issue><fpage>846</fpage><lpage>850</lpage><pub-id pub-id-type="doi">10.1080/01621459.1971.10482356</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Verbrugge</surname><given-names>FH</given-names> </name><name name-style="western"><surname>Guazzi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Testani</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Borlaug</surname><given-names>BA</given-names> </name></person-group><article-title>Altered hemodynamics and end-organ damage in heart failure</article-title><source>Circulation</source><year>2020</year><month>09</month><day>8</day><volume>142</volume><issue>10</issue><fpage>998</fpage><lpage>1012</lpage><pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.119.045409</pub-id><pub-id pub-id-type="medline">32897746</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Unger</surname><given-names>ED</given-names> </name><name name-style="western"><surname>Dubin</surname><given-names>RF</given-names> </name><name name-style="western"><surname>Deo</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Association of chronic kidney disease with abnormal cardiac mechanics and adverse outcomes in patients with heart failure and preserved ejection fraction</article-title><source>Eur J Heart Fail</source><year>2016</year><month>01</month><volume>18</volume><issue>1</issue><fpage>103</fpage><lpage>112</lpage><pub-id pub-id-type="doi">10.1002/ejhf.445</pub-id><pub-id pub-id-type="medline">26635076</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sung</surname><given-names>KT</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Chi</surname><given-names>PC</given-names> </name><etal/></person-group><article-title>QRS fragmentation in preserved ejection fraction heart failure: functional insights, pathological correlates, and prognosis</article-title><source>J Am Heart Assoc</source><year>2023</year><month>03</month><day>21</day><volume>12</volume><issue>6</issue><fpage>e028105</fpage><pub-id pub-id-type="doi">10.1161/JAHA.122.028105</pub-id><pub-id pub-id-type="medline">36892085</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sivri</surname><given-names>F</given-names> </name><name name-style="western"><surname>Icen</surname><given-names>YK</given-names> </name><name name-style="western"><surname>Koca</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Selvester QRS score is a predictor of mortality in heart failure with preserved ejection fraction</article-title><source>Arq Bras Cardiol</source><year>2023</year><volume>120</volume><issue>9</issue><fpage>e20230235</fpage><pub-id pub-id-type="doi">10.36660/abc.20230235</pub-id><pub-id pub-id-type="medline">37820175</pub-id></nlm-citation></ref></ref-list></back></article>