<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v14i1e80343</article-id><article-id pub-id-type="doi">10.2196/80343</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Machine Learning Prediction of Progression to Dialysis in Patients With Polycystic Kidney Disease: Population-Based Retrospective Cohort Study</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Chang</surname><given-names>Cheng-Hao</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Chen</surname><given-names>Mingchih</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Tsai</surname><given-names>Ming-Hsien</given-names></name><degrees>MD, PhD</degrees><xref 
ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Huang</surname><given-names>Yen-Chun</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liou</surname><given-names>Hung-Hsiang</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Shia</surname><given-names>Ben-Chang</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liang</surname><given-names>Chingying</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Fang</surname><given-names>Yu-Wei</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Division of Nephrology, Department of Internal Medicine, Shin-Kong Wu Ho-Su Memorial Hospital</institution><addr-line>No.95, Wen-Chang Road, Shih-lin District</addr-line><addr-line>Taipei</addr-line><country>Taiwan</country></aff><aff id="aff2"><institution>Graduate Institute of Business Administration, College of Management, Fu Jen Catholic University</institution><addr-line>New Taipei City</addr-line><country>Taiwan</country></aff><aff id="aff3"><institution>AI Development Center, Fu Jen Catholic University</institution><addr-line>New Taipei City</addr-line><country>Taiwan</country></aff><aff id="aff4"><institution>Department of Medicine, Fu Jen Catholic University School of Medicine</institution><addr-line>New Taipei 
City</addr-line><country>Taiwan</country></aff><aff id="aff5"><institution>Department of Artificial Intelligence, Tamkang University</institution><addr-line>New Taipei City</addr-line><country>Taiwan</country></aff><aff id="aff6"><institution>Division of Nephrology, Department of Internal Medicine, Hsin-Jen Hospital</institution><addr-line>New Taipei City</addr-line><country>Taiwan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib><contrib contrib-type="editor"><name name-style="western"><surname>Benis</surname><given-names>Arriel</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Duan</surname><given-names>Shao-Bin</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Chai</surname><given-names>Soo See</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Yu-Wei Fang, MD, PhD, Division of Nephrology, Department of Internal Medicine, Shin-Kong Wu Ho-Su Memorial Hospital, No.95, Wen-Chang Road, Shih-lin District, Taipei, 111, Taiwan, 886-912376017; <email>m005916@gmail.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>16</day><month>3</month><year>2026</year></pub-date><volume>14</volume><elocation-id>e80343</elocation-id><history><date date-type="received"><day>09</day><month>07</month><year>2025</year></date><date date-type="rev-recd"><day>14</day><month>02</month><year>2026</year></date><date date-type="accepted"><day>17</day><month>02</month><year>2026</year></date></history><copyright-statement>&#x00A9; Cheng-Hao Chang, Mingchih Chen, Ming-Hsien Tsai, Yen-Chun Huang, Hung-Hsiang Liou, Ben-Chang Shia, Chingying Liang, 
Yu-Wei Fang. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 16.3.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2026/1/e80343"/><abstract><sec><title>Background</title><p>Autosomal dominant polycystic kidney disease (ADPKD), characterized by progressive cyst growth and renal decline, is the leading genetic cause of end&#x2010;stage renal disease.</p></sec><sec><title>Objective</title><p>This study aims to develop and validate machine learning (ML) models for predicting the risk of progression to dialysis in patients with ADPKD using a nationwide administrative database. Early identification of high-risk patients is critical for timely monitoring.</p></sec><sec sec-type="methods"><title>Methods</title><p>This retrospective cohort study used data from Taiwan&#x2019;s National Health Insurance Research Database (2007&#x2010;2018) to identify newly diagnosed patients with ADPKD. 
Six ML algorithms, including logistic regression, random forest, and extreme gradient boosting (XGBoost), were employed to predict progression to dialysis. Models were developed using 10-fold cross-validation, with the Synthetic Minority Oversampling Technique applied within training folds to address class imbalance. An ensemble-based feature selection strategy was implemented to identify the most robust predictors and optimize final model performance. Model evaluation was conducted using a strict temporal split.</p></sec><sec sec-type="results"><title>Results</title><p>The study included 1856 patients with ADPKD, of whom 302 (16.27%) progressed to dialysis. Multivariable Cox regression identified several significant risk factors, including age 66 years and older (hazard ratio [HR] 4.63, 95% CI 2.71&#x2010;7.92; <italic>P</italic>&#x003C;.001), anemia (HR 4.33, 95% CI 3.25&#x2010;5.78; <italic>P</italic>&#x003C;.001), congestive heart failure (HR 1.81, 95% CI 1.29&#x2010;2.54; <italic>P</italic>&#x003C;.001), and acute kidney injury (HR 1.69, 95% CI 1.19&#x2010;2.41; <italic>P</italic>=.003). Among the ML models, the XGBoost model, using an optimized set of 27 features, demonstrated the highest predictive performance on the held-out temporal test set (accuracy 98.3%; area under the curve 0.955; <italic>F</italic><sub>1</sub>-score 0.800; Brier score 0.022). The top predictors in the XGBoost model largely aligned with age, comorbidity burden, anemia, and cardiovascular disease markers. Medication use (eg, anticoagulants, loop diuretics, febuxostat) was also among the most influential predictors; however, medication-related predictors should be interpreted as proxies for disease complexity rather than direct risk modulators.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>ML models can predict dialysis risk in patients with ADPKD using administrative data with temporal validation. 
This approach may support risk stratification by helping identify individuals at higher predicted risk who may warrant closer monitoring and further specialist evaluation.</p></sec></abstract><kwd-group><kwd>autosomal dominant polycystic kidney disease</kwd><kwd>ADPKD</kwd><kwd>artificial intelligence</kwd><kwd>machine learning</kwd><kwd>dialysis risk</kwd><kwd>predictive modeling</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>Polycystic kidney disease (PKD) is the leading genetic cause of end-stage renal disease (ESRD). The most common mutations in PKD occur in the <italic>PKD1</italic> or <italic>PKD2</italic> gene, which encode the proteins polycystin-1 and polycystin-2, respectively. These mutations result in abnormal cell proliferation, fluid secretion, and differentiation, leading to the formation and growth of cysts [<xref ref-type="bibr" rid="ref1">1</xref>]. The progressive nature of renal cysts may cause structural and functional changes in the kidney. According to the latest guidelines, the estimated prevalence of PKD varies widely, ranging from approximately 2 to 14 per 10,000 individuals, depending on the study methodology and population characteristics [<xref ref-type="bibr" rid="ref2">2</xref>].</p><p>Contemporary management of autosomal dominant polycystic kidney disease (ADPKD) has evolved to include both the management of associated complications and direct interventions aimed at the disease mechanism. A cornerstone of care remains the control of hypertension, a common and impactful complication. Angiotensin-converting enzyme inhibitors (ACEIs) and angiotensin II receptor blockers (ARBs) are widely recommended for their established efficacy in blood pressure control and proteinuria mitigation [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. 
In addition, lifestyle interventions, such as dietary sodium restriction and weight management, play a crucial role in preserving renal function [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. In parallel, disease-modifying therapies, such as the vasopressin V2 receptor antagonist tolvaptan, have been developed to slow cyst growth in select patients with rapidly progressing disease, who are often identified using prognostic markers such as genetic status or total kidney volume (TKV) [<xref ref-type="bibr" rid="ref7">7</xref>]. Furthermore, other medications, such as statins and metformin, are frequently prescribed to manage concurrent conditions in this population, though their role as primary treatment options for ADPKD itself remains under investigation [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>].</p></sec><sec id="s1-2"><title>Study Objective</title><p>While risk stratification using advanced tools is crucial for guiding specialized treatments, a significant need remains for risk assessment methods based on accessible, routinely collected data. Currently, the gold-standard models for prognostication in ADPKD include the Mayo Imaging Classification, which utilizes height-adjusted TKV and patient age to predict the rate of estimated glomerular filtration rate (eGFR) decline, and the PROPKD score, which integrates genetic information (<italic>PKD1</italic> vs <italic>PKD2</italic> mutation type) with early clinical manifestations [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Although these models are invaluable, their broad implementation is often hindered by their dependence on specialized and resource-intensive evaluations. 
For instance, the Mayo Classification requires magnetic resonance imaging (MRI) or computed tomography to measure TKV, while the PROPKD score necessitates comprehensive genetic sequencing. These resources can be costly and are not universally available in all clinical settings, creating a gap for more scalable screening tools.</p><p>In parallel with these clinical tools, artificial intelligence (AI) has been increasingly used in ADPKD management. AI models have been developed to predict glomerular filtration rate decline, aiding in the early identification of high-risk patients and facilitating proactive management [<xref ref-type="bibr" rid="ref12">12</xref>]. In imaging-based classifications, deep learning algorithms have been applied to automate ADPKD severity assessment, enhancing objectivity and reducing interobserver variability [<xref ref-type="bibr" rid="ref13">13</xref>]. AI has also been instrumental in TKV quantification, a crucial prognostic marker in ADPKD. Deep learning-based segmentation models have demonstrated high accuracy in automated kidney segmentation from MRI and computed tomography images, significantly reducing manual workload [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. While these advancements improve disease monitoring, they often still rely on the availability of imaging or detailed clinical data, leaving a gap for predictive models that can leverage more widely accessible administrative data to forecast hard clinical end points.</p><p>Therefore, this study aimed to develop and validate an AI-assisted model to identify significant predictors of progression to dialysis in patients with ADPKD using a nationwide administrative database. We evaluated multiple machine learning (ML) algorithms using a prespecified temporal split for model development and evaluation and summarized predictors to enhance interpretability and clinical usability. 
Our goal was to create a complementary tool for risk stratification, potentially aiding clinicians in monitoring patients and identifying those who may warrant more specialized evaluation.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Data Sources</title><p>This retrospective cohort study was based on the National Health Insurance Research Database (NHIRD), which is derived from Taiwan&#x2019;s universal compulsory health insurance system covering nearly 99% of the 23 million individuals in Taiwan since 1998 [<xref ref-type="bibr" rid="ref16">16</xref>]. The database includes patients&#x2019; hospitalization and outpatient visit records, and each individual was continuously followed. Disease diagnoses were coded according to the International Classification of Diseases, Ninth Revision, Clinical Modification (<italic>ICD-9</italic>-CM). The NHI Administration fully adopted <italic>ICD-10</italic>-CM for clinical records in 2016.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>This study was conducted in accordance with the principles of the Declaration of Helsinki and was reviewed and approved by the Ethics Review Board of Shin-Kong Wu Ho-Su Memorial Hospital (approval number 20211008R). The requirement for informed consent was waived by the review board because this study involved a secondary analysis of routinely collected administrative data, and no direct contact with individual participants occurred. The original data collection procedures and this secondary analysis were approved without the need for additional consent.</p><p>All data obtained from the NHIRD were fully deidentified prior to analysis. Personal identifiers were removed by the data holder, and the authors had no access to information that could be used to identify individual patients. 
Data access and analysis were conducted in compliance with relevant data protection regulations.</p><p>No financial or other compensation was provided to participants, as this study did not involve direct recruitment or interaction with human subjects.</p><p>The manuscript and all supplementary materials did not include any images or information that could lead to the identification of individual participants.</p></sec><sec id="s2-3"><title>Study Design and Population</title><p>We identified new-onset ADPKD cases from the Catastrophic Illness Patient Registry between 2007 and 2018. To minimize potential misclassification bias from ICD coding, we implemented stringent validation criteria for both the primary diagnosis and comorbidities. The identification of patients with ADPKD followed a 2-step process: subjects were first identified using ICD diagnostic codes, and their diagnosis was then validated against Taiwan&#x2019;s Catastrophic Illness Patient Registry. A catastrophic illness certificate requires formal review and approval by physicians, ensuring a high degree of diagnostic accuracy for our study cohort [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref19">19</xref>].</p><p>The index date was defined as the first date on which a patient met the ADPKD case definition and had validation in the Catastrophic Illness Patient Registry. Baseline predictors were ascertained during the 365-day lookback period preceding the index date.</p><p>To construct a clean incident cohort and reduce reverse causation, we excluded individuals aged below 19 years or above 85 years, those with missing core administrative information (eg, sex, age, or index date), and those with evidence of ADPKD during the 2005 to 2006 washout period. We also excluded patients with any evidence of dialysis (hemodialysis or peritoneal dialysis) before the index date and those with kidney transplantation before the index date. 
Patients were followed from the index date until initiation of dialysis, death, or December 31, 2019, whichever occurred first.</p></sec><sec id="s2-4"><title>Baseline Variables</title><p>The dataset includes a variety of demographic, clinical, and medication-related variables for individuals with ADPKD. The key demographic variables include sex and age. Clinical variables encompass a variety of diseases grouped as cerebrovascular (intracranial aneurysms, ischemic stroke, and hemorrhagic stroke), cardiovascular (hypertension, atrial fibrillation, congestive heart failure [CHF], peripheral vascular disease, arrhythmia, and ischemic heart disease), gastrointestinal (liver cirrhosis, peptic ulcer, diverticulosis, cholangitis, and acute pancreatitis), renal and urological (urinary tract infection [UTI] and acute kidney injury [AKI]), pulmonary (chronic obstructive pulmonary disease [COPD], pneumonia, and asthma), metabolic (dyslipidemia, diabetes mellitus, and gout), mental (dementia, anxiety, and depression), and other (glaucoma and anemia). 
Each comorbidity was confirmed if the corresponding diagnosis code appeared in at least 1 hospitalization record or at least 3 outpatient visit records within the 365-day lookback period preceding the index date.</p><p>Medication variables cover a broad spectrum, including antihypertensives (beta-blockers, alpha-blockers, ACEIs/ARBs, calcium channel blockers [CCBs], methyldopa, hydralazine, minoxidil, clonidine, potassium-sparing diuretics, thiazide diuretics, and loop diuretics), antidiabetic drugs (metformin, sulfonylureas, dipeptidyl peptidase-4 inhibitors, thiazolidinediones, other oral hypoglycemic agents, rapid-acting insulins, and long-acting insulins), antimetabolic agents (statins, fenofibrate, and other lipid-lowering agents), urate-lowering agents (benzbromarone, allopurinol, and febuxostat), and other medications (nonsteroidal anti-inflammatory drugs [NSAIDs], sedative hypnotics, tranexamic acid, mammalian target of rapamycin inhibitors, sodium bicarbonate, anticoagulants, antiplatelet agents, and vitamin K). As with the definition of comorbidities, we adopted a widely used and validated approach to enhance specificity. Medication variables were quantified as the cumulative number of prescription days during the 365-day lookback period preceding the index date. This approach was used to capture exposure intensity beyond a binary indicator. The specific codes used to define all comorbidities and medications are detailed in Tables S1 and S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, respectively.</p></sec><sec id="s2-5"><title>Outcome Definition and Follow-Up</title><p>The primary end point was ESRD, defined as initiation of dialysis or receipt of kidney transplantation without prior dialysis. Patients were followed from the index date until ESRD, death, or December 31, 2019, whichever occurred first. For the ML classification models, the binary outcome was ESRD by the end of follow-up (event=1). 
In the ML analysis, the label reflects whether ESRD was observed by December 31, 2019, and does not represent a fixed-horizon risk. Patients without ESRD were labeled as nonevents (event=0), including those who died before reaching ESRD.</p></sec><sec id="s2-6"><title>Data Preprocessing and Handling of Missing Data</title><p>Our strategy for handling missing data involved 2 stages. First, case-wise deletion was performed to exclude any patient records with missing core administrative data (eg, sex, age, or date of diagnosis), as indicated in the study flowchart. Second, for the final cohort, predictor variables were constructed such that no missing values remained. The absence of a record for a specific variable was treated as meaningful data rather than as a missing value. For instance, if a patient had no prescriptions for a given medication, the cumulative exposure days were coded as 0. Similarly, if a patient did not meet the predefined criteria for a comorbidity, the variable was coded as 0, indicating absence.</p></sec><sec id="s2-7"><title>Statistical Analysis</title><p>Categorical variables were presented as frequencies with percentages and compared using the chi-square test. Continuous variables were expressed as means with SDs and compared using the <italic>t</italic> test. Multivariable Cox proportional hazards regression models were used to estimate adjusted hazard ratios (HRs) and 95% CIs for the risk of dialysis initiation. A 2-tailed <italic>P</italic> value of &#x003C;.05 was considered statistically significant. All statistical analyses were performed using SAS version 9.4 (SAS Institute Inc).</p></sec><sec id="s2-8"><title>ML Model Development and Feature Selection</title><p>Given the extended accrual period, we used a temporal split to preserve chronological separation between model development and evaluation. 
Records from 2007 to 2016 (80%) were used for model training, and records from 2017 to 2018 (20%) were reserved as an independent held-out test set for performance assessment.</p><p>Within the training set, we performed 10-fold cross-validation to improve robustness and reduce overfitting. To address class imbalance, Synthetic Minority Over-sampling Technique (SMOTE) was applied only within the training folds of each cross-validation iteration to avoid information leakage into the validation folds. Model performance was evaluated on the held-out test set using accuracy, Cohen &#x03BA;, sensitivity, specificity, area under the curve (AUC), <italic>F</italic><sub>1</sub> score, and Brier score, recognizing that multiple complementary metrics are needed under imbalanced outcome distributions.</p><p>The 6 ML algorithms were chosen to encompass a broad spectrum of modeling techniques, ranging from interpretable linear models to complex, high-performance ensembles. Logistic regression was selected as a conventional statistical method widely used in clinical research, serving as a robust and interpretable baseline for comparison. To capture complex nonlinear relationships, we included 2 distinct models: classification and regression trees, a foundational decision tree algorithm, and multivariate adaptive regression splines, a flexible model adept at identifying interactions between predictors. Finally, to leverage the superior predictive power of ensemble learning, 3 state-of-the-art algorithms were selected [<xref ref-type="bibr" rid="ref20">20</xref>]. Random forest represents the bagging method, which builds independent trees to reduce variance, whereas CatBoost and eXtreme Gradient Boosting (XGBoost) are representatives of boosting methods that construct models sequentially to correct the errors of their predecessors and often yield high accuracy. 
This comprehensive selection allowed for a thorough evaluation of predictive performance across different algorithmic families, and these methods have been successfully applied in similar medical informatics contexts [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref23">23</xref>] (see Supplementary Methods in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for detailed model descriptions). Hyperparameters for each model were optimized using random search within the training set under 10-fold cross-validation. The held-out temporal test set was used only for final performance evaluation. The specific hyperparameters for all models are detailed in Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. All model construction was conducted using Python (version 3.9; Python Software Foundation).</p><p>We employed a 2-pronged feature selection approach to identify the most significant predictors. In the first approach, each model performed feature selection based on its own internal mechanism, and its performance was evaluated using this algorithm-specific feature set. In the second approach, we constructed an overall consensus ranking of predictors using rank aggregation across the 6 algorithms. We prespecified that the best-performing algorithm would be selected based on performance on the held-out temporal test set, considering discrimination, class-imbalance&#x2013;sensitive metrics, and calibration. For the selected best-performing model, we additionally evaluated parsimony by sequentially adding predictors according to the consensus ordering and selecting the feature count that maximized test-set performance.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Characteristics of the Study Population</title><p>From the NHIRD, 2677 incident ADPKD cases were identified between 2007 and 2018. 
After applying exclusion criteria (n=821), 1856 patients were included in the final cohort (<xref ref-type="fig" rid="figure1">Figure 1</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Study flowchart of patient selection and machine learning model development. The diagram shows the patient selection process from the NHIRD for the period 2007&#x2010;2018 and the subsequent workflow for model development. Patients were split temporally into a training set (2007&#x2010;2016) and a held-out test set (2017&#x2010;2018). ESRD was ascertained through December 31, 2019. ADPKD: autosomal dominant polycystic kidney disease; CART: classification and regression trees; ESRD: end-stage renal disease; eXGB: extreme gradient boosting; LGR: logistic regression; MARS: multivariate adaptive regression splines; ML: machine learning; RF: random forest.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e80343_fig01.png"/></fig><p><xref ref-type="table" rid="table1">Table 1</xref> summarizes baseline characteristics assessed during the 365-day lookback period preceding the index date. During follow-up through December 31, 2019, 302 patients (302/1856, 16.27%) initiated dialysis. Kidney transplantation without prior dialysis was observed in only 2 patients. Due to small cell size restrictions intended to protect patient privacy in the NHIRD data release process, transplantation events could not be analyzed separately; therefore, ESRD outcomes are presented primarily in terms of dialysis initiation. 
The remaining 1554 patients (1554/1856, 83.73%) did not initiate dialysis and were censored at death or end of follow-up.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Baseline characteristics of the cohort stratified by dialysis initiation during follow-up.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Baseline characteristic</td><td align="left" valign="bottom">Autosomal dominant PKD<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> (n=1856)</td><td align="left" valign="bottom" colspan="2">Dialysis initiation during follow-up</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom"/><td align="left" valign="bottom">Yes</td><td align="left" valign="bottom">No</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4">Sex, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">1006 (54.20)</td><td align="left" valign="top">168 (55.63)</td><td align="left" valign="top">838 (53.93)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">850 (45.80)</td><td align="left" valign="top">134 (44.37)</td><td align="left" valign="top">716 (46.07)</td></tr><tr><td align="left" valign="top" colspan="4">Age group (y), n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2264;40</td><td align="left" valign="top">687 (37.02)</td><td align="left" valign="top">56 (18.54)</td><td align="left" valign="top">631 (40.60)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>41&#x2010;55</td><td align="left" valign="top">754 (40.63)</td><td align="left" valign="top">152 
(50.33)</td><td align="left" valign="top">602 (38.74)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>56&#x2010;65</td><td align="left" valign="top">265 (14.28)</td><td align="left" valign="top">56 (18.54)</td><td align="left" valign="top">209 (13.45)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2265;66</td><td align="left" valign="top">150 (8.08)</td><td align="left" valign="top">38 (12.58)</td><td align="left" valign="top">112 (7.21)</td></tr><tr><td align="left" valign="top">Age, mean (SD)</td><td align="left" valign="top">45.85 (13.35)</td><td align="left" valign="top">50.94 (11.94)</td><td align="left" valign="top">44.86 (13.39)</td></tr><tr><td align="left" valign="top" colspan="4">CCI<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> group, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1&#x2010;2</td><td align="left" valign="top">1014 (54.63)</td><td align="left" valign="top">72 (23.84)</td><td align="left" valign="top">942 (60.62)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3&#x2010;5</td><td align="left" valign="top">660 (35.56)</td><td align="left" valign="top">168 (55.63)</td><td align="left" valign="top">492 (31.66)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>6+</td><td align="left" valign="top">182 (9.81)</td><td align="left" valign="top">62 (20.53)</td><td align="left" valign="top">120 (7.72)</td></tr><tr><td align="left" valign="top">CCI scores, mean (SD)</td><td align="left" valign="top">2.58 (2.34)</td><td align="left" valign="top">4.18 (2.27)</td><td align="left" valign="top">2.27 (2.22)</td></tr><tr><td align="left" 
valign="top" colspan="4">Underlying disease, n (%)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cerebrovascular diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Intracranial aneurysms</td><td align="left" valign="top">20 (1.08)</td><td align="left" valign="top">4 (1.32)</td><td align="left" valign="top">16 (1.03)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ischemic stroke</td><td align="left" valign="top">51 (2.75)</td><td align="left" valign="top">11 (3.64)</td><td align="left" valign="top">40 (2.57)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hemorrhagic stroke</td><td align="left" valign="top">91 (4.90)</td><td align="left" valign="top">27 (8.94)</td><td align="left" valign="top">64 (4.12)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cardiovascular diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hypertension</td><td align="left" valign="top">1164 (62.72)</td><td align="left" valign="top">203 (67.22)</td><td align="left" valign="top">961 (61.84)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AF<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">34 (1.83)</td><td align="left" valign="top">15 (4.97)</td><td align="left" valign="top">19 (1.22)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CHF<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">178 (9.59)</td><td align="left" valign="top">77 (25.50)</td><td align="left" valign="top">101 (6.50)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PVD<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup></td><td align="left" valign="top">71 (3.83)</td><td align="left" valign="top">26 (8.61)</td><td align="left" valign="top">45 (2.90)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Arrhythmia</td><td align="left" valign="top">214 (11.53)</td><td align="left" valign="top">69 (22.85)</td><td align="left" valign="top">145 (9.33)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ischemic heart disease</td><td align="left" valign="top">344 (18.53)</td><td align="left" valign="top">105 (34.77)</td><td align="left" valign="top">239 (15.38)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gastrointestinal 
diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Liver cirrhosis</td><td align="left" valign="top">33 (1.78)</td><td align="left" valign="top">14 (4.64)</td><td align="left" valign="top">19 (1.22)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Peptic ulcer bleeding</td><td align="left" valign="top">84 (4.53)</td><td align="left" valign="top">25 (8.28)</td><td align="left" valign="top">59 (3.80)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Diverticulosis</td><td align="left" valign="top">32 (1.72)</td><td align="left" valign="top">10 (3.31)</td><td align="left" valign="top">22 (1.42)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cholangitis</td><td align="left" valign="top">39 (2.10)</td><td align="left" valign="top">16 (5.30)</td><td align="left" valign="top">23 (1.48)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Acute pancreatitis</td><td align="left" valign="top">41 (2.21)</td><td align="left" valign="top">20 (6.62)</td><td align="left" valign="top">21 (1.35)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Renal and urological 
diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>UTI<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="top">938 (50.54)</td><td align="left" valign="top">196 (64.90)</td><td align="left" valign="top">742 (47.57)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AKI<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></td><td align="left" valign="top">173 (9.32)</td><td align="left" valign="top">71 (23.51)</td><td align="left" valign="top">102 (6.56)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lung diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>COPD<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup></td><td align="left" valign="top">319 (17.19)</td><td align="left" valign="top">71 (23.51)</td><td align="left" valign="top">248 (15.96)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Pneumonia</td><td align="left" valign="top">543 (29.26)</td><td align="left" valign="top">121 (40.07)</td><td align="left" valign="top">422 (27.16)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Asthma</td><td 
align="left" valign="top">207 (11.15)</td><td align="left" valign="top">31 (10.26)</td><td align="left" valign="top">176 (11.33)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Metabolic diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dyslipidemia</td><td align="left" valign="top">706 (38.04)</td><td align="left" valign="top">124 (41.06)</td><td align="left" valign="top">582 (37.45)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DM<sup><xref ref-type="table-fn" rid="table1fn9">i</xref></sup></td><td align="left" valign="top">277 (14.92)</td><td align="left" valign="top">73 (24.17)</td><td align="left" valign="top">204 (13.13)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gout</td><td align="left" valign="top">427 (23.01)</td><td align="left" valign="top">122 (40.40)</td><td align="left" valign="top">305 (19.63)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mental diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dementia</td><td align="left" valign="top">47 (2.53)</td><td align="left" valign="top">15 (4.97)</td><td align="left" valign="top">32 (2.06)</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Anxiety</td><td align="left" valign="top">321 (17.30)</td><td align="left" valign="top">62 (20.53)</td><td align="left" valign="top">259 (16.67)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Depression</td><td align="left" valign="top">250 (13.47)</td><td align="left" valign="top">46 (15.23)</td><td align="left" valign="top">204 (13.13)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Others</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Glaucoma</td><td align="left" valign="top">88 (4.74)</td><td align="left" valign="top">18 (5.96)</td><td align="left" valign="top">70 (4.50)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Anemia</td><td align="left" valign="top">461 (24.84)</td><td align="left" valign="top">199 (65.89)</td><td align="left" valign="top">262 (16.86)</td></tr><tr><td align="left" valign="top" colspan="4">Medication, mean days of use during the 365-day pre-index period (SD)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Antihypertension</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Beta-blockers</td><td align="left" valign="top">95.85 (107.05)</td><td align="left" valign="top">92.24 (91.14)</td><td align="left" valign="top">97.15 (112.30)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Alpha-blockers</td><td align="left" valign="top">94.40 (106.66)</td><td align="left" valign="top">101.10 (107.30)</td><td align="left" valign="top">90.89 (106.30)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ACEI<sup><xref ref-type="table-fn" rid="table1fn10">j</xref></sup>/ARB<sup><xref ref-type="table-fn" rid="table1fn11">k</xref></sup></td><td align="left" valign="top">160.11 (132.18)</td><td align="left" valign="top">130.10 (102.30)</td><td align="left" valign="top">167.30 (137.50)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CCB<sup><xref ref-type="table-fn" rid="table1fn12">l</xref></sup></td><td align="left" valign="top">157.80 (136.36)</td><td align="left" valign="top">162.20 (122)</td><td align="left" valign="top">156.50 (140.40)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Methyldopa</td><td align="left" valign="top">26.79 (37.29)</td><td align="left" valign="top">17.97 (28.55)</td><td align="left" valign="top">31.61 (41.78)</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hydralazine</td><td align="left" valign="top">51.68 (65.70)</td><td align="left" valign="top">46.13 (60.99)</td><td align="left" valign="top">56.27 (69.50)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Minoxidil</td><td align="left" valign="top">53.04 (70.99)</td><td align="left" valign="top">43.11 (51.21)</td><td align="left" valign="top">68.30 (94.18)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Clonidine</td><td align="left" valign="top">41.69 (49.51)</td><td align="left" valign="top">42.35 (38)</td><td align="left" valign="top">40.92 (61.88)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Potassium-sparing diuretics</td><td align="left" valign="top">54.94 (83.58)</td><td align="left" valign="top">31.52 (68.85)</td><td align="left" valign="top">60.38 (85.97)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Thiazide diuretics</td><td align="left" valign="top">66.84 (83.42)</td><td align="left" valign="top">45.18 (67.33)</td><td align="left" valign="top">73.30 (86.68)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Loop diuretics</td><td align="left" valign="top">59.35 (94.95)</td><td align="left" valign="top">60.11 (84.12)</td><td align="left" valign="top">58.75 (102.70)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Antidiabetic</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Metformin</td><td align="left" valign="top">122.29 (122.92)</td><td align="left" valign="top">44.17 (43.31)</td><td align="left" valign="top">130.20 (125.70)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sulfonylureas</td><td align="left" valign="top">130.89 (120.83)</td><td align="left" valign="top">103.20 (117.20)</td><td align="left" valign="top">137.30 (121.40)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DPP4i<sup><xref ref-type="table-fn" rid="table1fn13">m</xref></sup></td><td align="left" valign="top">120.03 (101.88)</td><td align="left" valign="top">100.40 (103)</td><td align="left" valign="top">125 (101.50)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other oral hypoglycemic agents</td><td align="left" valign="top">92.69 (102.37)</td><td align="left" valign="top">113.50 (126.70)</td><td align="left" valign="top">82.84 (88.87)</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Rapid-acting insulins</td><td align="left" valign="top">14.71 (49.95)</td><td align="left" valign="top">2.12 (8.94)</td><td align="left" valign="top">27.31 (68.23)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Long-acting insulins</td><td align="left" valign="top">100.09 (88.53)</td><td align="left" valign="top">130 (109.90)</td><td align="left" valign="top">84.26 (73.73)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Antimetabolic</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Statin</td><td align="left" valign="top">121.32 (111.87)</td><td align="left" valign="top">124.60 (118.10)</td><td align="left" valign="top">120.60 (110.50)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Fenofibrate</td><td align="left" valign="top">57.96 (72.62)</td><td align="left" valign="top">56.79 (81.12)</td><td align="left" valign="top">58.42 (69.38)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other lipid-lowering agents</td><td align="left" valign="top">75.24 (90.44)</td><td align="left" valign="top">6.19 (2.38)</td><td align="left" valign="top">92.50 (93.65)</td></tr><tr><td 
align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Urate-lowering agents</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Benzbromarone</td><td align="left" valign="top">65.45 (79.37)</td><td align="left" valign="top">41.72 (49.69)</td><td align="left" valign="top">71.38 (84.22)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Allopurinol</td><td align="left" valign="top">82.52 (97.02)</td><td align="left" valign="top">78.39 (84.91)</td><td align="left" valign="top">85.45 (105)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Febuxostat</td><td align="left" valign="top">104.04 (101.03)</td><td align="left" valign="top">92.67 (79.03)</td><td align="left" valign="top">108.20 (107.80)</td></tr><tr><td align="left" valign="top" colspan="4"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>NSAID<sup><xref ref-type="table-fn" rid="table1fn14">n</xref></sup></td><td align="left" valign="top">15.76 (34.22)</td><td align="left" valign="top">15.69 (29.67)</td><td align="left" valign="top">15.78 (35.12)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sedative hypnotics</td><td align="left" valign="top">92.03 (158.68)</td><td align="left" valign="top">118.70 (188.30)</td><td align="left" valign="top">83.81 (147.50)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Tranexamic acid</td><td align="left" valign="top">5.05 (16.89)</td><td align="left" valign="top">6.59 (11.14)</td><td align="left" valign="top">4.59 (18.24)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>mTOR<sup><xref ref-type="table-fn" rid="table1fn15">o</xref></sup> inhibitors</td><td align="left" valign="top">135.14 (148.87)</td><td align="left" valign="top">127.80 (140.60)</td><td align="left" valign="top">144 (174.70)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Sodium bicarbonate</td><td align="left" valign="top">9.50 (42.61)</td><td align="left" valign="top">20.52 (46.30)</td><td align="left" valign="top">7.25 (41.48)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Anticoagulants</td><td align="left" valign="top">110.46 (155.24)</td><td align="left" valign="top">113.10 (190.60)</td><td align="left" valign="top">109 (132.20)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Antiplatelet agents</td><td align="left" valign="top">211.22 (251.64)</td><td align="left" valign="top">204.20 (228.70)</td><td align="left" valign="top">214.30 (261.10)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Vitamin K</td><td align="left" valign="top">57.41 (91.58)</td><td align="left" valign="top">19.86 (43.90)</td><td align="left" valign="top">107.50 (114.30)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>PKD: polycystic kidney disease.</p></fn><fn id="table1fn2"><p><sup>b</sup>CCI: Charlson Comorbidity Index.</p></fn><fn id="table1fn3"><p><sup>c</sup>AF: atrial fibrillation.</p></fn><fn id="table1fn4"><p><sup>d</sup>CHF: congestive heart failure.</p></fn><fn id="table1fn5"><p><sup>e</sup>PVD: peripheral vascular disease.</p></fn><fn id="table1fn6"><p><sup>f</sup>UTI: urinary tract infection.</p></fn><fn id="table1fn7"><p><sup>g</sup>AKI: acute kidney injury.</p></fn><fn id="table1fn8"><p><sup>h</sup>COPD: chronic obstructive pulmonary disease.</p></fn><fn id="table1fn9"><p><sup>i</sup>DM: diabetes mellitus.</p></fn><fn id="table1fn10"><p><sup>j</sup>ACEI: angiotensin-converting enzyme inhibitor.</p></fn><fn id="table1fn11"><p><sup>k</sup>ARB: angiotensin II receptor blocker.</p></fn><fn id="table1fn12"><p><sup>l</sup>CCB: calcium channel blocker.</p></fn><fn id="table1fn13"><p><sup>m</sup>DPP4i: dipeptidyl peptidase-4 inhibitor.</p></fn><fn id="table1fn14"><p><sup>n</sup>NSAID: nonsteroidal anti-inflammatory drug.</p></fn><fn id="table1fn15"><p><sup>o</sup>mTOR: mechanistic target of rapamycin.</p></fn></table-wrap-foot></table-wrap><p>At baseline, the cohort had substantial cardiorenal comorbidity and medication use. 
The most prevalent comorbidities were hypertension (86.58%, 1606/1856) and UTI (50.38%, 935/1856), with pneumonia (29.26%, 543/1856), anemia (24.84%, 461/1856), and gout (23.01%, 427/1856) also common. Antihypertensive exposure was widespread (ACEI/ARB 161.30, SD 127.50 d; CCB 160.90, SD 133.70 d), and metabolic therapy was frequent (metformin 116.20, SD 137.10 d; long-acting insulin 91.71, SD 139.10 d).</p><p>Stratification by subsequent dialysis initiation highlighted clinically meaningful differences in baseline disease severity and management. Patients who later initiated dialysis were older (50.94, SD 11.94 vs 44.86, SD 13.39 y) and had higher comorbidity burden (Charlson Comorbidity Index [CCI] 4.18, SD 2.27 vs 2.27, SD 2.22; CCI&#x2265;6: 20.53% vs 7.72%), with the largest separations for anemia (65.89% vs 16.86%) and AKI (23.51% vs 6.56%). Baseline medication patterns were consistent with greater clinical complexity in the dialysis group, including lower metformin exposure (44.17, SD 95.41 vs 130.20, SD 148 d) and higher sodium bicarbonate exposure (20.52, SD 68.46 vs 7.25, SD 44.30 d).</p></sec><sec id="s3-2"><title>Risk Analysis for Progression to Dialysis</title><p><xref ref-type="table" rid="table2">Table 2</xref> presents the multivariable Cox regression results. After adjustment for sex, age category, CCI category, and comorbidities, male sex was associated with a higher risk of dialysis initiation (aHR 1.55, 95% CI 1.13&#x2010;2.11; <italic>P</italic>=.006). Age remained a strong predictor: compared with the reference group aged 40 years or younger, the risk increased progressively across older age categories (aHR 3.01 for 41&#x2010;55 years, 4.13 for 56&#x2010;65 years, and 4.63 for &#x2265;66 years; all <italic>P</italic>&#x003C;.001). Among comorbidities, anemia showed the strongest association with dialysis initiation (aHR 4.33, 95% CI 3.25&#x2010;5.78; <italic>P</italic>&#x003C;.001). Congestive heart failure, AKI, and gout were also associated with a higher risk. 
Hypertension, COPD, and anxiety were associated with lower hazard in the adjusted model.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Risk for entering dialysis in the patients with ADPKD<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom" colspan="2">Cox model</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">aHR<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> (95% CI)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="3">Sex</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ref=Female</td><td align="left" valign="top">1</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">1.55 (1.13&#x2010;2.11)</td><td align="left" valign="top">.006</td></tr><tr><td align="left" valign="top" colspan="3">Age group</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ref=&#x2264;40</td><td align="left" valign="top">1</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>41&#x2010;55</td><td align="left" valign="top">3.01 (2.12&#x2010;4.30)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="char" char="." 
valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>56&#x2010;65</td><td align="left" valign="top">4.13 (2.63&#x2010;6.50)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2265;66</td><td align="left" valign="top">4.63 (2.71&#x2010;7.92)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="3">CCI<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup> group</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ref=1&#x2010;2</td><td align="left" valign="top">1</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3&#x2010;5</td><td align="left" valign="top">1.42 (1.01&#x2010;1.98)</td><td align="left" valign="top">.04</td></tr><tr><td align="char" char="plus" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>6+</td><td align="left" valign="top">1.28 (0.74&#x2010;2.21)</td><td align="left" valign="top">.39</td></tr><tr><td align="left" valign="top" colspan="3">Underlying disease</td></tr><tr><td align="left" valign="top" colspan="3"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cerebrovascular diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Intracranial aneurysms</td><td align="left" valign="top">2.12 (0.71&#x2010;6.31)</td><td align="left" valign="top">.18</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ischemic stroke</td><td align="left" valign="top">1.22 (0.59&#x2010;2.49)</td><td align="left" valign="top">.59</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hemorrhagic stroke</td><td align="left" valign="top">1.03 (0.57&#x2010;1.86)</td><td align="left" valign="top">.91</td></tr><tr><td align="left" valign="top" colspan="3"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cardiovascular diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hypertension</td><td align="left" valign="top">0.70 (0.53&#x2010;0.94)</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AF<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup></td><td align="left" valign="top">0.66 (0.32&#x2010;1.32)</td><td align="left" valign="top">.24</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CHF<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup></td><td align="left" valign="top">1.81 (1.29&#x2010;2.54)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>PVD<sup><xref ref-type="table-fn" 
rid="table2fn7">g</xref></sup></td><td align="left" valign="top">1.25 (0.79&#x2010;2.00)</td><td align="left" valign="top">.34</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Arrhythmia</td><td align="left" valign="top">0.98 (0.69&#x2010;1.40)</td><td align="left" valign="top">.92</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ischemic heart disease</td><td align="left" valign="top">1.09 (0.80&#x2010;1.48)</td><td align="left" valign="top">.58</td></tr><tr><td align="left" valign="top" colspan="3"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gastrointestinal diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Liver cirrhosis</td><td align="left" valign="top">0.91 (0.48&#x2010;1.72)</td><td align="left" valign="top">.77</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Peptic ulcer bleeding</td><td align="left" valign="top">0.67 (0.42&#x2010;1.09)</td><td align="left" valign="top">.11</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Diverticulosis</td><td align="left" valign="top">0.82 (0.38&#x2010;1.79)</td><td align="left" valign="top">.62</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cholangitis</td><td align="left" valign="top">1.10 (0.61&#x2010;1.96)</td><td align="left" valign="top">.76</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Acute pancreatitis</td><td align="left" valign="top">1.18 (0.69&#x2010;2.04)</td><td align="left" valign="top">.55</td></tr><tr><td align="left" valign="top" colspan="3"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Renal and urological diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>UTI<sup><xref ref-type="table-fn" rid="table2fn8">h</xref></sup></td><td align="left" valign="top">0.84 (0.62&#x2010;1.14)</td><td align="left" valign="top">.26</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AKI<sup><xref ref-type="table-fn" rid="table2fn9">i</xref></sup></td><td align="left" valign="top">1.69 (1.19&#x2010;2.41)</td><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top" colspan="3"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Respiratory diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>COPD<sup><xref ref-type="table-fn" rid="table2fn10">j</xref></sup></td><td align="left" valign="top">0.61 (0.44&#x2010;0.86)</td><td align="left" valign="top">.005</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Pneumonia</td><td align="left" valign="top">0.86 (0.65&#x2010;1.12)</td><td align="left" valign="top">.26</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Asthma</td><td align="left" valign="top">0.74 (0.47&#x2010;1.15)</td><td align="left" valign="top">.18</td></tr><tr><td align="left" valign="top" colspan="3"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Metabolic diseases</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dyslipidemia</td><td align="left" valign="top">0.78 (0.51&#x2010;1.01)</td><td align="left" valign="top">.12</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DM<sup><xref ref-type="table-fn" rid="table2fn11">k</xref></sup></td><td align="left" valign="top">1.38 (0.97&#x2010;1.96)</td><td align="left" valign="top">.07</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gout</td><td align="left" valign="top">1.49 (1.08&#x2010;2.05)</td><td align="left" valign="top">.01</td></tr><tr><td align="left" valign="top" colspan="3"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mental diseases</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dementia</td><td align="left" valign="top">0.71 (0.37&#x2010;1.34)</td><td align="left" valign="top">.29</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Anxiety</td><td align="left" valign="top">0.53 (0.34&#x2010;0.82)</td><td align="left" valign="top">.004</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Depression</td><td align="left" valign="top">1.33 (0.82&#x2010;2.16)</td><td align="left" valign="top">.26</td></tr><tr><td align="left" valign="top" colspan="3"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Others</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Glaucoma</td><td align="left" valign="top">1.02 (0.60&#x2010;1.74)</td><td align="left" valign="top">.93</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Anemia</td><td align="left" valign="top">4.33 (3.25&#x2010;5.78)</td><td align="left" valign="top">&#x003C;.001</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>ADPKD: autosomal dominant polycystic kidney disease.</p></fn><fn id="table2fn2"><p><sup>b</sup>aHR: adjusted hazard ratio.</p></fn><fn id="table2fn3"><p><sup>c</sup>Not applicable.</p></fn><fn id="table2fn4"><p><sup>d</sup>CCI: 
Charlson Comorbidity Index.</p></fn><fn id="table2fn5"><p><sup>e</sup>AF: atrial fibrillation.</p></fn><fn id="table2fn6"><p><sup>f</sup>CHF: congestive heart failure.</p></fn><fn id="table2fn7"><p><sup>g</sup>PVD: peripheral vascular disease.</p></fn><fn id="table2fn8"><p><sup>h</sup>UTI: urinary tract infection.</p></fn><fn id="table2fn9"><p><sup>i</sup>AKI: acute kidney injury.</p></fn><fn id="table2fn10"><p><sup>j</sup>COPD: chronic obstructive pulmonary disease.</p></fn><fn id="table2fn11"><p><sup>k</sup>DM: diabetes mellitus.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>Feature Importance Across ML Models</title><p><xref ref-type="fig" rid="figure2">Figure 2</xref> presents the relative importance of variables in predicting dialysis risk, as determined by the 6 ML models. A consensus emerged across the different algorithms, highlighting several key predictors. The top-ranked predictors spanned comorbidity burden and medication patterns, including anticoagulant use, hypertension, CCB use, higher CCI category, loop diuretics, sodium bicarbonate, anemia, and ACEI or ARB use, together with age and sex. Additional contributors included cardiorespiratory comorbidities, UTI, gout, and neuropsychiatric conditions and related medications.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Overall consensus feature ranking aggregated across 6 machine learning algorithms. Predictors were ranked within each algorithm using the model&#x2019;s native importance criterion; standardized ranks were then aggregated to generate an overall consensus ranking. 
ACEI: angiotensin-converting enzyme inhibitor; AF: atrial fibrillation; ARB: angiotensin II receptor blocker; CCB: calcium channel blocker; CCI: Charlson Comorbidity Index; COPD: chronic obstructive pulmonary disease; DM: diabetes mellitus; NSAID: nonsteroidal anti-inflammatory drug; PVD: peripheral vascular disease; UTI: urinary tract infection.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e80343_fig02.png"/></fig></sec><sec id="s3-4"><title>Performance Comparison of ML Models</title><p><xref ref-type="table" rid="table3">Table 3</xref> summarizes performance for 6 ML algorithms under 2 feature selection strategies: model-specific feature selection and a consensus feature set derived from rank aggregation. Using model-specific feature selection, XGBoost achieved the highest accuracy (0.9748) with specificity of 1, with an AUC of 0.9436 and a Brier score of 0.0254. Using the consensus feature set, performance improved across models. 
XGBoost achieved the highest accuracy (0.9832) and <italic>F</italic><sub>1</sub>-score (0.8), whereas MARS achieved the highest AUC (0.9762) and CatBoost achieved the lowest Brier score (0.0217), indicating strong discrimination with favorable calibration across top-performing models.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>The model predictions with six different machine learning algorithms.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Methods</td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom">Kappa</td><td align="left" valign="bottom">Sensitivity</td><td align="left" valign="bottom">Specificity</td><td align="left" valign="bottom">AUC<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="bottom">Brier score</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="8">Variables selected by its own algorithm</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LGR<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td><td align="left" valign="top">0.9034</td><td align="left" valign="top">0.2552</td><td align="left" valign="top">0.4167</td><td align="left" valign="top">0.9292</td><td align="left" valign="top">0.7806</td><td align="left" valign="top">0.303</td><td align="left" valign="top">0.0771</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>RF<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="top">0.9580</td><td align="left" valign="top">0.4790</td><td align="left" valign="top">0.4167</td><td align="left" valign="top">0.9867</td><td align="left" valign="top">0.9338</td><td align="left" valign="top">0.500</td><td 
align="left" valign="top">0.0352</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MARS<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="left" valign="top">0.9664</td><td align="left" valign="top">0.6189</td><td align="left" valign="top">0.5833</td><td align="left" valign="top">0.9867</td><td align="left" valign="top">0.9558</td><td align="left" valign="top">0.6364</td><td align="left" valign="top">0.0260</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CART<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="left" valign="top">0.9202</td><td align="left" valign="top">0.3037</td><td align="left" valign="top">0.4167</td><td align="left" valign="top">0.9469</td><td align="left" valign="top">0.9023</td><td align="left" valign="top">0.3448</td><td align="left" valign="top">0.0588</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>XGBoost<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="top">0.9748</td><td align="left" valign="top">0.6551</td><td align="left" valign="top">0.5000</td><td align="left" valign="top">1</td><td align="left" valign="top">0.9436</td><td align="left" valign="top">0.6667</td><td align="left" valign="top">0.0254</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CatBoost</td><td align="left" valign="top">0.9622</td><td align="left" valign="top">0.5521</td><td align="left" valign="top">0.5000</td><td align="left" valign="top">0.9867</td><td align="left" valign="top">0.9672</td><td align="left" valign="top">0.5714</td><td align="left" valign="top">0.0245</td></tr><tr><td align="left" valign="top" colspan="8">Variables selected based on the average 
results from six ML algorithms.</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LGR</td><td align="left" valign="top">0.9496</td><td align="left" valign="top">0.4735</td><td align="left" valign="top">0.5000</td><td align="left" valign="top">0.9735</td><td align="left" valign="top">0.9288</td><td align="left" valign="top">0.5000</td><td align="left" valign="top">0.0557</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>RF</td><td align="left" valign="top">0.9706</td><td align="left" valign="top">0.6174</td><td align="left" valign="top">0.5000</td><td align="left" valign="top">0.9956</td><td align="left" valign="top">0.9611</td><td align="left" valign="top">0.6316</td><td align="left" valign="top">0.0302</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MARS</td><td align="left" valign="top">0.9790</td><td align="left" valign="top">0.7512</td><td align="left" valign="top">0.6667</td><td align="left" valign="top">0.9956</td><td align="left" valign="top">0.9762</td><td align="left" valign="top">0.7619</td><td align="left" valign="top">0.0232</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CART</td><td align="left" valign="top">0.9454</td><td align="left" valign="top">0.4899</td><td align="left" valign="top">0.5833</td><td align="left" valign="top">0.9646</td><td align="left" valign="top">0.9399</td><td align="left" valign="top">0.5185</td><td align="left" valign="top">0.060</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>XGBoost</td><td align="left" valign="top">0.9832</td><td align="left" valign="top">0.7916</td><td align="left" valign="top">0.6667</td><td align="left" 
valign="top">1</td><td align="left" valign="top">0.9546</td><td align="left" valign="top">0.8000</td><td align="left" valign="top">0.0219</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CatBoost</td><td align="left" valign="top">0.9790</td><td align="left" valign="top">0.7512</td><td align="left" valign="top">0.6667</td><td align="left" valign="top">0.9956</td><td align="left" valign="top">0.9676</td><td align="left" valign="top">0.7619</td><td align="left" valign="top">0.0217</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>AUC: area under the curve.</p></fn><fn id="table3fn2"><p><sup>b</sup>LGR: logistic regression.</p></fn><fn id="table3fn3"><p><sup>c</sup>RF: random forest.</p></fn><fn id="table3fn4"><p><sup>d</sup>MARS: multivariate adaptive regression splines.</p></fn><fn id="table3fn5"><p><sup>e</sup>CART: classification and regression trees.</p></fn><fn id="table3fn6"><p><sup>f</sup>XGBoost: extreme gradient boosting.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-5"><title>Optimization of the XGBoost Model via Feature Selection</title><p><xref ref-type="fig" rid="figure3">Figure 3</xref> shows the change in test set accuracy as top-ranked predictors from the consensus ranking were sequentially added to the XGBoost model. Accuracy increased rapidly as the highest-ranked predictors were included and reached its maximum with 27 predictors. This feature count was selected as the optimal balance between parsimony and predictive performance, and the 27-feature set was used for the final XGBoost model.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Optimization of extreme gradient boosting model performance by sequential feature addition. The plot shows the change in model accuracy (y-axis) as the number of top-ranked predictor variables (x-axis) increases. 
The dashed vertical line indicates the point at which maximum accuracy was achieved with 27 variables.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v14i1e80343_fig03.png"/></fig></sec><sec id="s3-6"><title>Key Predictors in the Final XGBoost Model</title><p>The final XGBoost model used 27 baseline predictors selected during feature optimization (<xref ref-type="table" rid="table4">Table 4</xref>). This set included demographic and comorbidity burden measures (age, sex, and CCI category), major clinical conditions linked to renal risk or frailty (anemia, hypertension, ischemic heart disease, gout, pneumonia, COPD, UTI, anxiety, and depression), and multiple medication exposures. Key medication predictors included antihypertensive classes (ACEI or ARB, CCB, beta-blockers, and alpha-blockers), agents reflecting advanced renal management or metabolic status (loop diuretics, sodium bicarbonate, potassium-sparing diuretics, and rapid-acting insulin), and medications that may relate to underlying diseases (anticoagulants, antiplatelet agents, NSAIDs, sedative hypnotics, tranexamic acid, febuxostat, and statins). It is crucial to note that these medication-related predictors should be interpreted as proxies for underlying disease severity and complexity (ie, confounding by indication), rather than as direct causal risk factors.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>The variables selected for the best accuracy result in XGBoost. 
The rank is the average ranking from the average results of LGR<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup>, RF<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup>, MARS<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup>, CART<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup>, XGBoost<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup>, and CatBoost.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Rank</td><td align="left" valign="bottom">Variable</td></tr></thead><tbody><tr><td align="left" valign="top">1</td><td align="left" valign="top">Age</td></tr><tr><td align="left" valign="top">2</td><td align="left" valign="top">CCI<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup> scores</td></tr><tr><td align="left" valign="top">3</td><td align="left" valign="top">Anticoagulants</td></tr><tr><td align="left" valign="top">4</td><td align="left" valign="top">Loop diuretics</td></tr><tr><td align="left" valign="top">5</td><td align="left" valign="top">Alpha-blockers</td></tr><tr><td align="left" valign="top">6</td><td align="left" valign="top">NSAID<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td></tr><tr><td align="left" valign="top">7</td><td align="left" valign="top">Sex</td></tr><tr><td align="left" valign="top">8</td><td align="left" valign="top">CCB<sup><xref ref-type="table-fn" rid="table4fn8">h</xref></sup></td></tr><tr><td align="left" valign="top">9</td><td align="left" valign="top">Sedative hypnotics</td></tr><tr><td align="left" valign="top">10</td><td align="left" valign="top">Anemia</td></tr><tr><td align="left" valign="top">11</td><td align="left" valign="top">ACEI<sup><xref ref-type="table-fn" rid="table4fn9">i</xref></sup>/ARB<sup><xref ref-type="table-fn" rid="table4fn10">j</xref></sup></td></tr><tr><td align="left" valign="top">12</td><td align="left" valign="top">Hypertension</td></tr><tr><td align="left" 
valign="top">13</td><td align="left" valign="top">Gout</td></tr><tr><td align="left" valign="top">14</td><td align="left" valign="top">Tranexamic acid</td></tr><tr><td align="char" char="." valign="top">15</td><td align="left" valign="top">Febuxostat</td></tr><tr><td align="char" char="." valign="top">16</td><td align="left" valign="top">Ischemic heart disease</td></tr><tr><td align="char" char="." valign="top">17</td><td align="left" valign="top">Statin</td></tr><tr><td align="char" char="." valign="top">18</td><td align="left" valign="top">Antiplatelet agents</td></tr><tr><td align="char" char="." valign="top">19</td><td align="left" valign="top">Beta-blockers</td></tr><tr><td align="char" char="." valign="top">20</td><td align="left" valign="top">Pneumonia</td></tr><tr><td align="char" char="." valign="top">21</td><td align="left" valign="top">Sodium bicarbonate</td></tr><tr><td align="char" char="." valign="top">22</td><td align="left" valign="top">Potassium-sparing diuretics</td></tr><tr><td align="char" char="." valign="top">23</td><td align="left" valign="top">Rapid-acting insulins</td></tr><tr><td align="char" char="." valign="top">24</td><td align="left" valign="top">Anxiety</td></tr><tr><td align="char" char="." valign="top">25</td><td align="left" valign="top">COPD<sup><xref ref-type="table-fn" rid="table4fn11">k</xref></sup></td></tr><tr><td align="char" char="." valign="top">26</td><td align="left" valign="top">Depression</td></tr><tr><td align="char" char="." 
valign="top">27</td><td align="left" valign="top">UTI<sup><xref ref-type="table-fn" rid="table4fn12">l</xref></sup></td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>LGR: logistic regression.</p></fn><fn id="table4fn2"><p><sup>b</sup>RF: random forest.</p></fn><fn id="table4fn3"><p><sup>c</sup>MARS: multivariate adaptive regression splines.</p></fn><fn id="table4fn4"><p><sup>d</sup>CART: classification and regression trees.</p></fn><fn id="table4fn5"><p><sup>e</sup>XGBoost: extreme gradient boosting.</p></fn><fn id="table4fn6"><p><sup>f</sup>CCI: Charlson Comorbidity Index.</p></fn><fn id="table4fn7"><p><sup>g</sup>NSAID: nonsteroidal anti-inflammatory drug.</p></fn><fn id="table4fn8"><p><sup>h</sup>CCB: calcium channel blocker.</p></fn><fn id="table4fn9"><p><sup>i</sup>ACEI: angiotensin-converting enzyme inhibitors.</p></fn><fn id="table4fn10"><p><sup>j</sup>ARB: angiotensin receptor blocker.</p></fn><fn id="table4fn11"><p><sup>k</sup>COPD: chronic obstructive pulmonary disease.</p></fn><fn id="table4fn12"><p><sup>l</sup>UTI: urinary tract infection.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This retrospective cohort study used data from the NHIRD to predict ESRD progression in ADPKD using 6 ML algorithms, with ESRD operationalized as initiation of maintenance dialysis. On the held-out temporal test set, XGBoost demonstrated the best overall performance after feature optimization (accuracy 0.9832; <italic>F</italic><sub>1</sub> score 0.8). The final optimized XGBoost model was derived by sequentially adding top-ranked predictors and achieved peak accuracy with 27 variables. 
The most informative predictors reflected underlying disease severity and care intensity, including age, CCI, anemia, hypertension, ischemic heart disease, gout, pneumonia, COPD, UTI, anxiety, and depression, as well as medication exposures such as anticoagulants, loop diuretics, ACEI/ARB, CCB, and febuxostat.</p></sec><sec id="s4-2"><title>Interpretation of Major Clinical Risk Factors</title><p>Hypertension is a common early manifestation of ADPKD, often developing before renal function declines. It affects up to 86.6% of patients with ADPKD, frequently appearing around 30 years of age, with up to 20% of them diagnosed before the age of 20 [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. The underlying mechanisms involve intrarenal ischemia, renin-angiotensin-aldosterone system (RAAS) activation, and endothelial dysfunction. Progressive cyst expansion leads to renal hypoperfusion and sustained RAAS stimulation, further exacerbating hypertension and accelerating kidney damage [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. This mechanistic framework is consistent with our results, where hypertension and cardiovascular comorbidity markers, including ischemic heart disease and related medication patterns, contributed meaningfully to dialysis risk prediction.</p><p>Age and overall comorbidity burden were among the highest-ranked predictors in both the consensus feature ranking and the final XGBoost feature set. This pattern suggests that administrative claims-based models capture the cumulative burden of systemic illness, frailty, and health care utilization that often accompanies advanced kidney disease trajectories [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. 
In our cohort, ischemic heart disease and cardiovascular medication proxies (eg, anticoagulants, antiplatelet agents, beta-blockers, and loop diuretics) were repeatedly selected, indicating that cardiovascular disease severity and its treatment intensity provide informative signals of near-term dialysis risk [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>].</p><p>In our cohort, anemia showed the strongest association with dialysis initiation in the adjusted Cox model and was consistently selected by the ML algorithms. A study conducted in Japan found that, despite higher hemoglobin levels in ADPKD than in other CKD types, anemia remains a key predictor of renal disease progression. In nondialysis patients with ADPKD, lower hemoglobin levels were associated with faster kidney function decline, with men with hemoglobin levels less than 12 g/dL and women with hemoglobin levels less than 11 g/dL at higher risk [<xref ref-type="bibr" rid="ref32">32</xref>]. Together, these findings support anemia as a clinically accessible marker of advanced disease and progression risk in ADPKD.</p><p>AKI and infection-related diagnoses such as pneumonia and UTI also contributed to the prediction. These events may accelerate loss of residual kidney function through hemodynamic instability, inflammatory injury, or nephrotoxic exposures, and they may also serve as markers of vulnerability and more frequent clinical encounters. In parallel, medication predictors such as sodium bicarbonate and NSAIDs plausibly reflect clinically recognized metabolic acidosis and nephrotoxic exposure that often accompany advanced CKD and precede dialysis initiation [<xref ref-type="bibr" rid="ref33">33</xref>].</p></sec><sec id="s4-3"><title>Medication Predictors as Markers of Disease Severity</title><p>As highlighted earlier, a critical aspect of interpreting our findings is the potential for confounding by indication, particularly for medication-related predictors. 
In a retrospective cohort study, the use of a specific medication is often a marker of underlying disease severity rather than a cause of the outcome itself. Therefore, while these medications emerged as strong predictors in our model, they should be viewed primarily as indicators of a higher underlying risk profile, and our findings do not imply a causal relationship or recommend changes in prescribing practices. Consistent with prior work using administrative claims for kidney failure prediction, these medication patterns should be interpreted primarily as proxies for clinical complexity rather than as causal determinants of dialysis initiation [<xref ref-type="bibr" rid="ref31">31</xref>].</p><p>Renin-angiotensin system inhibitors have been established as the first-line treatment due to their benefits in hypertension control [<xref ref-type="bibr" rid="ref34">34</xref>]. In our model, the selection of additional antihypertensive classes (eg, alpha-blockers and CCB) and loop diuretics likely reflects difficult-to-control blood pressure, volume management needs, or concomitant cardiovascular disease rather than direct causal effects on renal decline. Similarly, anticoagulant and antiplatelet use may act as proxies for atrial fibrillation, vascular disease, or prior cardiovascular events, conditions that commonly cluster with advanced CKD and a higher risk of dialysis initiation.</p><p>Tranexamic acid was also selected among the final XGBoost predictors. In ADPKD, gross hematuria is a common and clinically relevant event, and tranexamic acid has been used in small series for severe hematuria, although evidence remains limited [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. 
Therefore, in claims-based modeling, tranexamic acid likely functions as a proxy for clinically significant hematuria or bleeding-related care that clusters with more advanced disease trajectories, rather than as a causal determinant of dialysis initiation.</p><p>Hyperuricemia is increasingly implicated in CKD progression, and our model identified gout and febuxostat as informative predictors of dialysis. This finding does not suggest a causal link but rather reflects prescribing patterns that align with both international guidelines and local reimbursement policies. Major clinical practice guidelines for ADPKD recommend allopurinol as the first-line urate-lowering therapy [<xref ref-type="bibr" rid="ref2">2</xref>]. This standard is strictly reflected in Taiwan&#x2019;s National Health Insurance system, where reimbursement for the second-line agent, febuxostat, was restricted during our study period. These restrictions likely limited its use primarily to patients with substantial preexisting conditions, most notably advanced chronic kidney disease (defined as eGFR &#x003C;45 mL/min/1.73 m<sup>2</sup>) or other complications such as urate nephrolithiasis or severe tophaceous gout. Consequently, the predictive signal from febuxostat in our model arises because it serves as a powerful proxy, identifying a patient subgroup with higher baseline renal risk and greater disease complexity. Further prospective studies are needed to determine if urate-lowering therapy itself modifies the disease course in ADPKD.</p><p>Statins, primarily known for their cholesterol-lowering effects, also possess anti-inflammatory and antioxidant properties that could be beneficial in PKD. Chronic inflammation and oxidative stress play roles in the pathophysiology of PKD, contributing to cyst growth and renal function decline. Evidence regarding the efficacy of statins in PKD is equivocal. 
Some cohort studies and animal research suggest that statins may slow the decline in renal function in patients with PKD by reducing inflammation and oxidative stress [<xref ref-type="bibr" rid="ref9">9</xref>]. However, findings from definitive clinical trials in PKD populations, which are scarce, remain inconclusive.</p></sec><sec id="s4-4"><title>Comparison With Existing Risk Stratification Tools</title><p>Our ML approach should be compared with existing clinical risk tools for ADPKD, such as the Mayo Imaging Classification and the PROPKD score. The primary advantage of our model lies in its broad accessibility. By leveraging nationwide administrative data, it bypasses the need for resource-intensive assessments, such as MRI for TKV measurement or genetic sequencing, making it a scalable and cost-effective tool for initial risk stratification across a large population. The main disadvantage, however, is the lack of direct pathophysiological data. Without TKV or genetic data, our model relies on surrogate markers of disease severity and cannot offer the same level of mechanistic insight or precision as the gold-standard tools. Therefore, our model should not be viewed as a replacement for these established methods but rather as a complementary instrument. Its optimal clinical role would be to serve as a first-line screening tool to efficiently identify high-risk patients who could then be prioritized for more definitive prognostic evaluations like imaging or genetic testing.</p></sec><sec id="s4-5"><title>Strengths and Limitations</title><p>To our knowledge, this study represents the first nationwide ML-based analysis of dialysis risk in ADPKD using administrative data. It provides a scalable framework for population-level risk stratification. The use of the NHIRD, a large population-based dataset with long-term follow-up, ensures high generalizability to the nationwide population of Taiwan.</p><p>Several limitations of this study should be acknowledged. 
First, its retrospective design precludes the establishment of causality. Second, and most importantly, our study is constrained by the nature of the NHIRD, which lacks the gold-standard prognostic markers for ADPKD, including genetic data (PKD1/PKD2 status) and imaging biomarkers such as TKV, as well as key laboratory values such as eGFR and proteinuria. Without direct access to TKV or genetic data, our model inherently relies on surrogate markers such as comorbidity burden and medication patterns to infer underlying risk. Despite the use of a washout period and validation via the Catastrophic Illness Patient Registry, truly incident ADPKD cases cannot be fully guaranteed in claims-based data. We therefore wish to emphasize that our model is proposed as a complementary tool for broad-based risk stratification, not as a replacement for comprehensive clinical evaluation. Third, because observation windows vary by index year, the binary labeling framework may under-ascertain events among patients with shorter follow-up and can bias absolute risk interpretation. In addition, calibration curves were not presented, limiting assessment of absolute risk calibration. Fourth, because deaths occurring before ESRD were labeled as nonevents in the binary ML framework, patients with high competing mortality may be misclassified as having low renal risk. Fifth, the measurement of medication exposure, quantified by prescription days, is a proxy that does not capture actual patient adherence, dosage, or treatment adjustments. This limits our ability to make definitive conclusions about the role of specific pharmacological agents. Finally, our model was developed using a Taiwanese population, and its performance and the relative importance of predictors may vary across different ethnic and geographic groups, which may limit generalizability.</p></sec><sec id="s4-6"><title>Future Work</title><p>Future studies should prioritize prospective validation in diverse external cohorts. 
Methodologically, fixed-horizon prediction and time-to-event approaches, including survival ML and competing-risk or multistate frameworks, should be evaluated to better align modeling with clinical trajectories. External validation datasets that include laboratory, genetic, and imaging biomarkers (eg, eGFR, proteinuria, PKD1/PKD2 status, and TKV) will enable integrated, multitiered risk stratification and more complete assessment of calibration and clinical utility. Moreover, instance-level explainability methods (eg, SHAP) can be explored to support clinical interpretability.</p></sec><sec id="s4-7"><title>Conclusions</title><p>This study developed and evaluated 6 ML models to classify dialysis initiation risk in a nationwide ADPKD cohort using administrative claims data and a prespecified temporal validation design. On the held-out temporal test set, XGBoost showed the best overall performance. The most informative predictors primarily reflected disease severity and care intensity captured in claims data, including age, comorbidity burden, anemia, and hypertension, whereas medication variables should be interpreted as noncausal proxies of clinical complexity.</p></sec></sec></body><back><ack><p>No generative artificial intelligence tools were used to generate the manuscript text, analyses, figures, tables, or multimedia appendix. All study design decisions, analyses, interpretations, and final wording were produced and verified by the authors.</p></ack><notes><sec><title>Funding</title><p>This study was supported by the Shin-Kong Wu Ho-Su Memorial Hospital Research Foundation (2022SKHADR035) and the National Science and Technology Council, Taiwan (NSTC 112-2221-E-030-009-MY3). The funding sources had no role in the study design, data collection, analysis, or interpretation of the results.</p></sec><sec><title>Data Availability</title><p>The dataset used in this study belongs to the Taiwan Ministry of Health and Welfare (MOHW). 
Due to data protection regulations, the dataset cannot be shared by the corresponding author upon request. However, researchers interested in accessing this dataset may apply for access through the website of the National Health Informatics Project of the MOHW [<xref ref-type="bibr" rid="ref36">36</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: MC, MHT, YWF</p><p>Data curation: MHT, HHL</p><p>Formal analysis: CHC, MC, YCH, CL</p><p>Funding acquisition: MC, YWF</p><p>Investigation: MHT, YWF</p><p>Methodology: CHC, MC, YCH, HHL, BCS, CL</p><p>Resources: MC, YCH</p><p>Software: MC, YCH</p><p>Supervision: MC, YWF</p><p>Validation: MHT, YCH, BCS</p><p>Writing &#x2013; original draft: CHC, MC</p><p>Writing &#x2013; review and editing: MHT, BCS, CL, YWF</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ACEI</term><def><p>angiotensin-converting enzyme inhibitor</p></def></def-item><def-item><term id="abb2">ADPKD</term><def><p>autosomal dominant polycystic kidney disease</p></def></def-item><def-item><term id="abb3">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb4">AKI</term><def><p>acute kidney injury</p></def></def-item><def-item><term id="abb5">ARB</term><def><p>angiotensin II receptor blocker</p></def></def-item><def-item><term id="abb6">AUC</term><def><p>area under the curve</p></def></def-item><def-item><term id="abb7">CCB</term><def><p>calcium channel blocker</p></def></def-item><def-item><term id="abb8">CCI</term><def><p>Charlson Comorbidity Index</p></def></def-item><def-item><term id="abb9">COPD</term><def><p>chronic obstructive pulmonary disease</p></def></def-item><def-item><term id="abb10">ESRD</term><def><p>end-stage renal disease</p></def></def-item><def-item><term id="abb11">HR</term><def><p>hazard ratio</p></def></def-item><def-item><term id="abb12">ML</term><def><p>machine 
learning</p></def></def-item><def-item><term id="abb13">MRI</term><def><p>magnetic resonance imaging</p></def></def-item><def-item><term id="abb14">NHIRD</term><def><p>National Health Insurance Research Database</p></def></def-item><def-item><term id="abb15">NSAID</term><def><p>nonsteroidal anti-inflammatory drug</p></def></def-item><def-item><term id="abb16">PKD</term><def><p>polycystic kidney disease</p></def></def-item><def-item><term id="abb17">TKV</term><def><p>total kidney volume</p></def></def-item><def-item><term id="abb18">UTI</term><def><p>urinary tract infection</p></def></def-item><def-item><term id="abb19">XGBoost</term><def><p>extreme gradient boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Harris</surname><given-names>PC</given-names> </name><name name-style="western"><surname>Torres</surname><given-names>VE</given-names> </name></person-group><article-title>Polycystic kidney disease</article-title><source>Annu Rev Med</source><year>2009</year><volume>60</volume><fpage>321</fpage><lpage>337</lpage><pub-id pub-id-type="doi">10.1146/annurev.med.60.101707.125712</pub-id><pub-id pub-id-type="medline">18947299</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>Kidney Disease: Improving Global Outcomes (KDIGO) ADPKD Work Group</collab></person-group><article-title>KDIGO 2025 clinical practice guideline for the evaluation, management, and treatment of autosomal dominant polycystic kidney disease (ADPKD)</article-title><source>Kidney Int</source><year>2025</year><month>02</month><volume>107</volume><issue>2S</issue><fpage>S1</fpage><lpage>S239</lpage><pub-id pub-id-type="doi">10.1016/j.kint.2024.07.009</pub-id><pub-id pub-id-type="medline">39848759</pub-id></nlm-citation></ref><ref 
id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jafar</surname><given-names>TH</given-names> </name><name name-style="western"><surname>Stark</surname><given-names>PC</given-names> </name><name name-style="western"><surname>Schmid</surname><given-names>CH</given-names> </name><etal/></person-group><article-title>Progression of chronic kidney disease: the role of blood pressure control, proteinuria, and angiotensin-converting enzyme inhibition: a patient-level meta-analysis</article-title><source>Ann Intern Med</source><year>2003</year><month>08</month><day>19</day><volume>139</volume><issue>4</issue><fpage>244</fpage><lpage>252</lpage><pub-id pub-id-type="doi">10.7326/0003-4819-139-4-200308190-00006</pub-id><pub-id pub-id-type="medline">12965979</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Benck</surname><given-names>U</given-names> </name><name name-style="western"><surname>Kr&#x00FC;ger</surname><given-names>B</given-names> </name><name name-style="western"><surname>Schmitt</surname><given-names>WH</given-names> </name></person-group><article-title>Blood pressure in early autosomal dominant polycystic kidney disease</article-title><source>N Engl J Med</source><year>2015</year><month>03</month><day>5</day><volume>372</volume><issue>10</issue><fpage>975</fpage><lpage>977</lpage><pub-id pub-id-type="doi">10.1056/NEJMc1500332</pub-id><pub-id pub-id-type="medline">25738679</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kramers</surname><given-names>BJ</given-names> </name><name name-style="western"><surname>Koorevaar</surname><given-names>IW</given-names> </name><name 
name-style="western"><surname>Drenth</surname><given-names>JPH</given-names> </name><etal/></person-group><article-title>Salt, but not protein intake, is associated with accelerated disease progression in autosomal dominant polycystic kidney disease</article-title><source>Kidney Int</source><year>2020</year><month>10</month><volume>98</volume><issue>4</issue><fpage>989</fpage><lpage>998</lpage><pub-id pub-id-type="doi">10.1016/j.kint.2020.04.053</pub-id><pub-id pub-id-type="medline">32534051</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nowak</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Steele</surname><given-names>C</given-names> </name><name name-style="western"><surname>Gitomer</surname><given-names>B</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Ouyang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chonchol</surname><given-names>MB</given-names> </name></person-group><article-title>Overweight and obesity and progression of ADPKD</article-title><source>Clin J Am Soc Nephrol</source><year>2021</year><month>06</month><volume>16</volume><issue>6</issue><fpage>908</fpage><lpage>915</lpage><pub-id pub-id-type="doi">10.2215/CJN.16871020</pub-id><pub-id pub-id-type="medline">34117082</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Torres</surname><given-names>VE</given-names> </name><name name-style="western"><surname>Chapman</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Devuyst</surname><given-names>O</given-names> </name><etal/></person-group><article-title>Tolvaptan in patients with autosomal dominant polycystic 
kidney disease</article-title><source>N Engl J Med</source><year>2012</year><month>12</month><day>20</day><volume>367</volume><issue>25</issue><fpage>2407</fpage><lpage>2418</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1205511</pub-id><pub-id pub-id-type="medline">23121377</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Takiar</surname><given-names>V</given-names> </name><name name-style="western"><surname>Nishio</surname><given-names>S</given-names> </name><name name-style="western"><surname>Seo-Mayer</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Activating AMP-activated protein kinase (AMPK) slows renal cystogenesis</article-title><source>Proc Natl Acad Sci U S A</source><year>2011</year><month>02</month><day>8</day><volume>108</volume><issue>6</issue><fpage>2462</fpage><lpage>2467</lpage><pub-id pub-id-type="doi">10.1073/pnas.1011498108</pub-id><pub-id pub-id-type="medline">21262823</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fassett</surname><given-names>RG</given-names> </name><name name-style="western"><surname>Robertson</surname><given-names>IK</given-names> </name><name name-style="western"><surname>Ball</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Geraghty</surname><given-names>DP</given-names> </name><name name-style="western"><surname>Coombes</surname><given-names>JS</given-names> </name></person-group><article-title>Effect of atorvastatin on kidney function in chronic kidney disease: a randomised double-blind placebo-controlled trial</article-title><source>Atherosclerosis</source><year>2010</year><month>11</month><volume>213</volume><issue>1</issue><fpage>218</fpage><lpage>224</lpage><pub-id 
pub-id-type="doi">10.1016/j.atherosclerosis.2010.07.053</pub-id><pub-id pub-id-type="medline">20810109</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Irazabal</surname><given-names>MV</given-names> </name><name name-style="western"><surname>Rangel</surname><given-names>LJ</given-names> </name><name name-style="western"><surname>Bergstralh</surname><given-names>EJ</given-names> </name><etal/></person-group><article-title>Imaging classification of autosomal dominant polycystic kidney disease: a simple model for selecting patients for clinical trials</article-title><source>J Am Soc Nephrol</source><year>2015</year><month>01</month><volume>26</volume><issue>1</issue><fpage>160</fpage><lpage>172</lpage><pub-id pub-id-type="doi">10.1681/ASN.2013101138</pub-id><pub-id pub-id-type="medline">24904092</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cornec-Le Gall</surname><given-names>E</given-names> </name><name name-style="western"><surname>Audr&#x00E9;zet</surname><given-names>MP</given-names> </name><name name-style="western"><surname>Rousseau</surname><given-names>A</given-names> </name><etal/></person-group><article-title>The PROPKD score: a new algorithm to predict renal survival in autosomal dominant polycystic kidney disease</article-title><source>J Am Soc Nephrol</source><year>2016</year><month>03</month><volume>27</volume><issue>3</issue><fpage>942</fpage><lpage>951</lpage><pub-id pub-id-type="doi">10.1681/ASN.2015010016</pub-id><pub-id pub-id-type="medline">26150605</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Niel</surname><given-names>O</given-names> </name><name 
name-style="western"><surname>Boussard</surname><given-names>C</given-names> </name><name name-style="western"><surname>Bastard</surname><given-names>P</given-names> </name></person-group><article-title>Artificial intelligence can predict GFR decline during the course of ADPKD</article-title><source>Am J Kidney Dis</source><year>2018</year><month>06</month><volume>71</volume><issue>6</issue><fpage>911</fpage><lpage>912</lpage><pub-id pub-id-type="doi">10.1053/j.ajkd.2018.01.051</pub-id><pub-id pub-id-type="medline">29609979</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Bu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Tao</surname><given-names>C</given-names> </name><name name-style="western"><surname>Bae</surname><given-names>KT</given-names> </name><collab>HALT Polycystic Kidney Disease Study Group</collab></person-group><article-title>Deep learning-based automated imaging classification of ADPKD</article-title><source>Kidney Int Rep</source><year>2024</year><month>06</month><volume>9</volume><issue>6</issue><fpage>1802</fpage><lpage>1809</lpage><pub-id pub-id-type="doi">10.1016/j.ekir.2024.04.002</pub-id><pub-id pub-id-type="medline">38899202</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sharma</surname><given-names>K</given-names> </name><name name-style="western"><surname>Rupprecht</surname><given-names>C</given-names> </name><name name-style="western"><surname>Caroli</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Automatic segmentation of kidneys using deep learning for total kidney volume quantification in autosomal dominant polycystic kidney 
disease</article-title><source>Sci Rep</source><year>2017</year><month>05</month><day>17</day><volume>7</volume><issue>1</issue><fpage>2049</fpage><pub-id pub-id-type="doi">10.1038/s41598-017-01779-0</pub-id><pub-id pub-id-type="medline">28515418</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Taylor</surname><given-names>J</given-names> </name><name name-style="western"><surname>Thomas</surname><given-names>R</given-names> </name><name name-style="western"><surname>Metherall</surname><given-names>P</given-names> </name><etal/></person-group><article-title>An artificial intelligence generated automated algorithm to measure total kidney volume in ADPKD</article-title><source>Kidney Int Rep</source><year>2024</year><month>02</month><volume>9</volume><issue>2</issue><fpage>249</fpage><lpage>256</lpage><pub-id pub-id-type="doi">10.1016/j.ekir.2023.10.029</pub-id><pub-id pub-id-type="medline">38344736</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>LY</given-names> </name><name name-style="western"><surname>Warren-Gash</surname><given-names>C</given-names> </name><name name-style="western"><surname>Smeeth</surname><given-names>L</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>PC</given-names> </name></person-group><article-title>Data resource profile: the National Health Insurance Research Database (NHIRD)</article-title><source>Epidemiol Health</source><year>2018</year><volume>40</volume><fpage>e2018062</fpage><pub-id pub-id-type="doi">10.4178/epih.e2018062</pub-id><pub-id pub-id-type="medline">30727703</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Kalatharan</surname><given-names>V</given-names> </name><name name-style="western"><surname>McArthur</surname><given-names>E</given-names> </name><name name-style="western"><surname>Nash</surname><given-names>DM</given-names> </name><etal/></person-group><article-title>Diagnostic accuracy of administrative codes for autosomal dominant polycystic kidney disease in clinic patients with cystic kidney disease</article-title><source>Clin Kidney J</source><year>2021</year><month>02</month><volume>14</volume><issue>2</issue><fpage>612</fpage><lpage>616</lpage><pub-id pub-id-type="doi">10.1093/ckj/sfz184</pub-id><pub-id pub-id-type="medline">33623686</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nan-Ping</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yi-Hui</surname><given-names>L</given-names> </name><name name-style="western"><surname>Chi-Yu</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Comparisons of medical utilizations and categorical diagnoses of emergency visits between the elderly with catastrophic illness certificates and those without</article-title><source>BMC Health Serv Res</source><year>2013</year><month>04</month><day>26</day><volume>13</volume><fpage>152</fpage><pub-id pub-id-type="doi">10.1186/1472-6963-13-152</pub-id><pub-id pub-id-type="medline">23622501</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>SW</given-names> </name><name name-style="western"><surname>Li</surname><given-names>LC</given-names> </name><name name-style="western"><surname>Su</surname><given-names>CH</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>YH</given-names> 
</name><name name-style="western"><surname>Hsu</surname><given-names>TW</given-names> </name><name name-style="western"><surname>Hsu</surname><given-names>CN</given-names> </name></person-group><article-title>Association of statin and its lipophilicity with cardiovascular events in patients receiving chronic dialysis</article-title><source>Clin Pharmacol Ther</source><year>2020</year><month>06</month><volume>107</volume><issue>6</issue><fpage>1312</fpage><lpage>1324</lpage><pub-id pub-id-type="doi">10.1002/cpt.1722</pub-id><pub-id pub-id-type="medline">31715017</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Hastie</surname><given-names>T</given-names> </name><name name-style="western"><surname>Tibshirani</surname><given-names>R</given-names> </name><name name-style="western"><surname>Friedman</surname><given-names>J</given-names> </name></person-group><source>The Elements of Statistical Learning</source><year>2009</year><publisher-name>Springer</publisher-name><pub-id pub-id-type="doi">10.1007/978-0-387-84858-7</pub-id><pub-id pub-id-type="other">978-0-387-84857-0</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Prokhorenkova</surname><given-names>L</given-names> </name><name name-style="western"><surname>Gusev</surname><given-names>G</given-names> </name><name name-style="western"><surname>Vorobev</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dorogush</surname><given-names>AV</given-names> </name><name name-style="western"><surname>Gulin</surname><given-names>A</given-names> </name></person-group><article-title>CatBoost: unbiased boosting with categorical features</article-title><access-date>2026-02-24</access-date><conf-name>32nd Conference on Neural Information Processing 
Systems (NeurIPS 2018)</conf-name><conf-date>Dec 3-8, 2018</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://proceedings.neurips.cc/paper_files/paper/2018/file/14491b756b3a51daac41c24863285549-Paper.pdf">https://proceedings.neurips.cc/paper_files/paper/2018/file/14491b756b3a51daac41c24863285549-Paper.pdf</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Ho</surname><given-names>CW</given-names> </name><name name-style="western"><surname>Chou</surname><given-names>WR</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>M</given-names> </name></person-group><article-title>A framework to predict second primary lung cancer patients by using ensemble models</article-title><source>Ann Oper Res</source><year>2025</year><month>05</month><volume>348</volume><issue>1</issue><fpage>373</fpage><lpage>397</lpage><pub-id pub-id-type="doi">10.1007/s10479-023-05691-x</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>KY</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>CK</given-names> </name><name name-style="western"><surname>Li</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>M</given-names> </name></person-group><article-title>Machine learning-driven prediction of medical expenses in triple-vessel PCI patients using feature selection</article-title><source>BMC Health Serv 
Res</source><year>2025</year><month>01</month><day>20</day><volume>25</volume><issue>1</issue><fpage>105</fpage><pub-id pub-id-type="doi">10.1186/s12913-025-12218-6</pub-id><pub-id pub-id-type="medline">39833782</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rahbari-Oskoui</surname><given-names>F</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>O</given-names> </name><name name-style="western"><surname>Chapman</surname><given-names>A</given-names> </name></person-group><article-title>Mechanisms and management of hypertension in autosomal dominant polycystic kidney disease</article-title><source>Nephrol Dial Transplant</source><year>2014</year><month>12</month><volume>29</volume><issue>12</issue><fpage>2194</fpage><lpage>2201</lpage><pub-id pub-id-type="doi">10.1093/ndt/gft513</pub-id><pub-id pub-id-type="medline">24463189</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Helal</surname><given-names>I</given-names> </name><name name-style="western"><surname>Reed</surname><given-names>B</given-names> </name><name name-style="western"><surname>Mettler</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Prevalence of cardiovascular events in patients with autosomal dominant polycystic kidney disease</article-title><source>Am J Nephrol</source><year>2012</year><volume>36</volume><issue>4</issue><fpage>362</fpage><lpage>370</lpage><pub-id pub-id-type="doi">10.1159/000343281</pub-id><pub-id pub-id-type="medline">23038404</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chapman</surname><given-names>AB</given-names> 
</name><name name-style="western"><surname>Stepniakowski</surname><given-names>K</given-names> </name><name name-style="western"><surname>Rahbari-Oskoui</surname><given-names>F</given-names> </name></person-group><article-title>Hypertension in autosomal dominant polycystic kidney disease</article-title><source>Adv Chronic Kidney Dis</source><year>2010</year><month>03</month><volume>17</volume><issue>2</issue><fpage>153</fpage><lpage>163</lpage><pub-id pub-id-type="doi">10.1053/j.ackd.2010.01.001</pub-id><pub-id pub-id-type="medline">20219618</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schrier</surname><given-names>RW</given-names> </name><name name-style="western"><surname>Abebe</surname><given-names>KZ</given-names> </name><name name-style="western"><surname>Perrone</surname><given-names>RD</given-names> </name><etal/></person-group><article-title>Blood pressure in early autosomal dominant polycystic kidney disease</article-title><source>N Engl J Med</source><year>2014</year><month>12</month><day>11</day><volume>371</volume><issue>24</issue><fpage>2255</fpage><lpage>2266</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1402685</pub-id><pub-id pub-id-type="medline">25399733</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>DH</given-names> </name><name name-style="western"><surname>Schneeweiss</surname><given-names>S</given-names> </name><name name-style="western"><surname>Glynn</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Lipsitz</surname><given-names>LA</given-names> </name><name name-style="western"><surname>Rockwood</surname><given-names>K</given-names> </name><name name-style="western"><surname>Avorn</surname><given-names>J</given-names> 
</name></person-group><article-title>Measuring frailty in Medicare data: development and validation of a claims-based frailty index</article-title><source>J Gerontol A Biol Sci Med Sci</source><year>2018</year><month>06</month><day>14</day><volume>73</volume><issue>7</issue><fpage>980</fpage><lpage>987</lpage><pub-id pub-id-type="doi">10.1093/gerona/glx229</pub-id><pub-id pub-id-type="medline">29244057</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Walker</surname><given-names>H</given-names> </name><name name-style="western"><surname>Day</surname><given-names>S</given-names> </name><name name-style="western"><surname>Grant</surname><given-names>CH</given-names> </name><etal/></person-group><article-title>Representation of multimorbidity and frailty in the development and validation of kidney failure prognostic prediction models: a systematic review</article-title><source>BMC Med</source><year>2024</year><month>10</month><day>11</day><volume>22</volume><issue>1</issue><fpage>452</fpage><pub-id pub-id-type="doi">10.1186/s12916-024-03649-9</pub-id><pub-id pub-id-type="medline">39394084</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chuah</surname><given-names>A</given-names> </name><name name-style="western"><surname>Walters</surname><given-names>G</given-names> </name><name name-style="western"><surname>Christiadi</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Machine learning improves upon clinicians&#x2019; prediction of end stage kidney disease</article-title><source>Front Med</source><year>2022</year><volume>9</volume><pub-id pub-id-type="doi">10.3389/fmed.2022.837232</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation 
citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Al-Sayouri</surname><given-names>S</given-names> </name><name name-style="western"><surname>Padman</surname><given-names>R</given-names> </name></person-group><article-title>Towards interpretable end-stage renal disease (ESRD) prediction: utilizing administrative claims data with explainable AI techniques</article-title><source>AMIA Annu Symp Proc</source><year>2024</year><volume>2024</volume><fpage>664</fpage><lpage>673</lpage><pub-id pub-id-type="medline">40417492</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ushio</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Kataoka</surname><given-names>H</given-names> </name><name name-style="western"><surname>Sato</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Association between anemia and renal prognosis in autosomal dominant polycystic kidney disease: a retrospective study</article-title><source>Clin Exp Nephrol</source><year>2020</year><month>06</month><volume>24</volume><issue>6</issue><fpage>500</fpage><lpage>508</lpage><pub-id pub-id-type="doi">10.1007/s10157-020-01856-1</pub-id><pub-id pub-id-type="medline">32036465</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goraya</surname><given-names>N</given-names> </name><name name-style="western"><surname>Wesson</surname><given-names>DE</given-names> </name></person-group><article-title>Clinical evidence that treatment of metabolic acidosis slows the progression of chronic kidney disease</article-title><source>Curr Opin Nephrol 
Hypertens</source><year>2019</year><month>05</month><volume>28</volume><issue>3</issue><fpage>267</fpage><lpage>277</lpage><pub-id pub-id-type="doi">10.1097/MNH.0000000000000491</pub-id><pub-id pub-id-type="medline">30681417</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Torres</surname><given-names>VE</given-names> </name><name name-style="western"><surname>Abebe</surname><given-names>KZ</given-names> </name><name name-style="western"><surname>Chapman</surname><given-names>AB</given-names> </name><etal/></person-group><article-title>Angiotensin blockade in late autosomal dominant polycystic kidney disease</article-title><source>N Engl J Med</source><year>2014</year><month>12</month><day>11</day><volume>371</volume><issue>24</issue><fpage>2267</fpage><lpage>2276</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1402686</pub-id><pub-id pub-id-type="medline">25399731</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yao</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Treatment of persistent gross hematuria with tranexamic acid in autosomal dominant polycystic kidney disease</article-title><source>Kidney Blood Press Res</source><year>2017</year><volume>42</volume><issue>1</issue><fpage>156</fpage><lpage>164</lpage><pub-id pub-id-type="doi">10.1159/000474961</pub-id><pub-id pub-id-type="medline">28395294</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="web"><article-title>National health informatics project of the MOHW</article-title><source>Ministry of Health and 
Welfare</source><access-date>2026-02-27</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://dep.mohw.gov.tw/DOS/mp-113.html">https://dep.mohw.gov.tw/DOS/mp-113.html</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Supplementary methods and tables, including model implementation details for the six machine learning algorithms, ICD-9-CM/ICD-10-CM codes for comorbidities (Table S1), ATC codes and drug lists (Table S2), and tuned hyperparameters with software packages and versions (Table S3).</p><media xlink:href="medinform_v14i1e80343_app1.docx" xlink:title="DOCX File, 38 KB"/></supplementary-material></app-group></back></article>