<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id><journal-id journal-id-type="publisher-id">medinform</journal-id><journal-id journal-id-type="index">7</journal-id><journal-title>JMIR Medical Informatics</journal-title><abbrev-journal-title>JMIR Med Inform</abbrev-journal-title><issn pub-type="epub">2291-9694</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v13i1e74415</article-id><article-id pub-id-type="doi">10.2196/74415</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Machine Learning&#x2013;Based Analysis of Lifestyle Risk Factors for Atherosclerotic Cardiovascular Disease: Retrospective Case-Control Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Kim</surname><given-names>Hye-Jin</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Choi</surname><given-names>Heeji</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ahn</surname><given-names>Hyo-Jung</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Shin</surname><given-names>Seung-Ho</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Kim</surname><given-names>Chulho</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lee</surname><given-names>Sang-Hwa</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sohn</surname><given-names>Jong-Hee</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lee</surname><given-names>Jae-Jun</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Artificial Intelligence Research Center, College of Medicine, Hallym University</institution><addr-line>Chuhcneon-si</addr-line><country>Republic of Korea</country></aff><aff id="aff2"><institution>Health Insurance Review and Assessment Research Institute, Health Insurance Review and Assessment Service</institution><addr-line>Wonju-si</addr-line><country>Republic of Korea</country></aff><aff id="aff3"><institution>Department of Neurology, College of Medicine, Hallym University</institution><addr-line>1, Hallymdaehak-gil</addr-line><addr-line>Chuncheon-si</addr-line><country>Republic of Korea</country></aff><aff id="aff4"><institution>Department of Anesthesiology, College of Medicine, Hallym University</institution><addr-line>Chuncheon-si</addr-line><country>Republic of Korea</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Benis</surname><given-names>Arriel</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Adeoye</surname><given-names>Adekunle</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Obisesan Olawuni</surname><given-names>Kudirat Abidemi</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Potla</surname><given-names>Ravi Teja</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to  Chulho Kim, MD, PhD, Department of Neurology, College of Medicine, Hallym University, 1, Hallymdaehak-gil, Chuncheon-si, 24252, Republic of Korea, 82 332405255, 82 1095173201; <email>gumdol52@naver.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>7</day><month>8</month><year>2025</year></pub-date><volume>13</volume><elocation-id>e74415</elocation-id><history><date date-type="received"><day>24</day><month>03</month><year>2025</year></date><date date-type="rev-recd"><day>09</day><month>05</month><year>2025</year></date><date date-type="accepted"><day>16</day><month>06</month><year>2025</year></date></history><copyright-statement>&#x00A9; Hye-Jin Kim, Heeji Choi, Hyo-Jung Ahn, Seung-Ho Shin, Chulho Kim, Sang-Hwa Lee, Jong-Hee Sohn, Jae-Jun Lee. Originally published in JMIR Medical Informatics (<ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org">https://medinform.jmir.org</ext-link>), 7.8.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://medinform.jmir.org/">https://medinform.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e74415"/><abstract><sec><title>Background</title><p>The risk of developing atherosclerotic cardiovascular disease (ASCVD) varies among individuals and is related to a variety of lifestyle factors in addition to the presence of chronic diseases.</p></sec><sec><title>Objective</title><p>We aimed to assess the predictive accuracy of machine learning (ML) models incorporating lifestyle risk behaviors for ASCVD risk using the Korean nationwide database.</p></sec><sec sec-type="methods"><title>Methods</title><p>Using data from the Korea National Health and Nutrition Examination Survey, 5 ML algorithms were used for the prediction of high ASCVD risk: logistic regression (LR), support vector machine, random forest, extreme gradient boosting, and light gradient boosting models. ASCVD risk was assessed using the pooled cohort equations, with a high-risk threshold of &#x2265;7.5% over 10 years. Among the 8573 participants aged 40&#x2010;79 years, propensity score matching (PSM) was used to adjust for demographic confounders. We divided the dataset into a training and a test dataset in an 8:2 ratio. We also used bootstrapping to train the ML model with the area under the receiver operating characteristics curve score. Shapley additive explanations were used to identify the models&#x2019; important variables in assessing high ASCVD risks. In sensitivity analysis, we additionally performed binary LR analysis, in which the ML model&#x2019;s results were consistent with the conventional statistical model.</p></sec><sec sec-type="results"><title>Results</title><p>Of the 8573 participants, 41.7% (n=3578) had high ASCVD risk. Before PSM, age and sex differed significantly between groups. PSM (1:1) yielded 1976 patients with balanced demographics. After PSM, the high ASCVD risk group had higher alcohol or tobacco use, lower omega-3 intake, higher BMI, less physical activity, and spent less time sitting. In 5 ML models, the extreme gradient boosting model showed the highest area under the receiver operating characteristics curve, indicating superior overall discrimination between high and low ASCVD risk groups. However, the light gradient boosting model demonstrated better performance in accuracy, recall, and <italic>F</italic><sub>1</sub>-score. Variable importance analysis using Shapley additive explanations identified smoking and age as the strongest predictors, while BMI, sodium or omega-3 intake, and low-density lipoprotein cholesterol also had significant variables. Sensitivity analysis using multivariable LR analysis also confirmed these findings, showing that smoking, BMI, and low-density lipoprotein cholesterol increased ASCVD risk, whereas omega-3 intake and physical activity were associated with lower risk.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Analyzing lifestyle behavioral factors in ASCVD risk with an ML model improves the predictive performance compared to traditional models. Personalized prevention strategies tailored to an individual&#x2019;s lifestyle can effectively reduce ASCVD risk.</p></sec></abstract><kwd-group><kwd>atherosclerotic cardiovascular disease</kwd><kwd>machine learning</kwd><kwd>lifestyle risk behaviors</kwd><kwd>predictive modeling</kwd><kwd>low-density lipoprotein</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Atherosclerotic cardiovascular disease (ASCVD) remains the leading cause of morbidity and mortality worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. In 2019, cardiovascular diseases (CVDs) were responsible for an estimated 32% of all global deaths [<xref ref-type="bibr" rid="ref2">2</xref>]. Of the 17 million premature deaths caused by noncommunicable diseases in 2019, 38% were attributable to CVDs [<xref ref-type="bibr" rid="ref2">2</xref>]. The prevalence of CVDs in South Korea has recently been increasing [<xref ref-type="bibr" rid="ref3">3</xref>]. While the CVD mortality rate declined until 2010, it has been steadily rising since then [<xref ref-type="bibr" rid="ref4">4</xref>]. Considering these trends, addressing CVDs is crucial for improving public health outcomes.</p><p>The main risk factors for developing ASCVD include hypertension, smoking, and dyslipidemia [<xref ref-type="bibr" rid="ref5">5</xref>]. Additionally, ASCVD outcomes vary across different ethnic groups based on socioeconomic status, which also influences health-related lifestyle behaviors [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. As the prevalence of ASCVD is increasing, the importance of primary prevention has been emphasized from a public health perspective [<xref ref-type="bibr" rid="ref9">9</xref>]. ASCVDs are closely related to modifiable risk factors that can be controlled through lifestyle modification, which is the cornerstone of ASCVD prevention [<xref ref-type="bibr" rid="ref9">9</xref>]. The most effective prevention strategy is a comprehensive approach that promotes a healthy lifestyle and addresses all major risk factors [<xref ref-type="bibr" rid="ref10">10</xref>].</p><p>Machine learning (ML) has been increasingly applied in medical data analysis, offering numerous benefits for enhancing patient care and improving clinical outcomes [<xref ref-type="bibr" rid="ref11">11</xref>]. Additionally, ML facilitates precision medicine by enabling early identification of high-risk patients for disease progression with high accuracy [<xref ref-type="bibr" rid="ref11">11</xref>]. Previous studies have constructed ML models for predicting ASCVD, but few have modeled the impact of lifestyle behaviors on ASCVD risk [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. Despite advances in ML, the combined predictive power of detailed lifestyle factors&#x2014;especially within interpretable ML frameworks&#x2014;remains underexplored. Although ML improves risk prediction, understanding which lifestyle factors have the greatest impact is crucial for prevention&#x2014;yet this is often unclear with black-box models. This study addresses that gap by applying interpretable ML techniques to accurately predict ASCVD risk and clarify the specific impact of individual lifestyle factors. ASCVD risk is influenced by demographic variables such as age, race, and sex, as well as lifestyle behaviors [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. Using data from the nationwide Korea National Health and Nutrition Examination Survey (KNHANES), we used five ML models to (1) examine the relationship between lifestyle factors and ASCVD risk, (2) evaluate the predictive performance of these models, and (3) identify the most influential predictors using interpretable methods.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Participants</title><p>This retrospective case-control study used nationally representative data from the KNHANES. The KNHANES is an ongoing, cross-sectional survey initiated in 1998 by the Korea Disease Control and Prevention Agency (KDCA) to assess the health and nutritional status of the Korean population. We used anonymized, publicly available data from 2019 to 2021. Among the 22,559 total participants in the 2019&#x2010;2021 KNHANES dataset, we initially screened 10,481 individuals aged 40&#x2010;79 years with no history of cardiovascular events. We excluded 1908 participants with missing data on sodium intake, low-density lipoprotein (LDL) cholesterol, time spent sitting, occupation, marital status, smoking status, income, BMI, or weight change over 1 year. The final analytic sample included 8573 participants.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>The original KNHANES surveys received ethical approval from the KDCA Institutional Review Board, and informed consent was obtained from all participants. All data were anonymized and deidentified by KDCA prior to public release. As this study involved the secondary analysis of deidentified public data, it was exempt from additional institutional review board review by our institution (2024-03-008).</p></sec><sec id="s2-3"><title>Measurement of ASCVD Risk Score</title><p>The 10-year ASCVD risk was assessed using the American College of Cardiology/American Heart Association pooled cohort equations (PCEs) risk score [<xref ref-type="bibr" rid="ref15">15</xref>]. They recommended that PCEs for non-Hispanic White people may be considered for risk estimation in populations other than non-Hispanic African American and non-Hispanic White people [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Therefore, the estimation function of the ASCVD risk score for the White population was used in this study. This score algorithm is designed to predict both the 10-year (40&#x2010;79 years of age) and lifetime (20&#x2010;59 years of age) risk of ASCVD. This includes the assessment of both fatal and nonfatal coronary heart disease and stroke [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. We categorized participants into two groups based on their 10-year ASCVD risk calculated using the PCEs: a low ASCVD risk group (ASCVD risk &#x003C;7.5%) and a high ASCVD risk group (ASCVD risk &#x2265;7.5%).</p></sec><sec id="s2-4"><title>Measurement of Lifestyle Risk Behaviors</title><p>The lifestyle risk behaviors analyzed in this study included sex, age, occupation, marital status, residential area, household income, alcohol consumption, smoking, omega-3 intake, sodium intake, BMI, weight change over 1 year, LDL cholesterol, physical activity, and time spent sitting. The occupation was classified into three categories of nonmanual workers, manual workers, and other workers. Marital status was separated and widowed, and divorced participants were assigned the no spouse status. The residential area was grouped as urban or rural areas. Alcohol consumption was divided into two categories, where participants drank at least 2 days per week and fewer than 2 days per week [<xref ref-type="bibr" rid="ref19">19</xref>], regardless of the amount of alcohol consumed. Individuals who had smoked at least 100 cigarettes in their lifetime and currently smoked were classified as smokers, whereas those who had smoked fewer than 100 cigarettes in their lifetime but did not currently smoke and never smoked in their lifetime were classified as nonsmokers. BMI was calculated as weight in kilograms divided by height in meters squared. Weight change over 1 year was classified into three categories of no weight change, weight gain, and weight loss. Using the criteria specified in the questionnaire, weight gains and losses of 0 to less than 3 kg over 1 year were classified as no change, gains of more than 3 kg as weight gain, and losses of more than 3 kg as weight loss. Physical activity was calculated using the sum of the minutes of exercise per week and considering the strength of the exercise intensity (vigorous and moderate). The combination of vigorous intensity and moderate intensity exercise was considered by calculating the minutes exercised per week as follows: 2&#x00D7;moderate activity (minutes per week)+vigorous activity (minutes per week) [<xref ref-type="bibr" rid="ref20">20</xref>]. &#x201C;Physically active&#x201D; is defined as engaging in at least 150 minutes of moderate activity per week [<xref ref-type="bibr" rid="ref21">21</xref>]. We used omega-3 or sodium intake in grams per day and time spent sitting in minutes per day, and these variables were entered into the ML model as continuous variables.</p></sec><sec id="s2-5"><title>Statistical Analysis</title><p>We categorized ASCVD risk into two groups: high and low risk. The ASCVD risk score itself is calculated using age and sex. Consequently, the high-risk and low-risk groups are inherently expected to differ significantly in these demographic factors by definition. In addition, our primary goal was to assess how lifestyle behaviors differ between high and low-risk individuals after accounting for nonmodifiable or less modifiable factors. Therefore, we performed 1:1 propensity score matching (PSM) based on sociodemographic characteristics to assess the impact of lifestyle behaviors on ASCVD risk.</p><p>The propensity score was calculated with the following variables: sex, age, job or marital status, residential area, and household income. In descriptive analyses of two-group comparisons, continuous variables were presented as median and IQR, and categorical variables were presented as proportions (%). Differences between high and low ASCVD groups were compared using the Mann-Whitney <italic>U</italic> test for continuous variables after a normality test, and the chi-square test for categorical variables.</p><p>We used 5 ML algorithms for the prediction of high ASCVD risk: logistic regression (LR), support vector machine, random forest (RF), extreme gradient boosting (XGB), and light gradient boosting (LGB) model. We specifically included ensemble methods, particularly RF, XGB, and LGB models. These ensemble ML models can effectively capture complex, nonlinear relationships and high-order interactions between various risk factors (eg, lifestyle, demographic, and clinical variables) without requiring explicit prespecification [<xref ref-type="bibr" rid="ref22">22</xref>]. In addition, they include built-in regularization techniques (like L1 and L2 penalties) to mitigate overfitting, a common concern with complex medical data [<xref ref-type="bibr" rid="ref23">23</xref>]. In the ML model, categorical variables (including sex [after PSM, though balanced], job category, marital status, residential area, alcohol consumption frequency category, smoking status, and weight change category) were retained in their original numeric coding format. Continuous variables (including age [after PSM], omega-3 intake, sodium intake, BMI, LDL cholesterol, and time spent sitting) were scaled to a range of [0, 1] using min-max normalization. In this study, we adopted a strict data separation strategy for model development and evaluation. First, the entire dataset was randomly partitioned into a training set (80%) and a test set (20%), and stratification was applied to the partitioning to ensure that both sets retained the same class distribution as the original data. We also fixed the random seed to ensure the reproducibility of the data. Then, we performed a 5-fold stratified cross-validation on the training dataset only. In this process, we divided the training data into five equal-sized folds and repeated it five times, using 4-fold for training and one for validation in each iteration. Based on the results of this cross-validation, the optimal model structure and hyperparameters with the lowest loss were selected. Hyperparameter optimization for each of the five ML models (LR, support vector machine, RF, XGB, and LGB) was performed using Optuna, an automated hyperparameter optimization framework [<xref ref-type="bibr" rid="ref24">24</xref>]. We used Optuna&#x2019;s Tree-structured Parzen Estimator sampler, a Bayesian optimization approach, to efficiently search for optimal hyperparameter combinations. For each model, optimization was conducted over 100 trials, aiming to minimize the loss obtained from the 5-fold cross-validation within the training dataset. The specific hyperparameters tuned for each model, their respective search spaces (eg, ranges for continuous parameters and choices for categorical parameters), and the final optimal configurations identified by Optuna and used for training are all detailed in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. We evaluated the final model using a separate test set (20% of the total data). This is to objectively measure the generalization performance of the model. To calculate CIs for the ML model&#x2019;s performance metrics, we used the bootstrapping method. The 95% CIs were calculated by repeating the bootstrapping samples 1000 times with 50% of the data as restoration extraction from the test dataset. Understanding the performance of ML models is becoming increasingly important, which highlights the growing significance of explainable artificial intelligence in interpreting model results. We used the SHapley Additive exPlanations (SHAP) value to visualize the importance and relationships among the input features of the model. In addition to the area under the receiver operating characteristics curve (AUROC) score, accuracy, precision, recall, <italic>F</italic><sub>1</sub>-score, specificity, and area under the precision-recall curve were calculated to assess the performance of the developed ML models.</p><p>We conducted a multivariable LR analysis as a sensitivity test to verify whether the ML model&#x2019;s findings on high ASCVD risk were consistent with conventional statistical methods. Univariable LR analysis was first performed on 1:1 matched patients (high vs low ASCVD risk) to identify lifestyle and sociodemographic factors associated with high ASCVD risk. Variables with a <italic>P</italic> value &#x003C;.05 in the univariable model were entered into the multivariable model, and their significance was reported as adjusted odds ratios with 95% CIs.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Baseline Characteristics</title><p>Of the 8573 participants, the proportion of the high ASCVD risk group was 41.7% (3578/8573), and 5059 (59%) participants were women (<xref ref-type="table" rid="table1">Table 1</xref>). As detailed in <xref ref-type="table" rid="table1">Table 1</xref>, prior to PSM, substantial baseline differences were evident across nearly all measured characteristics. Notably, the high ASCVD risk group was significantly older (median age 68.0, IQR 62.0-73.0 vs 51.0, IQR 45.0-58.0 y; <italic>P</italic>&#x003C;.001) and comprised a much higher proportion of men (61.9% vs 26%; <italic>P</italic>&#x003C;.001) compared to the low-risk group. Significant disparities also existed in socioeconomic factors (job distribution, marital status, residential area, and income) and various lifestyle behaviors, including higher rates of frequent alcohol consumption and smoking, lower omega-3 intake, higher BMI, lower physical activity levels, and differences in weight change patterns and sitting time (all <italic>P</italic>&#x2264;.02). The propensity score distribution and standardized differences before and after PSM for the variables used in propensity score calculation are presented in Figures S1 and S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Using the 1:1 PSM method, 1976 patients were included in the final population for analysis, ensuring no significant differences in sociodemographic variables between the two groups, except for lifestyle behaviors. Following 1:1 PSM, which successfully balanced the groups for key demographic and socioeconomic confounders (sex, age, job, marital status, residential area, and income; all <italic>P</italic>&#x003E;.20), several crucial differences in lifestyle behaviors remained statistically significant. Specifically, even after matching, the high ASCVD risk group demonstrated markedly higher rates of frequent alcohol consumption (25.3% vs 18.3 %; <italic>P</italic>&#x003C;.001) and current smoking (42.2% vs 6.3%; <italic>P</italic>&#x003C;.001). Furthermore, this group had significantly lower daily omega-3 intake (median 1.3, IQR 0.7-2.3 vs 1.5, IQR 0.9-2.6 g; <italic>P</italic>&#x003C;.001) and a higher BMI (median 25.1, IQR 23.2-27.3 vs 23.9, IQR 21.9-25.8 kg/m&#x00B2;; <italic>P</italic>&#x003C;.001). They also reported engaging in less physical activity (16.6% active vs 22% active; <italic>P</italic>=.003). Interestingly, the high-risk group reported slightly less time spent sitting compared to the low-risk group after matching (median 8, IQR 5-10 h per day; <italic>P</italic>=.003). Notably, the initial significant differences observed in sodium intake and LDL cholesterol levels before matching were no longer significant after PSM (<italic>P</italic>=.15 and <italic>P</italic>=.12, respectively), suggesting these factors were partly confounded by the demographic variables adjusted for in the matching process. The flowchart of participants is presented in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Comparison of baseline characteristics of high and low ASCVD<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> risk groups before and after propensity score matching.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variable</td><td align="left" valign="bottom" colspan="3">Before PSM<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="bottom" colspan="3">After PSM</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Low ASCVD risk group (n=4995)</td><td align="left" valign="top">High ASCVD group (n=3578)</td><td align="left" valign="top"><italic>P</italic> value</td><td align="left" valign="top">High ASCVD group (n=988)</td><td align="left" valign="top">Low ASCVD group (n=988)</td><td align="left" valign="top"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Gender (women), n (%)</td><td align="left" valign="top">3695 (74)</td><td align="left" valign="top">1364 (38.1)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">493 (49.9)</td><td align="left" valign="top">482 (48.8)</td><td align="left" valign="top">.65</td></tr><tr><td align="left" valign="top">Age (years), median (IQR)</td><td align="left" valign="top">51.0 (45.0&#x2010;58.0)</td><td align="left" valign="top">68.0 (62.0&#x2010;73.0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">59.0 (54.0&#x2010;65.0)</td><td align="left" valign="top">61.0 (52.0&#x2010;67.0)</td><td align="left" valign="top">.20</td></tr><tr><td align="left" valign="top" colspan="3">Job, n (%)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.62</td></tr><tr><td align="left" valign="top">&#x2003;Nonmanual workers</td><td align="left" valign="top">1886 (37.8)</td><td align="left" valign="top">1543 (43.1)</td><td align="left" valign="top"/><td align="left" valign="top">435 (44)</td><td align="left" valign="top">454 (46)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Other workers</td><td align="left" valign="top">1632 (32.7)</td><td align="left" valign="top">1641 (45.9)</td><td align="left" valign="top"/><td align="left" valign="top">355 (35.9)</td><td align="left" valign="top">350 (35.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Manual workers</td><td align="left" valign="top">1477 (29.6)</td><td align="left" valign="top">394 (11)</td><td align="left" valign="top"/><td align="left" valign="top">198 (20)</td><td align="left" valign="top">184 (18.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Marital status (without spouse), n (%)</td><td align="left" valign="top">867 (17.4)</td><td align="left" valign="top">922 (25.8)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">229 (23.2)</td><td align="left" valign="top">235 (23.8)</td><td align="left" valign="top">.36</td></tr><tr><td align="left" valign="top">Residential area (urban), n (%)</td><td align="left" valign="top">881 (17.6)</td><td align="left" valign="top">1001 (28)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">216 (21.9)</td><td align="left" valign="top">234 (23.7)</td><td align="left" valign="top">.93</td></tr><tr><td align="left" valign="top">Income (10,000 won per month), median (IQR)</td><td align="left" valign="top">492 (292&#x2010;700)</td><td align="left" valign="top">230 (109-450)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">360 (200&#x2010;614)</td><td align="left" valign="top">355 (193&#x2010;600)</td><td align="left" valign="top">.98</td></tr><tr><td align="left" valign="top">Alcohol drinking (&#x2265;2 per week), n (%)</td><td align="left" valign="top">839 (16.8)</td><td align="left" valign="top">873 (24.4)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">181 (18.3)</td><td align="left" valign="top">250 (25.3)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Smoking, n (%)</td><td align="left" valign="top">442 (8.8)</td><td align="left" valign="top">915 (25.6)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">62 (6.3)</td><td align="left" valign="top">417 (42.2)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Omega-3 intake (g per day), median (IQR)</td><td align="left" valign="top">1.4 (0.8&#x2010;2.3)</td><td align="left" valign="top">1.3 (0.7&#x2010;2.3)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">1.5 (0.9&#x2010;2.6)</td><td align="left" valign="top">1.3 (0.7&#x2010;2.3)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Sodium intake (g per day), median (IQR)</td><td align="left" valign="top">2.8 (1.9&#x2010;4.0)</td><td align="left" valign="top">2.9 (1.9&#x2010;4.2)</td><td align="left" valign="top">.02</td><td align="left" valign="top">3.1 (2.0&#x2010;4.2)</td><td align="left" valign="top">2.9 (2.0&#x2010;4.2)</td><td align="left" valign="top">.15</td></tr><tr><td align="left" valign="top">BMI (kg/m&#x00B2;), median (IQR)</td><td align="left" valign="top">23.5 (21.4&#x2010;25.9)</td><td align="left" valign="top">24.4 (22.5&#x2010;26.5)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">23.9 (21.9&#x2010;25.8)</td><td align="left" valign="top">25.1 (23.2&#x2010;27.3)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="3">Weight change over 1 year, n (%)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top">.14</td></tr><tr><td align="left" valign="top">&#x2003;Weight loss</td><td align="left" valign="top">528 (10.6)</td><td align="left" valign="top">506 (14.1)</td><td align="left" valign="top"/><td align="left" valign="top">116 (11.7)</td><td align="left" valign="top">121 (12.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;No weight change</td><td align="left" valign="top">3171 (63.5)</td><td align="left" valign="top">2584 (72.2)</td><td align="left" valign="top"/><td align="left" valign="top">703 (71.2)</td><td align="left" valign="top">666 (67.4)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Weight gain</td><td align="left" valign="top">1296 (25.9)</td><td align="left" valign="top">488 (13.6)</td><td align="left" valign="top"/><td align="left" valign="top">169 (17.1)</td><td align="left" valign="top">201 (20.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">LDL<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup> (mg/dL), median (IQR)</td><td align="left" valign="top">120 (97&#x2010;143)</td><td align="left" valign="top">110 (85&#x2010;135)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">114 (91&#x2010;139)</td><td align="left" valign="top">116 (92&#x2010;143)</td><td align="left" valign="top">.12</td></tr><tr><td align="left" valign="top">Physical activity, n (%)</td><td align="left" valign="top">1074 (21.5)</td><td align="left" valign="top">534 (14.9)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">217 (22)</td><td align="left" valign="top">164 (16.6)</td><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top">Time spent sitting (hours/day), median (IQR)</td><td align="left" valign="top">8.0 (5.0&#x2010;10.0)</td><td align="left" valign="top">8.0 (5.8&#x2010;11.0)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">8.0 (5.0&#x2010;10.0)</td><td align="left" valign="top">8.0 (5.7&#x2010;10.9)</td><td align="left" valign="top">.003</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>ASCVD: atherosclerotic cardiovascular disease.</p></fn><fn id="table1fn2"><p><sup>b</sup>PSM: propensity score matching.</p></fn><fn id="table1fn3"><p><sup>c</sup>LDL: low-density lipoprotein.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Flowchart of the participants. ASCVD: atherosclerotic cardiovascular disease; CVD: cardiovascular disease; KNHANES: Korea National Health and Nutrition Examination Survey; LDL: low-density lipoprotein.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e74415_fig01.png"/></fig></sec><sec id="s3-2"><title>Evaluation Outcomes: Performance of ML Model for ASCVD Risk</title><p>The 1976 matched patients were allocated to the training and test datasets in an 8:2 ratio while maintaining the same ASCVD risk proportion. A comparison of variables between these two groups is presented in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, showing no significant differences in variable distribution. <xref ref-type="fig" rid="figure2">Figure 2</xref> shows the result of ML performance for predicting high ASCVD risk in the test dataset, with XGB showing the highest AUROC (0.811, 95% CI, 0.748&#x2010;0.867). <xref ref-type="table" rid="table2">Table 2</xref> presents the other performances of the five ML models; the LGB model demonstrated the best performance, including accuracy, recall, and <italic>F</italic><sub>1</sub>-score. The high AUROC values achieved, particularly by XGB (0.811) and LGB (0.810), indicate valid discriminative power, suggesting these models are capable of effectively distinguishing between individuals at high versus low 10-year ASCVD risk based on the included lifestyle and clinical factors. Additionally, the LGB model achieved the highest recall (0.692), meaning it correctly identified approximately 69% of the high-risk individuals in the test set. The superior <italic>F</italic><sub>1</sub>-score (LGB 0.735) and area under the precision-recall curve score (LGB 0.829, XGB 0.828) in the test dataset showed the models&#x2019; robust performance, even in a real-world imbalanced dataset.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>The area under the receiver operating characteristics curve values for 5 machine learning models for predicting high atherosclerotic cardiovascular disease risk (&#x2265;7.5% of 10-year risk) in the test dataset. LGB: light gradient boosting; LR: logistic regression; RF: random forest; SVM: support vector machine; XGB: extreme gradient boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e74415_fig02.png"/></fig><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Overall performance of the 5 machine learning models for high ASCVD<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> risk prediction on the test dataset with propensity score matching<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup>.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">LR<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup> (95% CI)</td><td align="left" valign="bottom">SVM<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup> (95% CI)</td><td align="left" valign="bottom">RF<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup> (95% CI)</td><td align="left" valign="bottom">XGB<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup> (95% CI)</td><td align="left" valign="bottom">LGB<sup><xref ref-type="table-fn" rid="table2fn7">g</xref></sup> (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="top">Accuracy</td><td align="left" valign="top">0.730 (0.672&#x2010;0.788)</td><td align="left" valign="top">0.730 (0.672&#x2010;0.788)</td><td align="left" valign="top">0.732 (0.672&#x2010;0.793)</td><td align="left" valign="top">0.722 (0.662&#x2010;0.783)</td><td align="left" valign="top">0.750 (0.692&#x2010;0.808)</td></tr><tr><td align="left" valign="top">Precision</td><td align="left" valign="top">0.776 (0.701&#x2010;0.853)</td><td align="left" valign="top">0.827 (0.750&#x2010;0.901)</td><td align="left" valign="top">0.791 (0.714&#x2010;0.870)</td><td align="left" valign="top">0.768 (0.693&#x2010;0.846)</td><td align="left" valign="top">0.783 (0.711&#x2010;0.855)</td></tr><tr><td align="left" valign="top">Recall</td><td align="left" valign="top">0.646 (0.556&#x2010;0.737)</td><td align="left" valign="top">0.581 (0.485&#x2010;0.677)</td><td align="left" valign="top">0.631 (0.535&#x2010;0.727)</td><td align="left" valign="top">0.636 (0.535&#x2010;0.727)</td><td align="left" valign="top">0.692 (0.596&#x2010;0.778)</td></tr><tr><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.705 (0.630&#x2010;0.776)</td><td align="left" valign="top">0.682 (0.600&#x2010;0.757)</td><td align="left" valign="top">0.702 (0.624&#x2010;0.774)</td><td align="left" valign="top">0.696 (0.618&#x2010;0.767)</td><td align="left" valign="top">0.735 (0.663&#x2010;0.802)</td></tr><tr><td align="left" valign="top">AUROC<sup><xref ref-type="table-fn" rid="table2fn8">h</xref></sup></td><td align="left" valign="top">0.809 (0.748&#x2010;0.867)</td><td align="left" valign="top">0.800 (0.737&#x2010;0.859)</td><td align="left" valign="top">0.786 (0.720&#x2010;0.847)</td><td align="left" valign="top">0.811 (0.748&#x2010;0.867)</td><td align="left" valign="top">0.810 (0.749&#x2010;0.869)</td></tr><tr><td align="left" valign="top">Specificity</td><td align="left" valign="top">0.813 (0.737&#x2010;0.889)</td><td align="left" valign="top">0.879 (0.808&#x2010;0.939)</td><td align="left" valign="top">0.833 (0.758&#x2010;0.909)</td><td align="left" valign="top">0.808 (0.727&#x2010;0.879)</td><td align="left" valign="top">0.808 (0.727&#x2010;0.879)</td></tr><tr><td align="left" valign="top">AUPRC<sup><xref ref-type="table-fn" rid="table2fn9">i</xref></sup></td><td align="left" valign="top">0.811 (0.741&#x2010;0.881)</td><td align="left" valign="top">0.803 (0.730&#x2010;0.873)</td><td align="left" valign="top">0.805 (0.737&#x2010;0.868)</td><td align="left" valign="top">0.828 (0.766&#x2010;0.884)</td><td align="left" valign="top">0.829 (0.771&#x2010;0.886)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>ASCVD: atherosclerotic cardiovascular disease.</p></fn><fn id="table2fn2"><p><sup>b</sup>Data are represented as averaged value with 95% CI.</p></fn><fn id="table2fn3"><p><sup>c</sup>LR: logistic regression.</p></fn><fn id="table2fn4"><p><sup>d</sup>SVM: support vector machine.</p></fn><fn id="table2fn5"><p><sup>e</sup>RF: random forest.</p></fn><fn id="table2fn6"><p><sup>f</sup>XGB: extreme gradient boosting.</p></fn><fn id="table2fn7"><p><sup>g</sup>LGB: light gradient boosting.</p></fn><fn id="table2fn8"><p><sup>h</sup>AUROC: area under the receiver operating characteristics curve.</p></fn><fn id="table2fn9"><p><sup>i</sup>AUPRC: area under the precision-recall curve.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>Variable Importance in ML Model</title><p>To visualize the importance of variables included in the ML model, we presented SHAP values for the XGB model used to predict high ASCVD risk (<xref ref-type="fig" rid="figure3">Figure 3</xref>). Current smoking and age were the strongest predictors of high ASCVD risk over 10 years. Among lifestyle factors, BMI, sodium or omega-3 intake, and LDL cholesterol were also associated with increased risk. In contrast, factors such as &#x201C;time spent sitting,&#x201D; physical activity, sex, and marital status had a relatively smaller impact. The SHAP values for the LGB model, presented in Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, show a similar pattern of variable importance as the XGB model.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Variable importances of extreme gradient boosting models for high ASCVD risk in the test dataset. (A) Importance matrix plot showing the direction of the relationship between an input variable and high ASCVD risk. (B) Shapley Additive exPlanations summary plot of lifestyle variables predictive features of the ML model. As demonstrated by the color bar, higher values are shown in red, while lower values are shown in blue. ASCVD: atherosclerotic cardiovascular disease; LDL: low-density lipoprotein; ML: machine learning.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="medinform_v13i1e74415_fig03.png"/></fig></sec><sec id="s3-4"><title>Associations of Lifestyle Risk Factors With 10-Year ASCVD Risk</title><p>For sensitivity analysis, we examined whether the ML model&#x2019;s results were consistent with binary LR (<xref ref-type="table" rid="table3">Table 3</xref>) using high ASCVD risk as the outcome. Multivariable binary LR showed that smoking and BMI were positively associated with high ASCVD risk, while omega-3 intake and physical activity were significantly negatively associated. Compared to the SHAP values of the XGB and LGB models, factors such as smoking status, BMI, and omega-3 intake showed similar associations in the multivariable binary LR model.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Result of binary logistic regression analysis of lifestyle variables for predicting 10-year high ASCVD<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> risk in propensity score matched cohort.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variable</td><td align="left" valign="bottom" colspan="2">Univariable analysis</td><td align="left" valign="bottom" colspan="2">Multivariable analysis</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">OR<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> (95% CI)</td><td align="left" valign="top"><italic>P</italic> value</td><td align="left" valign="top">Adjusted OR (95% CI)</td><td align="left" valign="top"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Gender (women)</td><td align="left" valign="top">0.96 (0.80&#x2010;1.14)</td><td align="left" valign="top">.62</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Age (years)</td><td align="left" valign="top">1.01 (1.00&#x2010;1.02)</td><td align="left" valign="top">.20</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="5">Job</td></tr><tr><td align="left" valign="top">&#x2003;Manual workers</td><td align="left" valign="top">1.00 (reference)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">&#x2003;Nonmanual workers</td><td align="left" valign="top">1.12 (0.88&#x2010;1.43)</td><td align="left" valign="top">.34</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">&#x2003;Other workers</td><td align="left" valign="top">1.06 (0.83&#x2010;1.36)</td><td align="left" valign="top">.64</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Marital status (without spouse)</td><td align="left" valign="top">1.03 (0.84&#x2010;1.27)</td><td align="left" valign="top">.75</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Residential area (urban)</td><td align="left" valign="top">1.11 (0.90&#x2010;1.37)</td><td align="left" valign="top">.33</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Income (10,000 won per month)</td><td align="left" valign="top">1.00 (1.00&#x2010;1.00)</td><td align="left" valign="top">.98</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Alcohol drinking (&#x2265;2 per week)</td><td align="left" valign="top">1.51 (1.22&#x2010;1.87)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">0.89 (0.68&#x2010;1.15)</td><td align="left" valign="top">.37</td></tr><tr><td align="left" valign="top">Smoking</td><td align="left" valign="top">10.91 (8.19&#x2010;14.53)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">11.52 (8.20&#x2010;15.60)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Omega-3 intake (g per day)</td><td align="left" valign="top">0.93 (0.89&#x2010;0.97)</td><td align="left" valign="top">.003</td><td align="left" valign="top">0.93 (0.88&#x2010;0.98)</td><td align="left" valign="top">.01</td></tr><tr><td align="left" valign="top">Sodium intake (g per day)</td><td align="left" valign="top">1.00 (1.00&#x2010;1.00)</td><td align="left" valign="top">.97</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">BMI (kg/m<sup>2</sup>)</td><td align="left" valign="top">1.13 (1.10&#x2010;1.17)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">1.13 (1.09&#x2010;1.16)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="5">Weight change over 1 year</td></tr><tr><td align="left" valign="top">&#x2003;Weight loss</td><td align="left" valign="top">1.00 (reference)</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">&#x2003;No weight change</td><td align="left" valign="top">0.91 (0.69&#x2010;1.20)</td><td align="left" valign="top">.49</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">&#x2003;Weight gain</td><td align="left" valign="top">1.14 (0.82&#x2010;1.58)</td><td align="left" valign="top">.43</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">LDL<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup> (mg/dL)</td><td align="left" valign="top">1.00 (1.00&#x2010;1.01)</td><td align="left" valign="top">.04</td><td align="left" valign="top">1.00 (1.00&#x2010;1.00)</td><td align="left" valign="top">.67</td></tr><tr><td align="left" valign="top">Physical activity</td><td align="left" valign="top">0.71 (0.56&#x2010;0.89)</td><td align="left" valign="top">.003</td><td align="left" valign="top">0.61 (0.47&#x2010;0.79)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Time spent sitting (hours per day)</td><td align="left" valign="top">1.00 (1.00&#x2010;1.00)</td><td align="left" valign="top">.003</td><td align="left" valign="top">1.00 (1.00&#x2010;1.00)</td><td align="left" valign="top">.42</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>ASCVD: atherosclerotic cardiovascular disease.</p></fn><fn id="table3fn2"><p><sup>b</sup>OR: odds ratio.</p></fn><fn id="table3fn3"><p><sup>c</sup>Not applicable.</p></fn><fn id="table3fn4"><p><sup>d</sup>LDL: low-density lipoprotein.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study assessed the performance of ML models, including XGB and LGB, in predicting 10-year high ASCVD risk in adults and identifying key risk factors. After adjusting for confounders using PSM, both models demonstrated high AUROC values, with LGB outperforming in accuracy, recall, and <italic>F</italic><sub>1</sub>-score. Variable importance analysis identified smoking and age as the strongest predictors, while BMI, sodium or omega-3 intake, and LDL cholesterol also had significant variables. Multivariable LR also confirmed these findings, showing that smoking, BMI, and LDL cholesterol increased ASCVD risk, whereas omega-3 intake and physical activity were associated with lower risk.</p><p>Age is associated with increased oxidative stress, which leads to an increased susceptibility to CVD onset [<xref ref-type="bibr" rid="ref25">25</xref>]. Excessive generation of reactive oxygen species leads to a state of oxidative stress, which is a major risk factor for the development and progression of atherosclerosis [<xref ref-type="bibr" rid="ref26">26</xref>]. Aging is an unmodifiable ASCVD risk factor, but it can be prevented if other factors can be corrected. Cigarette smoking is widely accepted as a major risk factor for the development of clinical CVD, resulting from direct effects on atherosclerosis. Epidemiologic studies strongly support that cigarette smoking in both men and women increases the incidence of myocardial infarction and fatal coronary artery disease [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>Cigarette smoking is widely accepted as a major risk factor for the development of clinical CVD, resulting from direct effects on atherosclerosis. Epidemiologic studies strongly support that cigarette smoking in both men and women increases the incidence of myocardial infarction and fatal coronary artery disease [<xref ref-type="bibr" rid="ref29">29</xref>]. Because the chemical constituents of smoke have high oxidant and inflammatory capacities, they can directly induce endothelial damage and potentiate an inflammatory response [<xref ref-type="bibr" rid="ref30">30</xref>]. Smoke is able to increase LDL levels through metabolic alterations and the induction of LDL oxidation due to the direct oxidant capacity of smoke components [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. Obesity has been linked to persistent inflammation and oxidative stress. Oxidative stress plays a crucial role in disorders related to obesity, such as dyslipidemia and hypertension, causing CVDs [<xref ref-type="bibr" rid="ref32">32</xref>]. The prevalence of overweight and obesity has been strongly increasing over the last few decades, and it is considered to be one of the largest challenges for public health work worldwide [<xref ref-type="bibr" rid="ref33">33</xref>].</p><p>Interestingly, some lifestyle factors commonly associated with cardiovascular health, such as sodium intake and time spent sitting, showed weaker associations with high ASCVD risk in our final models after adjusting for confounders. For instance, while sodium intake was significantly different between groups before PSM, this difference did not persist after matching, and it did not emerge as a strong predictor in the multivariable LR or the SHAP analyses for the ML models. Similarly, &#x201C;time spent sitting&#x201D; did not demonstrate a strong independent association in the multivariable LR model (<italic>P</italic>=.42) despite being significant in the univariable analysis and showing a difference post-PSM. Furthermore, its importance ranking in the SHAP analyses was relatively low. The lack of a strong independent association between sitting time and ASCVD risk may reflect collinearity with physical activity, limitations in the variable&#x2019;s definition (eg, failure to capture prolonged uninterrupted sitting), potential inaccuracies in self-reported data, and residual confounding suggested by the unexpected postmatching trend.</p><p>The American Heart Association has recently outlined a new framework that focuses on defining and optimizing cardiovascular health through the adoption of 8 simple health components: healthy diet, engaging in regular physical activity, avoidance of nicotine, healthy sleep, and healthy levels of blood lipids, glucose, and blood pressure [<xref ref-type="bibr" rid="ref34">34</xref>]. Most clinical guidelines for the primary or secondary prevention of ASCVD emphasize the importance of lifestyle modification. These lifestyle changes are also an important part of public health policy for CVD prevention. Therefore, a lifestyle approach to ASCVD risk may be important for accurate prediction and prioritization of treatment strategies for prevention.</p><p>Beyond simply ranking variable importance, the application of SHAP analysis provides crucial granular insights into how individual factors contribute to the predicted ASCVD risk for each patient, offering significant advantages over traditional &#x201C;black-box&#x201D; models. Our SHAP results (<xref ref-type="fig" rid="figure3">Figure 3</xref> and Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) confirm that current smoking and age are not just important, but consistently exert the strongest positive influence toward a high-risk prediction across the cohort. The magnitude of the positive SHAP values associated with current smoking underscores its overwhelming impact, reinforcing the paramount importance of smoking cessation as a primary prevention strategy from a clinical standpoint. Similarly, the consistent positive contribution of increasing age highlights the nonmodifiable baseline upon which lifestyle interventions must act. Furthermore, the SHAP visualizations offer nuances beyond simple correlation. Especially, higher omega-3 intake consistently generated negative SHAP values, indicating its protective effect by lowering the predicted risk score. While LDL cholesterol&#x2019;s influence appeared less dominant after PSM in the LR, SHAP analysis still identified it as a contributor, potentially highlighting its relevance within the complex interplay captured by the ML model.</p></sec><sec id="s4-2"><title>Limitations</title><p>This study has several limitations. First, it is a cross-sectional study, which does not allow for establishing causal relationships. While our ML models identify strong associations and predictive patterns (eg, smoking status being highly predictive of high ASCVD risk), this design prevents us from definitively concluding that altering a specific lifestyle factor will cause a change in ASCVD risk. For instance, the model might show that higher omega-3 intake is associated with lower predicted risk, but we cannot ascertain from this data alone whether increasing omega-3 intake would directly lead to a reduction in an individual&#x2019;s true risk, or if the association is partly due to other unmeasured confounding factors linked to both omega-3 intake and cardiovascular health. This limitation significantly impacts the direct translation of our ML model&#x2019;s findings, particularly the feature importance results (like SHAP values), into prescriptive clinical actions. Second, some variables were measured by questionnaire, which may lead to underestimation or overestimation for the prediction of ASCVD risk. Especially in the case of nutrition, it is particularly difficult to accurately reflect daily intake. Third, the study involved a secondary analysis of data from the KNHANES, so it was not possible to include all lifestyle and socioeconomic status variables in the analysis. Finally, we excluded 1908 participants (approximately 18% of the initially eligible cohort after age screening) due to missing data on one or more key analytical variables (sodium intake, LDL-cholesterol, time spent sitting, etc). This exclusion was based on a complete case analysis approach, meaning only participants with complete records for all variables used in the models were included. Multiple imputation techniques could potentially allow for the inclusion of this population and might mitigate some of the selection bias. Future studies should investigate the impact of handling missing data via multiple imputation compared to complete case analysis, specifically assessing potential improvement in the performance metrics of the developed ML models. Nevertheless, the strength of this study is that it used representative and reliable data from KNHANES to predict modifiable lifestyle risk factors using an ML approach.</p></sec><sec id="s4-3"><title>Conclusions</title><p>This study demonstrates that ML models are effective tools for assessing ASCVD risk and highlights the significant impact of lifestyle factors such as smoking, BMI, and omega-3 intake. These findings highlight the significant clinical informatics potential for integrating the developed interpretable ML models into electronic health records, clinical decision support tools, and digital health platforms to enable dynamic, personalized ASCVD risk assessment and guide targeted lifestyle interventions within routine clinical practice. Longitudinal studies are needed to establish causal links between the identified lifestyle factors and ASCVD development in a multiethnic population. Furthermore, additional measures of lifestyle with wearable devices could enhance the clinical utility of the ML model.</p></sec></sec></body><back><ack><p>This research was supported by a grant of the Korea Health Technology R&#x0026;D Project through the Korea Health Industry Development Institute (KHIDI), funded by the Ministry of Health &#x0026; Welfare, Republic of Korea (grant HR21C0198), and by a grant of the Korea Health Technology R&#x0026;D Project through the KHIDI; funded by the Ministry of Health &#x0026; Welfare, Republic of Korea (grant: RS-2022-KH129707); supported by "&#x201C;Regional Innovation Strategy (RIS)"&#x201D; through the National Research Foundation of Korea funded by the Ministry of Education (2022RIS-005) and supported by Hallym University Research Fund.</p></ack><fn-group><fn fn-type="con"><p>HJK designed the study and prepared the manuscript. HC, HJA, and SHS collected data and literature search. CK drafted the manuscript. SHL, JHS, and JJL conducted data analysis. All authors carried out critical review and approved the final manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ASCVD</term><def><p>atherosclerotic cardiovascular disease</p></def></def-item><def-item><term id="abb2">AUROC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb3">CVD</term><def><p>cardiovascular disease</p></def></def-item><def-item><term id="abb4">KDCA</term><def><p>Korea Disease Control and Prevention Agency</p></def></def-item><def-item><term id="abb5">KNHANES</term><def><p>Korea National Health and Nutrition Examination Survey</p></def></def-item><def-item><term id="abb6">LDL</term><def><p>low-density lipoprotein</p></def></def-item><def-item><term id="abb7">LGB</term><def><p>light gradient boosting</p></def></def-item><def-item><term id="abb8">LR</term><def><p>logistic regression</p></def></def-item><def-item><term id="abb9">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb10">PCE</term><def><p>pooled cohort equation</p></def></def-item><def-item><term id="abb11">PSM</term><def><p>propensity score matching</p></def></def-item><def-item><term id="abb12">RF</term><def><p>random forest</p></def></def-item><def-item><term id="abb13">SHAP</term><def><p>SHapley Additive exPlanations</p></def></def-item><def-item><term id="abb14">XGB</term><def><p>extreme gradient boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weir</surname><given-names>HK</given-names> </name><name name-style="western"><surname>Anderson</surname><given-names>RN</given-names> </name><name name-style="western"><surname>Coleman King</surname><given-names>SM</given-names> </name><etal/></person-group><article-title>Heart disease and cancer deaths&#x2014;trends and projections in the United States, 1969-2020</article-title><source>Prev Chronic Dis</source><year>2016</year><month>11</month><day>17</day><volume>13</volume><fpage>E157</fpage><pub-id pub-id-type="doi">10.5888/pcd13.160211</pub-id><pub-id pub-id-type="medline">27854420</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roth</surname><given-names>GA</given-names> </name><name name-style="western"><surname>Mensah</surname><given-names>GA</given-names> </name><name name-style="western"><surname>Johnson</surname><given-names>CO</given-names> </name><etal/></person-group><article-title>Global burden of cardiovascular diseases and risk factors, 1990-2019: update from the GBD 2019 study</article-title><source>J Am Coll Cardiol</source><year>2020</year><month>12</month><day>22</day><volume>76</volume><issue>25</issue><fpage>2982</fpage><lpage>3021</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2020.11.010</pub-id><pub-id pub-id-type="medline">33309175</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>HC</given-names> </name></person-group><article-title>Epidemiology of cardiovascular disease and its risk factors in Korea</article-title><source>Global Health Med</source><year>2021</year><month>06</month><day>30</day><volume>3</volume><issue>3</issue><fpage>134</fpage><lpage>141</lpage><pub-id pub-id-type="doi">10.35772/ghm.2021.01008</pub-id><pub-id pub-id-type="medline">34250288</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>HH</given-names> </name><name name-style="western"><surname>Cho</surname><given-names>SMJ</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Korea heart disease fact sheet 2020: analysis of nationwide data</article-title><source>Korean Circ J</source><year>2021</year><month>06</month><volume>51</volume><issue>6</issue><fpage>495</fpage><lpage>503</lpage><pub-id pub-id-type="doi">10.4070/kcj.2021.0097</pub-id><pub-id pub-id-type="medline">34085422</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Poznyak</surname><given-names>AV</given-names> </name><name name-style="western"><surname>Sadykhov</surname><given-names>NK</given-names> </name><name name-style="western"><surname>Kartuesov</surname><given-names>AG</given-names> </name><etal/></person-group><article-title>Hypertension as a risk factor for atherosclerosis: cardiovascular risk assessment</article-title><source>Front Cardiovasc Med</source><year>2022</year><volume>9</volume><fpage>959285</fpage><pub-id pub-id-type="doi">10.3389/fcvm.2022.959285</pub-id><pub-id pub-id-type="medline">36072873</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Devareddy</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sarraju</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rodriguez</surname><given-names>F</given-names> </name></person-group><article-title>Health disparities across the continuum of ASCVD risk</article-title><source>Curr Cardiol Rep</source><year>2022</year><month>09</month><volume>24</volume><issue>9</issue><fpage>1129</fpage><lpage>1137</lpage><pub-id pub-id-type="doi">10.1007/s11886-022-01736-y</pub-id><pub-id pub-id-type="medline">35788894</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mollborn</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lawrence</surname><given-names>EM</given-names> </name><name name-style="western"><surname>Hummer</surname><given-names>RA</given-names> </name></person-group><article-title>A gender framework for understanding health lifestyles</article-title><source>Soc Sci Med</source><year>2020</year><month>11</month><volume>265</volume><fpage>113182</fpage><pub-id pub-id-type="doi">10.1016/j.socscimed.2020.113182</pub-id><pub-id pub-id-type="medline">32942201</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rajendran</surname><given-names>A</given-names> </name><name name-style="western"><surname>Minhas</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Kazzi</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Sex-specific differences in cardiovascular risk factors and implications for cardiovascular disease prevention in women</article-title><source>Atherosclerosis</source><year>2023</year><month>11</month><volume>384</volume><fpage>117269</fpage><pub-id pub-id-type="doi">10.1016/j.atherosclerosis.2023.117269</pub-id><pub-id pub-id-type="medline">37752027</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lloyd-Jones</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Braun</surname><given-names>LT</given-names> </name><name name-style="western"><surname>Ndumele</surname><given-names>CE</given-names> </name><etal/></person-group><article-title>Use of risk assessment tools to guide decision-making in the primary prevention of atherosclerotic cardiovascular disease: a special report from the American Heart Association and American College of Cardiology</article-title><source>J Am Coll Cardiol</source><year>2019</year><month>06</month><day>25</day><volume>73</volume><issue>24</issue><fpage>3153</fpage><lpage>3167</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2018.11.005</pub-id><pub-id pub-id-type="medline">30423392</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dalakoti</surname><given-names>M</given-names> </name><name name-style="western"><surname>Virani</surname><given-names>S</given-names> </name></person-group><article-title>Lifelong prevention of atherosclerotic cardiovascular disease (ASCVD) through LDL-C control&#x2014;means and cost/benefit of sustained very low lifetime LDL-C targets</article-title><source>Am J Prev Cardiol</source><year>2024</year><month>09</month><volume>19</volume><fpage>100720</fpage><pub-id pub-id-type="doi">10.1016/j.ajpc.2024.100720</pub-id><pub-id pub-id-type="medline">39252855</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shamout</surname><given-names>F</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Clifton</surname><given-names>DA</given-names> </name></person-group><article-title>Machine learning for clinical outcome prediction</article-title><source>IEEE Rev Biomed Eng</source><year>2020</year><month>07</month><day>7</day><volume>14</volume><fpage>116</fpage><lpage>126</lpage><pub-id pub-id-type="doi">10.1109/RBME.2020.3007816</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nakanishi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Slomka</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Rios</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Machine learning adds to clinical and CAC assessments in predicting 10-year CHD and CVD deaths</article-title><source>JACC Cardiovasc Imaging</source><year>2021</year><month>03</month><volume>14</volume><issue>3</issue><fpage>615</fpage><lpage>625</lpage><pub-id pub-id-type="doi">10.1016/j.jcmg.2020.08.024</pub-id><pub-id pub-id-type="medline">33129741</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cho</surname><given-names>SY</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Kang</surname><given-names>SH</given-names> </name><etal/></person-group><article-title>Pre-existing and machine learning-based models for cardiovascular risk prediction</article-title><source>Sci Rep</source><year>2021</year><month>04</month><day>26</day><volume>11</volume><issue>1</issue><fpage>8886</fpage><pub-id pub-id-type="doi">10.1038/s41598-021-88257-w</pub-id><pub-id pub-id-type="medline">33903629</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Connelly</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Azizi</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Alipour</surname><given-names>P</given-names> </name><name name-style="western"><surname>Delles</surname><given-names>C</given-names> </name><name name-style="western"><surname>Pilote</surname><given-names>L</given-names> </name><name name-style="western"><surname>Raparelli</surname><given-names>V</given-names> </name></person-group><article-title>The importance of gender to understand sex differences in cardiovascular disease</article-title><source>Can J Cardiol</source><year>2021</year><month>05</month><volume>37</volume><issue>5</issue><fpage>699</fpage><lpage>710</lpage><pub-id pub-id-type="doi">10.1016/j.cjca.2021.02.005</pub-id><pub-id pub-id-type="medline">33592281</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goff</surname><given-names>DC</given-names>  <suffix>Jr</suffix></name><name name-style="western"><surname>Lloyd-Jones</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Bennett</surname><given-names>G</given-names> </name><etal/></person-group><article-title>2013 ACC/AHA guideline on the assessment of cardiovascular risk: a report of the American College of Cardiology/American Heart Association task force on practice guidelines</article-title><source>Circulation</source><year>2014</year><month>06</month><day>24</day><volume>129</volume><issue>25 Suppl 2</issue><fpage>S49</fpage><lpage>73</lpage><pub-id pub-id-type="doi">10.1161/01.cir.0000437741.48606.98</pub-id><pub-id pub-id-type="medline">24222018</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wong</surname><given-names>ND</given-names> </name><name name-style="western"><surname>Budoff</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Ferdinand</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Atherosclerotic cardiovascular disease risk assessment: an American Society for Preventive Cardiology clinical practice statement</article-title><source>Am J Prev Cardiol</source><year>2022</year><month>06</month><volume>10</volume><fpage>100335</fpage><pub-id pub-id-type="doi">10.1016/j.ajpc.2022.100335</pub-id><pub-id pub-id-type="medline">35342890</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lloyd-Jones</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Braun</surname><given-names>LT</given-names> </name><name name-style="western"><surname>Ndumele</surname><given-names>CE</given-names> </name><etal/></person-group><article-title>Use of risk assessment tools to guide decision-making in the primary prevention of atherosclerotic cardiovascular disease: a special report from the American Heart Association and American College of Cardiology</article-title><source>Circulation</source><year>2019</year><month>06</month><day>18</day><volume>139</volume><issue>25</issue><fpage>e1162</fpage><lpage>e1177</lpage><pub-id pub-id-type="doi">10.1161/CIR.0000000000000638</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mortensen</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Fuster</surname><given-names>V</given-names> </name><name name-style="western"><surname>Muntendam</surname><given-names>P</given-names> </name><etal/></person-group><article-title>A simple disease-guided approach to personalize ACC/AHA-recommended statin allocation in elderly people: the bioimage study</article-title><source>J Am Coll Cardiol</source><year>2016</year><month>08</month><day>30</day><volume>68</volume><issue>9</issue><fpage>881</fpage><lpage>891</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2016.05.084</pub-id><pub-id pub-id-type="medline">27561760</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>HK</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>BH</given-names> </name></person-group><article-title>The epidemiology of alcohol use disorders</article-title><source>J Korean Diabetes</source><year>2012</year><volume>13</volume><issue>2</issue><fpage>69</fpage><pub-id pub-id-type="doi">10.4093/jkd.2012.13.2.69</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lopez</surname><given-names>JPR</given-names> </name><name name-style="western"><surname>Sabag</surname><given-names>A</given-names> </name><name name-style="western"><surname>Juan</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Rezende</surname><given-names>LFM</given-names> </name><name name-style="western"><surname>Pastor-Valero</surname><given-names>M</given-names> </name></person-group><article-title>Do vigorous-intensity and moderate-intensity physical activities reduce mortality to the same extent? A systematic review and meta-analysis</article-title><source>BMJ Open Sport Exerc Med</source><year>2020</year><month>10</month><volume>6</volume><issue>1</issue><fpage>e000775</fpage><pub-id pub-id-type="doi">10.1136/bmjsem-2020-000775</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nelson</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Rejeski</surname><given-names>WJ</given-names> </name><name name-style="western"><surname>Blair</surname><given-names>SN</given-names> </name><etal/></person-group><article-title>Physical activity and public health in older adults: recommendation from the American College of Sports Medicine and the American Heart Association</article-title><source>Circulation</source><year>2007</year><month>08</month><day>28</day><volume>116</volume><issue>9</issue><fpage>1094</fpage><lpage>1105</lpage><pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.107.185650</pub-id><pub-id pub-id-type="medline">17671236</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shaikh</surname><given-names>TA</given-names> </name><name name-style="western"><surname>Rasool</surname><given-names>T</given-names> </name><name name-style="western"><surname>Verma</surname><given-names>P</given-names> </name><name name-style="western"><surname>Mir</surname><given-names>WA</given-names> </name></person-group><article-title>A fundamental overview of ensemble deep learning models and applications: systematic literature and state of the art</article-title><source>Ann Oper Res</source><year>2024</year><pub-id pub-id-type="doi">10.1007/s10479-024-06444-0</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Afsaneh</surname><given-names>E</given-names> </name><name name-style="western"><surname>Sharifdini</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ghazzaghi</surname><given-names>H</given-names> </name><name name-style="western"><surname>Ghobadi</surname><given-names>MZ</given-names> </name></person-group><article-title>Recent applications of machine learning and deep learning models in the prediction, diagnosis, and management of diabetes: a comprehensive review</article-title><source>Diabetol Metab Syndr</source><year>2022</year><month>12</month><day>27</day><volume>14</volume><issue>1</issue><fpage>196</fpage><pub-id pub-id-type="doi">10.1186/s13098-022-00969-9</pub-id><pub-id pub-id-type="medline">36572938</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Akiba</surname><given-names>T</given-names> </name><name name-style="western"><surname>Sano</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yanase</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ohta</surname><given-names>T</given-names> </name><name name-style="western"><surname>Koyama</surname><given-names>M</given-names> </name></person-group><article-title>Optuna: a next-generation hyperparameter optimization framework</article-title><conf-name>Proceedings of the 25th ACM SIGKDD iNternational Conference on Knowledge Discovery &#x0026; Data Mining</conf-name><conf-date>Aug 4-8, 2019</conf-date><conf-loc>Anchorage, AK, USA</conf-loc><fpage>2623</fpage><lpage>2631</lpage><pub-id pub-id-type="doi">10.1145/3292500.3330701</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jebari-Benslaiman</surname><given-names>S</given-names> </name><name name-style="western"><surname>Galicia-Garc&#x00ED;a</surname><given-names>U</given-names> </name><name name-style="western"><surname>Larrea-Sebal</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Pathophysiology of atherosclerosis</article-title><source>IJMS</source><year>2022</year><month>03</month><day>20</day><volume>23</volume><issue>6</issue><fpage>3346</fpage><pub-id pub-id-type="doi">10.3390/ijms23063346</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Man</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Beckman</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Jaffe</surname><given-names>IZ</given-names> </name></person-group><article-title>Sex as a biological variable in atherosclerosis</article-title><source>Circ Res</source><year>2020</year><month>04</month><day>24</day><volume>126</volume><issue>9</issue><fpage>1297</fpage><lpage>1319</lpage><pub-id pub-id-type="doi">10.1161/CIRCRESAHA.120.315930</pub-id><pub-id pub-id-type="medline">32324497</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rodgers</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Jones</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bolleddu</surname><given-names>SI</given-names> </name><etal/></person-group><article-title>Cardiovascular risks associated with gender and aging</article-title><source>J Cardiovasc Dev Dis</source><year>2019</year><month>04</month><day>27</day><volume>6</volume><issue>2</issue><fpage>19</fpage><pub-id pub-id-type="doi">10.3390/jcdd6020019</pub-id><pub-id pub-id-type="medline">31035613</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Batty</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bennett</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>E</given-names> </name></person-group><article-title>The role of oxidative stress in atherosclerosis</article-title><source>Cells</source><year>2022</year><month>11</month><day>30</day><volume>11</volume><issue>23</issue><fpage>3843</fpage><pub-id pub-id-type="doi">10.3390/cells11233843</pub-id><pub-id pub-id-type="medline">36497101</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gallucci</surname><given-names>G</given-names> </name><name name-style="western"><surname>Tartarone</surname><given-names>A</given-names> </name><name name-style="western"><surname>Lerose</surname><given-names>R</given-names> </name><name name-style="western"><surname>Lalinga</surname><given-names>AV</given-names> </name><name name-style="western"><surname>Capobianco</surname><given-names>AM</given-names> </name></person-group><article-title>Cardiovascular risk of smoking and benefits of smoking cessation</article-title><source>J Thorac Dis</source><year>2020</year><month>07</month><volume>12</volume><issue>7</issue><fpage>3866</fpage><lpage>3876</lpage><pub-id pub-id-type="doi">10.21037/jtd.2020.02.47</pub-id><pub-id pub-id-type="medline">32802468</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Higashi</surname><given-names>Y</given-names> </name></person-group><article-title>Smoking cessation and vascular endothelial function</article-title><source>Hypertens Res</source><year>2023</year><month>12</month><volume>46</volume><issue>12</issue><fpage>2670</fpage><lpage>2678</lpage><pub-id pub-id-type="doi">10.1038/s41440-023-01455-z</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>C</given-names> </name><name name-style="western"><surname>Lei</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>Cigarette smoking exposure breaks the homeostasis of cholesterol and bile acid metabolism and induces gut microbiota dysbiosis in mice with different diets</article-title><source>Toxicology</source><year>2021</year><month>02</month><day>28</day><volume>450</volume><fpage>152678</fpage><pub-id pub-id-type="doi">10.1016/j.tox.2021.152678</pub-id><pub-id pub-id-type="medline">33440193</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>H</given-names> </name><name name-style="western"><surname>Xia</surname><given-names>N</given-names> </name></person-group><article-title>The interplay between adipose tissue and vasculature: role of oxidative stress in obesity</article-title><source>Front Cardiovasc Med</source><year>2021</year><month>03</month><day>4</day><volume>8</volume><fpage>650214</fpage><pub-id pub-id-type="doi">10.3389/fcvm.2021.650214</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ni</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Global prevalence of overweight and obesity in children and adolescents: a systematic review and meta-analysis</article-title><source>JAMA Pediatr</source><year>2024</year><month>08</month><day>1</day><volume>178</volume><issue>8</issue><fpage>800</fpage><lpage>813</lpage><pub-id pub-id-type="doi">10.1001/jamapediatrics.2024.1576</pub-id><pub-id pub-id-type="medline">38856986</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kris-Etherton</surname><given-names>PM</given-names> </name><name name-style="western"><surname>Petersen</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Despr&#x00E9;s</surname><given-names>JP</given-names> </name><etal/></person-group><article-title>Strategies for promotion of a healthy lifestyle in clinical settings: pillars of ideal cardiovascular health: a science advisory from the American Heart Association</article-title><source>Circulation</source><year>2021</year><month>12</month><day>14</day><volume>144</volume><issue>24</issue><fpage>e495</fpage><lpage>e514</lpage><pub-id pub-id-type="doi">10.1161/CIR.0000000000001018</pub-id><pub-id pub-id-type="medline">34689589</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Supplementary figures and tables.</p><media xlink:href="medinform_v13i1e74415_app1.docx" xlink:title="DOCX File, 372 KB"/></supplementary-material></app-group></back></article>