<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Cardio</journal-id><journal-id journal-id-type="publisher-id">cardio</journal-id><journal-id journal-id-type="index">26</journal-id><journal-title>JMIR Cardio</journal-title><abbrev-journal-title>JMIR Cardio</abbrev-journal-title><issn pub-type="epub">2561-1011</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e68066</article-id><article-id pub-id-type="doi">10.2196/68066</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Machine Learning Model for Predicting Coronary Heart Disease Risk: Development and Validation Using Insights From a Japanese Population&#x2013;Based Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Vu</surname><given-names>Thien</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kokubo</surname><given-names>Yoshihiro</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Inoue</surname><given-names>Mai</given-names></name><degrees>ME</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yamamoto</surname><given-names>Masaki</given-names></name><degrees>BE</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mohsen</surname><given-names>Attayeb</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Martin-Morales</surname><given-names>Agustin</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Dawadi</surname><given-names>Research</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Inoue</surname><given-names>Takao</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Tay</surname><given-names>Jie Ting</given-names></name><degrees>MRES</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yoshizaki</surname><given-names>Mari</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Watanabe</surname><given-names>Naoki</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kuriya</surname><given-names>Yuki</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Matsumoto</surname><given-names>Chisa</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Arafa</surname><given-names>Ahmed</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff8">8</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Nakao</surname><given-names>Yoko M</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kato</surname><given-names>Yuka</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff9">9</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Teramoto</surname><given-names>Masayuki</given-names></name><degrees>MD, MPH</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Araki</surname><given-names>Michihiro</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff10">10</xref><xref ref-type="aff" rid="aff11">11</xref></contrib></contrib-group><aff id="aff1"><institution>Artificial Intelligence Center for Health and Biomedical Research, National Institutes of Biomedical Innovation, Health and Nutrition</institution><addr-line>3-17 Senrioka-shinmachi</addr-line><addr-line>Osaka</addr-line><country>Japan</country></aff><aff id="aff2"><institution>NCD Epidemiology Research Center, Shiga University of Medical Science, Shiga</institution><addr-line>Otsu</addr-line><country>Japan</country></aff><aff id="aff3"><institution>Department of Cardiac Surgery, Cardiovascular Center, Cho Ray Hospital</institution><addr-line>Ho Chi Minh City</addr-line><country>Vietnam</country></aff><aff id="aff4"><institution>Department of Preventive Cardiology, National Cerebral and Cardiovascular Center</institution><addr-line>Suita, Osaka</addr-line><country>Japan</country></aff><aff id="aff5"><institution>Libyan Centre for Dental Research</institution><addr-line>Zliten</addr-line><country>Libya</country></aff><aff id="aff6"><institution>Faculty of Informatics, Yamato University</institution><addr-line>Osaka</addr-line><country>Japan</country></aff><aff id="aff7"><institution>Department of Cardiology, Center for Health Surveillance and Preventive Medicine, Tokyo Medical University Hospital</institution><addr-line>Tokyo</addr-line><country>Japan</country></aff><aff id="aff8"><institution>Department of Public Health, Faculty of Medicine, Beni-Suef University</institution><addr-line>Beni-Suef</addr-line><country>Egypt</country></aff><aff id="aff9"><institution>Division of Health Sciences, Osaka University Graduate School of Medicine</institution><addr-line>Suita, Osaka</addr-line><country>Japan</country></aff><aff id="aff10"><institution>Graduate School of Medicine, Kyoto University</institution><addr-line>Kyoto</addr-line><country>Japan</country></aff><aff id="aff11"><institution>Graduate School of Science, Technology and Innovation, Kobe University</institution><addr-line>Kobe</addr-line><country>Japan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Gasmi</surname><given-names>Maha</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Nomali</surname><given-names>Mahin</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Misra</surname><given-names>Neeladri</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Thien Vu, MD, PhD, Artificial Intelligence Center for Health and Biomedical Research, National Institutes of Biomedical Innovation, Health and Nutrition, 3-17 Senrioka-shinmachi, Osaka, 566-0002, Japan, 81 8093069457; <email>thienvuyd01@gmail.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>12</day><month>5</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e68066</elocation-id><history><date date-type="received"><day>29</day><month>10</month><year>2024</year></date><date date-type="rev-recd"><day>03</day><month>02</month><year>2025</year></date><date date-type="accepted"><day>24</day><month>02</month><year>2025</year></date></history><copyright-statement>&#x00A9; Thien Vu, Yoshihiro Kokubo, Mai Inoue, Masaki Yamamoto, Attayeb Mohsen, Agustin Martin-Morales, Research Dawadi, Takao Inoue, Jie Ting Tay, Mari Yoshizaki, Naoki Watanabe, Yuki Kuriya, Chisa Matsumoto, Ahmed Arafa, Yoko M Nakao, Yuka Kato, Masayuki Teramoto, Michihiro Araki. Originally published in JMIR Cardio (<ext-link ext-link-type="uri" xlink:href="https://cardio.jmir.org">https://cardio.jmir.org</ext-link>), 12.5.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Cardio, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://cardio.jmir.org">https://cardio.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://cardio.jmir.org/2025/1/e68066"/><abstract><sec><title>Background</title><p>Coronary heart disease (CHD) is a major cause of morbidity and mortality worldwide. Identifying key risk factors is essential for effective risk assessment and prevention. A data-driven approach using machine learning (ML) offers advanced techniques to analyze complex, nonlinear, and high-dimensional datasets, uncovering novel predictors of CHD that go beyond the limitations of traditional models, which rely on predefined variables.</p></sec><sec><title>Objective</title><p>This study aims to evaluate the contribution of various risk factors to CHD, focusing on both established and novel markers using ML techniques.</p></sec><sec sec-type="methods"><title>Methods</title><p>The study recruited 7672 participants aged 30-84 years from Suita City, Japan, between 1989 and 1999. Over an average of 15 years, participants were monitored for cardiovascular events. A total of 7260 participants and 28 variables were included in the analysis after excluding individuals with missing outcome data and eliminating unnecessary variables. Five ML models&#x2014;logistic regression, random forest (RF), support vector machine, Extreme Gradient Boosting, and Light Gradient-Boosting Machine&#x2014;were applied for predicting CHD incidence. Model performance was evaluated using accuracy, sensitivity, specificity, precision, area under the curve, <italic>F</italic><sub>1</sub>-score, calibration curves, observed-to-expected ratios, and decision curve analysis. Additionally, Shapley Additive Explanations (SHAPs) were used to interpret the prediction models and understand the contribution of various risk factors to CHD.</p></sec><sec sec-type="results"><title>Results</title><p>Among 7260 participants, 305 (4.2%) were diagnosed with CHD. The RF model demonstrated the highest performance, with an accuracy of 0.73 (95% CI 0.64&#x2010;0.80), sensitivity of 0.74 (95% CI 0.62&#x2010;0.84), specificity of 0.72 (95% CI 0.61&#x2010;0.83), and an area under the curve of 0.73 (95% CI 0.65&#x2010;0.80). RF also showed excellent calibration, with predicted probabilities closely aligning with observed outcomes, and provided substantial net benefit across a range of risk thresholds, as demonstrated by decision curve analysis. SHAP analysis elucidated key predictors of CHD, including the intima-media thickness (IMT_cMax) of the common carotid artery, blood pressure, lipid profiles (non&#x2013;high-density lipoprotein cholesterol, high-density lipoprotein cholesterol, and triglycerides), and estimated glomerular filtration rate. Novel risk factors identified as significant contributors to CHD risk included lower calcium levels, elevated white blood cell counts, and body fat percentage. Furthermore, a protective effect was observed in women, suggesting the potential necessity for gender-specific risk assessment strategies in future cardiovascular health evaluations.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>We developed a model to predict CHD using ML and applied SHAP methods for interpretation. This approach highlights the multifactor nature of CHD risk evaluation, aiming to support health care professionals in identifying risk factors and formulating effective prevention strategies.</p></sec></abstract><kwd-group><kwd>coronary heart disease</kwd><kwd>machine learning</kwd><kwd>logistic regression</kwd><kwd>random forest</kwd><kwd>support vector machine</kwd><kwd>Extreme Gradient Boosting</kwd><kwd>Light Gradient-Boosting Machine</kwd><kwd>Shapley Additive Explanations</kwd><kwd>CHD</kwd><kwd>SVM</kwd><kwd>XGBoost</kwd><kwd>LightGBM</kwd><kwd>SHAP</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Coronary heart disease (CHD) remains a leading cause of morbidity and mortality worldwide, responsible for approximately 9.14 million deaths in 2019 [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Early identification of individuals at high risk is crucial, as timely interventions can significantly reduce the likelihood of severe outcomes like heart attacks and strokes. Studies have shown that early prediction and intervention can lead to a notable reduction in CHD-related mortality through preventive treatments such as statins and lifestyle changes [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. While conventional risk assessment models have been used, there is growing recognition of the potential of machine learning (ML) in enhancing CHD prediction [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>ML algorithms have proven their ability to analyze complex data and identify intricate patterns and relationships that are not easily detected by traditional statistical methods [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. By integrating diverse data sources, such as demographics, medical history, lifestyle habits, and diagnostic findings, these algorithms can predict the likelihood of developing CHD. This approach offers comprehensive risk evaluation, adaptability to new data, and the potential to uncover novel risk factors and disease mechanisms [<xref ref-type="bibr" rid="ref11">11</xref>].</p><p>Several studies have demonstrated the effectiveness of ML models in deriving quantitative markers for coronary artery disease and predicting the presence of heart disease. For example, a study developed and validated a coronary artery disease&#x2013;predictive ML model using electronic health records and assessed its probabilities as in silico scores for coronary artery disease in participants in 2 longitudinal biobank cohorts [<xref ref-type="bibr" rid="ref12">12</xref>]. Another study applied an ensemble ML model for coronary disease prediction, using ML classifiers to predict heart disease [<xref ref-type="bibr" rid="ref13">13</xref>]. These findings highlight the potential of ML in driving innovation and improving the accuracy of CHD diagnosis and prediction [<xref ref-type="bibr" rid="ref14">14</xref>].</p><p>However, challenges exist in utilizing ML for CHD prediction, including data quality, feature selection, model interpretability, and generalizability. These issues must be carefully addressed to ensure the reliability and robustness of the predictive models. Rigorous validation, regulatory compliance, and effective communication strategies are essential for its successful integration into clinical practice.</p><p>While several established CHD prediction models rely on traditional statistical techniques with predefined risk factors, they are limited by linear assumptions and struggle with complex, high-dimensional datasets. This restricts their ability to uncover novel or subtle risk factors. In contrast, ML models can handle these complexities, offering more nuanced and accurate predictions by identifying nonlinear interactions and discovering previously overlooked factors. Therefore, ML may enhance the overall understanding of CHD and improve both risk assessment and prevention strategies.</p><p>This study aimed to address the role of ML techniques in predicting incident CHD and identifying novel risk factors. This study sought to deepen our understanding of the factors contributing to CHD development by analyzing a comprehensive dataset. These findings will enhance risk assessment, enabling the development of personalized interventions and preventive strategies.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design and Participants</title><p>The Suita Study, a prospective population-based cohort study, was conducted in Suita City, Osaka, Japan. From 1989 to 1999, a total of 7672 men and women aged 30-84 years who did not have a previous history of cardiovascular disease were recruited for the study. Participants were selected from the population registry of the municipality and were followed up every 2 years for an average of 15 years until their first occurrence of stroke, myocardial infarction (MI), death, or relocation.</p><p>After excluding participants with missing outcome data and removing unnecessary variables, the analysis included 7260 participants and 28 variables. Opt-out procedures were implemented for those who preferred not to participate in this study. Informed consent was obtained from all participants at the time of enrollment. The study followed the Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis or Diagnosis and Artificial Intelligence (TRIPOD+AI) statement guidelines for reporting prediction models in medicine, and we have added the completed checklist in <xref ref-type="supplementary-material" rid="app4">Checklist 1</xref> [<xref ref-type="bibr" rid="ref15">15</xref>].</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>The study was conducted in compliance with the ethical standards outlined in the Declaration of Helsinki, and approval was granted by the Institutional Review Board at the National Cerebral and Cardiovascular Center (approval R21024-2). As this study involves secondary data analysis, it is important to note that the original informed consent, obtained during the primary data collection, permits the use of the data for secondary analyses without requiring additional consent from participants. Participants&#x2019; privacy was protected by anonymizing or deidentifying the data to prevent identification.</p></sec><sec id="s2-3"><title>Outcome</title><p>The primary outcome was CHD, including MI, sudden death within 24 hours of acute illness onset, and coronary artery disease requiring bypass surgery or intervention. Medical records were carefully reviewed by hospital doctors or researchers who were blinded to the baseline data to provide an unbiased approach to the analysis. MIs were classified as definite or probable according to the criteria established by the MONICA Project [<xref ref-type="bibr" rid="ref16">16</xref>].</p><p>Every 2 years, each participant&#x2019;s health was evaluated at the National Cerebral and Cardiovascular Center in Osaka, Japan, to detect the occurrence of CHD. Yearly questionnaires were also completed by all participants by mail or telephone. CHD surveillance was completed by systematically searching for death certificates [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>].</p></sec><sec id="s2-4"><title>Predictors</title><p>Predictors were measured at baseline and processed according to a standardized protocol. A comprehensive and prospective data collection process was implemented, encompassing various aspects such as demographics, medical history, medical imaging, laboratory data, lifestyle habits, and outcomes.</p><sec id="s2-4-1"><title>Blood Pressure and Physical Measurements</title><p>Blood pressure was measured in each participant using a mercury column sphygmomanometer, an appropriately sized cuff, and a standardized protocol to ensure accuracy and precision [<xref ref-type="bibr" rid="ref17">17</xref>]. Before the initial blood pressure reading, the participants were instructed to rest for at least 5 minutes to establish a stable baseline. Blood pressure readings were obtained by averaging the second and third measurements, which were performed at intervals of more than 1 minute to allow for adequate observation and recording. Hypertension was defined as systolic blood pressure &#x2265;140 mm Hg, diastolic blood pressure &#x2265;90 mm Hg, or the use of antihypertensive medications.</p><p>BMI was calculated as weight (kg) divided by the square of height (m<sup>2</sup>).</p></sec><sec id="s2-4-2"><title>Biochemical Measurements</title><p>At baseline, routine blood tests were conducted, including measurements of total cholesterol, high-density lipoprotein cholesterol (HDL-c), and fasting glucose levels. Non-HDL-c was calculated by subtracting HDL-c from total cholesterol. Diabetes mellitus was diagnosed if participants had fasting plasma glucose (FPG) &#x2265;126 mg/dL, a non-FPG &#x2265;200 mg/dL, or the use of diabetes mellitus medication.</p><p>The estimated glomerular filtration rate (eGFR; mL/min/1.73 m<sup>2</sup>) was calculated according to the original Modification of Diet in Renal Disease equation modified by the Japanese coefficient (0.881) as follows: 0.881&#x00D7;186&#x00D7;serum creatinine<sup>&#x2212;1.154</sup> &#x00D7; age<sup>&#x2212;0.203</sup> &#x00D7; (0.742 if female) [<xref ref-type="bibr" rid="ref19">19</xref>].</p></sec><sec id="s2-4-3"><title>Imaging Diagnostics</title><p>Carotid artery measurements were performed using a high-resolution ultrasound machine to assess atherosclerotic indices, specifically intima-media thickness (IMT), on both sides of the common carotid artery (CCA), carotid artery bulb, internal carotid artery, and external carotid artery. The maximum IMT in the CCA (IMT_cMax) was defined as the highest measurable IMT in the scanned CCA regions, while the maximum IMT (IMT_MAX) was the highest measurable IMT across the entire scanned area, including the CCA, bulb, internal carotid artery, and external carotid artery on both sides [<xref ref-type="bibr" rid="ref20">20</xref>].</p><p>Atrial fibrillation was checked by standard 12-lead ECGs from all participants and was determined by well-trained physicians [<xref ref-type="bibr" rid="ref18">18</xref>].</p></sec><sec id="s2-4-4"><title>Lifestyle and Medical History</title><p>Smoking status and drinking statuses were categorized as current, quit, or never. A questionnaire was used to ask participants about their past and present history of CHD.</p></sec></sec><sec id="s2-5"><title>Sample Size</title><p>All available data were used, and no formal sample size calculation was performed. The dataset included 7260 participants, among whom 305 had CHD, with 28 predictors selected after the feature selection process used in the model. Based on the events per predictor ratio, which is approximately 10.89 (305/28), the sample size is sufficient to ensure model stability and reliability [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Therefore, this dataset is adequate to answer the research questions.</p></sec><sec id="s2-6"><title>Missing Data</title><p>Missing data analysis was conducted, and variables with more than 30% missing values were excluded to enhance model robustness. Missing data were imputed using Multivariate Imputation by Chained Equations. See <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for details on the percentage of missing data for each variable before imputation.</p></sec><sec id="s2-7"><title>Statistical Analysis Methods</title><sec id="s2-7-1"><title>Descriptive Analysis</title><p>Continuous variables were summarized using means and SDs for normally distributed data, or medians and IQR for nonnormally distributed data. Categorical variables were reported as frequencies and percentages. To compare differences in patient characteristics based on CHD incidence (yes or no), we used various statistical tests including 2-tailed Student <italic>t</italic> tests, Mann&#x2012;Whitney <italic>U</italic> tests, or chi-square tests, as appropriate.</p></sec><sec id="s2-7-2"><title>Feature Selection</title><p>Feature selection was conducted in a stepwise manner to ensure that only the most relevant variables were included in the predictive models. Initially, variables with more than 30% missing data were excluded to avoid potential bias from imputation. Following this, a correlation matrix was used to identify and remove variables with high multicollinearity, defined as having a correlation coefficient greater than 0.8. See correlation coefficients heat map in the <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> for details. The next step involved applying the least absolute shrinkage and selection operator regression. This technique shrinks the coefficients of less significant predictors toward zero, effectively removing them from the model, and was performed using cross-validation to identify the most important features based on the data. Finally, after statistical feature selection, medical knowledge was applied to confirm the clinical relevance of the remaining variables. Important predictors such as age, glucose levels, HDL-c, and blood pressure were retained, given their established association with CHD. The list of variables (predictors) used for model development was described in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p></sec></sec><sec id="s2-8"><title>Development of ML Models</title><sec id="s2-8-1"><title>Overview</title><p>The goal of this analysis was to predict the incidence of CHD using ML models and examine the contribution of each risk factor to the CHD incidence. A comprehensive process was followed, which included descriptive analysis, feature selection, model training, hyperparameter optimization, and interpretability through Shapley Additive Explanation (SHAP) values.</p><p>To manage the imbalance between CHD and non-CHD cases, we used down sampling on the majority class (non-CHD) to create a balanced dataset. This approach helps to ensure that the models do not disproportionately favor the majority class during training, improving prediction performance on the minority class.</p><p>The dataset was split into training (80%) and testing (20%) sets while maintaining balanced target variable distributions across both. Next, one-hot encoding was applied to convert categorical variables into a binary format, and normalization was performed to scale numerical features.</p><p>Several ML algorithms were implemented to compare their predictive power. Logistic regression (LR) was used as a baseline model, offering simplicity and interpretability [<xref ref-type="bibr" rid="ref23">23</xref>]. Random forest (RF), an ensemble learning method, was used due to its strength in handling high-dimensional data and offering feature-importance insights [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Support vector machines (SVMs) with radial basis kernels were used for their effectiveness in nonlinear classification tasks [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. Extreme Gradient Boosting (XGBoost) is an ML algorithm that improves model performance by using a series of decision trees, where each tree corrects the mistakes of the previous one. This sequential approach helps make predictions more accurate. Light Gradient-Boosting Machine (LightGBM) is another efficient algorithm that works similarly to XGBoost but is designed to be faster and more scalable, especially when working with large datasets and many features. Both algorithms are known for their high performance in handling complex data and large-scale problems [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref27">27</xref>].</p></sec><sec id="s2-8-2"><title>Model Evaluation</title><p>We used 5-fold cross-validation during model training to ensure robustness and mitigate overfitting. Hyperparameter optimization was conducted using a grid search approach. The model&#x2019;s performance on the testing set was evaluated using 5 metrics: accuracy, sensitivity, specificity, precision, area under the curve (AUC), and <italic>F</italic><sub>1</sub>-score [<xref ref-type="bibr" rid="ref15">15</xref>].</p><p>Calibration plots are used to evaluate the predictive accuracy of ML models in estimating CHD incidence. Calibration measures how closely the predicted absolute risk corresponds to the observed (true) risk across groups of patients categorized into different risk levels. The overall observed-to-expected (OE) ratio is calculated by dividing the total observed events by the total expected events for the entire population. For each decile, the OE ratio is determined by dividing the observed events within that decile by the expected events for the same decile. An ideal model is represented by a straight line bisecting the calibration plot, with an OE ratio of 1, indicating perfect calibration. An OE ratio &#x003C;1 suggests overprediction, while a ratio &#x003E;1 indicates underprediction [<xref ref-type="bibr" rid="ref15">15</xref>].</p><p>Decision curve analysis (DCA) assesses the clinical use of ML models for predicting CHD incidence. DCA uses net benefit as a metric, reflecting the tradeoff between true-positive and false-positive predictions for a specific strategy [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>].</p></sec><sec id="s2-8-3"><title>Model Interpretation</title><p>SHAP is a method used in ML to make the predictions of a model more understandable. It helps explain how each input feature (such as age, cholesterol levels, or blood pressure) affects the model&#x2019;s decision. Essentially, SHAP breaks down the prediction to show how much each feature contributes to the final result, allowing us to see which factors are most important for predicting a condition like CHD [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. SHAP summary plots visualized the importance of key features, while SHAP dependence plots highlighted the non-linear relationships between features and CHD incidence.</p></sec></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Study Participants&#x2019; Characteristics</title><p>In this study, 7260 participants were analyzed, of which 305 (4.2%) were diagnosed with CHD. The median age of participants with CHD was 63 (IQR 56-71) years , which was significantly older than that of those without CHD, whose median age was 55 (IQR 44-65) years. CHD was more prevalent in men (n=202, 66.2%) compared to women (n=103, 33.8%), and this gender difference was statistically significant.</p><p>Several cardiovascular risk factors were also associated with CHD. Participants with CHD had higher systolic and diastolic blood pressures. The eGFR was lower in participants with CHD compared to those without. The IMT of CCAs, IMT_cMax, was also significantly higher in patients with CHD (1.10 mm vs 1.00 mm; <italic>P</italic>&#x003C;.001).</p><p>BMI and waist circumference were also higher in participants with CHD, indicating a greater degree of obesity. Additionally, lipid profiles showed significant differences, with lower HDL-c levels and higher non-HDL-c and triglyceride levels in patients with CHD.</p><p>Higher glucose levels and white blood cell counts were observed in participants with CHD, along with elevated hemoglobin levels. Regarding lifestyle factors, smoking was more common in those with CHD, while drinking status did not differ significantly between the 2 groups.</p><p>Regarding lifestyle factors, current smoking was more prevalent among participants with CHD (36.1% vs 29.0%; <italic>P</italic>&#x003C;.001), while drinking status did not significantly differ between the groups.</p><p>In terms of comorbidities, atrial fibrillation, hypertension, diabetes mellitus, and dyslipidemia were all significantly more common in participants with CHD, as outlined in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Characteristics of study participants with and without CHD<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> incidence (Japanese participants aged 30&#x2010;84 years, Suita Study). CHD was diagnosed by a first-ever acute myocardial infarction, sudden cardiac death within 24 hours of illness, or coronary artery disease followed by bypass or angioplasty. Values are presented as mean (SD) for continuous variables with approximately normally distribution or by median (IQR) with skewed distribution and n (%) for categorical variables. Differences in characteristics were evaluated by using the unpaired 2-tailed Student <italic>t</italic> test, Wilcoxon rank sums test, or chi-square test.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom" colspan="2">CHD</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="top">No (n=6955)</td><td align="left" valign="top">Yes (n=305)</td><td align="left" valign="bottom"/></tr></thead><tbody><tr><td align="left" valign="top">Age (years), median (IQR)</td><td align="left" valign="top">55.0 (44.0-65.0)</td><td align="left" valign="top">63.0 (56.0-71.0)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="3">Sex, n (%)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">3147 (45.2)</td><td align="left" valign="top">202 (66.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">3808 (54.8)</td><td align="left" valign="top">103 (33.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">SBP<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> (mm Hg), median (IQR)</td><td align="left" valign="top">123 (110-137)</td><td align="left" valign="top">138 (125-153)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">DBP<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup> (mm Hg), median (IQR)</td><td align="left" valign="top">77.0 (70.0-85.0)</td><td align="left" valign="top">83.0 (74.0-89.0)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">IMT_cMax<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup> (mm), median (IQR)</td><td align="left" valign="top">1.00 (0.80-1.10)</td><td align="left" valign="top">1.10 (1.00-1.30)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">eGFR<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup> (mL/min/1.73 m&#x00B2;), mean (SD)</td><td align="left" valign="top">104 (32.2)</td><td align="left" valign="top">95.3 (63.3)</td><td align="left" valign="top">.014</td></tr><tr><td align="left" valign="top">BMI (kg/m&#x00B2;), mean (SD)</td><td align="left" valign="top">22.5 (3.10)</td><td align="left" valign="top">23.3 (3.26)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Body fat (%), mean (SD)</td><td align="left" valign="top">23.2 (6.32)</td><td align="left" valign="top">22.6 (7.06)</td><td align="left" valign="top">.15</td></tr><tr><td align="left" valign="top">Waist circumference (cm), median (IQR)</td><td align="left" valign="top">80.0 (73.0-86.0)</td><td align="left" valign="top">83.0 (77.0-90.0)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">HDL-c<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup> (mg/dL), median (IQR)</td><td align="left" valign="top">53.0 (44.0-63.0)</td><td align="left" valign="top">46.0 (38.0-56.0)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">non-HDL-c (mg/dL), mean (SD)</td><td align="left" valign="top">152 (36.9)</td><td align="left" valign="top">172 (40.5)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Triglycerides (mg/dL), median (IQR)</td><td align="left" valign="top">98.0 (70.0-143)</td><td align="left" valign="top">121 (90.0-174)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Calcium (mg/dL), mean (SD)</td><td align="left" valign="top">9.35 (0.46)</td><td align="left" valign="top">9.34 (0.43)</td><td align="left" valign="top">.61</td></tr><tr><td align="left" valign="top">Fructosamine (&#x03BC;mol/L), median (IQR)</td><td align="left" valign="top">251 (237-266)</td><td align="left" valign="top">257 (242-276)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Glucose (mg/dL), median (IQR)</td><td align="left" valign="top">95.0 (89.0-101)</td><td align="left" valign="top">100 (93.0-109)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">WBC<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup> count (/mm&#x00B3;), median (IQR)</td><td align="left" valign="top">5.33 (4.48-6.36)</td><td align="left" valign="top">5.65 (4.81-6.78)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">RBC<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup> count (10&#x00B3;/mm&#x00B3;), mean (SD)</td><td align="left" valign="top">4.53 (0.44)</td><td align="left" valign="top">4.60 (0.46)</td><td align="left" valign="top">.008</td></tr><tr><td align="left" valign="top" colspan="3">Smoking status, n (%)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Current</td><td align="left" valign="top">2019 (29)</td><td align="left" valign="top">110 (36.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Past</td><td align="left" valign="top">1091 (15.7)</td><td align="left" valign="top">79 (25.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Never</td><td align="left" valign="top">3845 (55.3)</td><td align="left" valign="top">116 (38)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="3">Drinking status, n (%)</td><td align="left" valign="top">.27</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Current</td><td align="left" valign="top">3613 (51.9)</td><td align="left" valign="top">152 (49.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Past</td><td align="left" valign="top">156 (2.24)</td><td align="left" valign="top">11 (3.61)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Never</td><td align="left" valign="top">3186 (45.8)</td><td align="left" valign="top">142 (46.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Atrial fibrillation, n (%)</td><td align="left" valign="top">123 (1.77)</td><td align="left" valign="top">20 (6.56)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Hypertension, n (%)</td><td align="left" valign="top">2056 (29.6)</td><td align="left" valign="top">172 (56.4)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Diabetes mellitus, n (%)</td><td align="left" valign="top">426 (6.13)</td><td align="left" valign="top">49 (16.1)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Dyslipidemia, n (%)</td><td align="left" valign="top">5280 (75.9)</td><td align="left" valign="top">265 (86.9)</td><td align="left" valign="top">&#x003C;.001</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>CHD: coronary heart disease.</p></fn><fn id="table1fn2"><p><sup>b</sup>SBP: systolic blood pressure.</p></fn><fn id="table1fn3"><p><sup>c</sup>DBP: diastolic blood pressure.</p></fn><fn id="table1fn4"><p><sup>d</sup>IMT_cMax: maximum intima-media thickness of common carotid arteries.</p></fn><fn id="table1fn5"><p><sup>e</sup>eGFR: estimated glomerular filtration rate.</p></fn><fn id="table1fn6"><p><sup>f</sup>HDL-c: high-density lipoprotein cholesterol.</p></fn><fn id="table1fn7"><p><sup>g</sup>WBC: white blood cell.</p></fn><fn id="table1fn8"><p><sup>h</sup>RBC: red blood cell.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Model Performance</title><p>The performance metrics of the 5 ML models used in our CHD prediction study provide valuable insights into their effectiveness, as shown in <xref ref-type="table" rid="table2">Table 2</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Performance metrics and 95% CIs for machine learning models predicting CHD<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> incidence (Japanese participants, aged 30&#x2010;84 years, Suita Study).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom">Sensitivity</td><td align="left" valign="bottom">Specificity</td><td align="left" valign="bottom">Precision</td><td align="left" valign="bottom">AUC<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td></tr></thead><tbody><tr><td align="left" valign="top">LR<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="top">0.66 (0.58&#x2010;0.75)</td><td align="left" valign="top">0.59 (0.46&#x2010;0.71)</td><td align="left" valign="top">0.74 (0.62&#x2010;0.84)</td><td align="left" valign="top">0.69 (0.55&#x2010;0.81)</td><td align="left" valign="top">0.66 (0.57&#x2010;0.75)</td><td align="left" valign="top">0.64 (0.52&#x2010;0.73)</td></tr><tr><td align="left" valign="top">RF<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup></td><td align="left" valign="top">0.73 (0.64&#x2010;0.80)</td><td align="left" valign="top">0.74 (0.62&#x2010;0.84)</td><td align="left" valign="top">0.72 (0.61&#x2010;0.83)</td><td align="left" valign="top">0.73 (0.61&#x2010;0.84)</td><td align="left" valign="top">0.73 (0.65&#x2010;0.80)</td><td align="left" valign="top">0.73 (0.64&#x2010;0.82)</td></tr><tr><td align="left" valign="top">SVM<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup></td><td align="left" valign="top">0.71 (0.62&#x2010;0.80)</td><td align="left" valign="top">0.70 (0.59&#x2010;0.81)</td><td align="left" valign="top">0.72 (0.62&#x2010;0.83)</td><td align="left" valign="top">0.72 (0.60&#x2010;0.84)</td><td align="left" valign="top">0.71 (0.63&#x2010;0.79)</td><td align="left" valign="top">0.71 (0.61&#x2010;0.80)</td></tr><tr><td align="left" valign="top">XGBoost<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup></td><td align="left" valign="top">0.72 (0.64&#x2010;0.80)</td><td align="left" valign="top">0.74 (0.63&#x2010;0.84)</td><td align="left" valign="top">0.70 (0.58&#x2010;0.82)</td><td align="left" valign="top">0.71 (0.60&#x2010;0.82)</td><td align="left" valign="top">0.72 (0.64&#x2010;0.80)</td><td align="left" valign="top">0.73 (0.63&#x2010;0.81)</td></tr><tr><td align="left" valign="top">LightGBM<sup><xref ref-type="table-fn" rid="table2fn7">g</xref></sup></td><td align="left" valign="top">0.50 (0.43&#x2010;0.58)</td><td align="left" valign="top">1.00 (1.00&#x2010;1.00)</td><td align="left" valign="top">0.00 (0.00&#x2010;0.00)</td><td align="left" valign="top">0.50 (0.41&#x2010;0.59)</td><td align="left" valign="top">0.5 (0.49&#x2010;0.57)</td><td align="left" valign="top">0.67 (0.58&#x2010;0.74)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>CHD: coronary heart disease.</p></fn><fn id="table2fn2"><p><sup>b</sup>AUC: area under the curve.</p></fn><fn id="table2fn3"><p><sup>c</sup>LR: logistic regression.</p></fn><fn id="table2fn4"><p><sup>d</sup>RF: random forest.</p></fn><fn id="table2fn5"><p><sup>e</sup>SVM: support vector machine.</p></fn><fn id="table2fn6"><p><sup>f</sup>XGBoost: Extreme Gradient Boosting.</p></fn><fn id="table2fn7"><p><sup>g</sup>LightGBM: Light Gradient-Boosting Machine.</p></fn></table-wrap-foot></table-wrap><p>RF emerged as the strongest model for CHD prediction in this study, achieving the highest overall performance with an accuracy of 0.73 (95% CI 0.64&#x2010;0.80), sensitivity of 0.74 (95% CI 0.62&#x2010;0.84), specificity of 0.72 (95% CI 0.61&#x2010;0.83), and an AUC of 0.73 (95% CI 0.65&#x2010;0.80). These results highlight its balanced ability to identify both CHD and non-CHD cases effectively. In comparison, XGBoost delivered robust, yet slightly inferior, results with an accuracy of 0.72 (95% CI 0.64&#x2010;0.80), sensitivity of 0.74 (95% CI 0.63&#x2010;0.84), specificity of 0.70 (95% CI 0.58&#x2010;0.82), an AUC of 0.72 (95% CI 0.64&#x2010;0.80), and an <italic>F</italic><sub>1</sub>-score of 0.73 (95% CI 0.63&#x2010;0.81). SVM demonstrated competitive performance, achieving an AUC of 0.71 (95% CI 0.63&#x2010;0.79), but ranked slightly behind RF and XGBoost. In contrast, LightGBM, despite its perfect sensitivity of 1.00 (95% CI 1.00&#x2010;1.00), showed a specificity of 0.00 (95% CI 0.00&#x2010;0.00) and an AUC of 0.50 (95% CI 0.49&#x2010;0.57), rendering it unsuitable for this task. LR, while serving as a baseline model, exhibited moderate performance with an accuracy of 0.66 (95% CI 0.58&#x2010;0.75), sensitivity of 0.59 (95% CI 0.46&#x2010;0.71), specificity of 0.74 (95% CI 0.62&#x2010;0.84), and an AUC of 0.66 (95% CI 0.57&#x2010;0.75), but lacked the sensitivity required for effective CHD prediction.</p><p>The calibration curves for the 5 models (<xref ref-type="fig" rid="figure1">Figure 1</xref>) and the OE ratios by decile (<xref ref-type="fig" rid="figure2">Figure 2</xref>) provide critical insights into their predictive reliability. Among the models, RF demonstrated excellent calibration, with predicted probabilities closely aligning with observed outcomes across all deciles. This strong calibration is complemented by its performance in DCA (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Calibration plots for machine learning models predicting CHD incidence (Japanese participants, aged 30&#x2010;84 years, Suita Study). CHD: coronary heart disease; LightGBM: Light Gradient-Boosting Machine; XGBoost: Extreme Gradient Boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e68066_fig01.png"/></fig><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Calibration plots displaying observed-to-expected ratios for each decile of predicted CHD incidence risk (Japanese participants, aged 30&#x2010;84 years, Suita Study). CHD: coronary heart disease; LightGBM: Light Gradient-Boosting Machine; SVM: support vector machine; XGBoost: Extreme Gradient Boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e68066_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Decision curve analysis comparing machine learning models for predicting CHD incidence (Japanese participants, aged 30&#x2010;84 years, Suita Study). CHD: coronary heart disease; LightGBM: Light Gradient-Boosting Machine; XGBoost: Extreme Gradient Boosting.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e68066_fig03.png"/></fig><p>In terms of clinical use, as illustrated in <xref ref-type="fig" rid="figure3">Figure 3</xref>, all models exhibit a similar positive net benefit when the threshold is below 0.5, meaning that using the predictive models is better than not using any model (treat none). However, when the threshold exceeds 0.5, the models tend to decline rapidly, with LR and XGBoost showing the most pronounced decrease, declining earlier compared to the other models.</p><p>Based on the performance metrics, RF emerges as the best model for CHD prediction in this study due to its highest overall accuracy, balanced sensitivity and specificity, strong AUC, excellent calibration, and robust clinical use across various threshold probabilities.</p></sec><sec id="s3-3"><title>Model Interpretation</title><p>In <xref ref-type="fig" rid="figure4">Figure 4</xref>, the bar plot on the left ranks the top features contributing to CHD prediction, with IMT_cMax identified as the most influential variable, followed by systolic blood pressure (SBP), HDL-c, non-HDL-c, and eGFR. This ranking emphasizes the significance of arterial health, blood pressure regulation, lipid levels, and kidney function in assessing CHD risk. The SHAP summary heat plot on the right provides a detailed visualization of how each feature influences individual model predictions. It shows that higher values of IMT_cMax, non-HDL-c, and blood pressure are positively associated with an increased likelihood of CHD, whereas lower levels of protective factors like HDL-c and eGFR are associated with a higher risk of CHD. Other important variables, such as age, glucose levels, and triglycerides, also contribute significantly, with older age and impaired glucose regulation being linked to a higher CHD risk. Additionally, markers of inflammation like white blood cell count and other factors such as calcium levels, sex, body fat, and BMI play roles in determining CHD risk.</p><p><xref ref-type="fig" rid="figure5">Figure 5</xref> consists of several SHAP dependency plots that illustrate the relationship between each key variable and CHD risk in more detail. For IMT_cMax, there is a positive association with CHD risk, showing that as the thickness of the carotid artery increases, so does the risk of CHD. The eGFR plot shows that lower eGFR values are associated with a higher risk of CHD, while higher eGFR values are associated with a lower risk, indicating the crucial role of kidney function in cardiovascular health. Non-HDL-c shows a generally positive association with CHD, where higher levels correspond to a higher risk. For SBP, the risk of CHD increases sharply with rising SBP values. HDL-c is inversely related to CHD risk, indicating its protective role, while higher triglycerides (TG) are linked to increased risk, especially at moderate levels. Age and glucose levels show a direct relationship with CHD risk, whereas older age and higher glucose levels are associated with increased risk. The SHAP value for diastolic blood pressure (DBP) also shows a positive relationship, suggesting that higher DBP levels contribute to the increased risk of CHD.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Contribution of variables to CHD incidence prediction using SHAP values (Japanese participants, aged 30&#x2010;84 years, Suita Study). (A) The bar plot shows each variable&#x2019;s contribution to CHD, with bar length indicating the contribution extent. (B) The heat plot of SHAP values illustrates the relationships between variables and CHD. Purple signifies a positive relationship and yellow a negative one. Each point represents a participant, with the x-axis showing SHAP values and the y-axis indicating variable importance. bf: body fat; Ca: calcium; CHD: coronary heart disease; DBP: diastolic blood pressure; eGFR: estimated glomerular filtration rate; Frct: Fructosamine; Hb: hemoglobin; htn: hypertension; IMT_cMax: maximum intima-media thickness of common carotid arteries; HDL-c: high-density lipoprotein cholesterol; SBP: systolic blood pressure; smk_sts: smoking status; TG: triglycerides; WBC: white blood cell; wt20: weight at age of 20 years.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e68066_fig04.png"/></fig><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>SHAP dependency plots showing the relationship between key variables and CHD risk (Japanese participants, aged 30&#x2010;84 years, Suita Study). CHD: coronary heart disease; DBP: diastolic blood pressure; eGFR: estimated glomerular filtration rate; IMT_cMax: maximum intima-media thickness of common carotid arteries; HDL-c: high-density lipoprotein cholesterol; SBP: systolic blood pressure; SHAP: Shapley Additive Explanation; TG: triglycerides.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e68066_fig05.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study provides a comprehensive evaluation of the role of ML in predicting CHD. Among a cohort of 7260 participants, 305 were diagnosed with CHD. The analysis not only validated several well-established cardiovascular and metabolic risk factors but also identified novel predictors of CHD. Importantly, the findings underscore the use of ML models and the SHAP method in elucidating key contributors to CHD risk, with RF demonstrating superior performance, excelling in both discrimination and calibration for CHD prediction.</p></sec><sec id="s4-2"><title>Comparison With Prior Work</title><sec id="s4-2-1"><title>Arterial Health</title><p>Carotid IMT emerged as the strongest predictor of CHD in our study. IMT_cMax, which measures the thickness of the CCAs, is a well-established indicator of atherosclerosis and future cardiovascular events, including MI and stroke [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. Multiple studies support this, showing that even a small increase in IMT correlates with a significantly elevated risk of acute MI and stroke. For instance, in the Atherosclerosis Risk in Communities study, a 0.1 mm increase in IMT corresponded to a 50% increase in CHD risk [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. Therefore, measuring IMT through noninvasive techniques like ultrasound has important clinical applications in evaluating subclinical atherosclerosis and assessing CHD risk. Given that many coronary artery assessments are invasive, the use of ultrasound to measure carotid artery IMT offers a valuable alternative for early detection and risk stratification.</p></sec><sec id="s4-2-2"><title>Blood Pressure, Lipid Profiles, and Glucose</title><p>SBP and hypertension were among the most critical predictors of CHD, aligning with the well-established association between elevated blood pressure and cardiovascular risk [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. Both SBP and diastolic blood pressure were prominent, emphasizing the need for effective blood pressure management in reducing CHD risk [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>].</p><p>Furthermore, non-HDL-c and triglycerides were strongly associated with CHD, confirming the importance of lipid management in cardiovascular health [<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref39">39</xref>]. Glucose levels were also significant, suggesting that monitoring glucose metabolism is essential in cardiovascular risk management [<xref ref-type="bibr" rid="ref40">40</xref>-<xref ref-type="bibr" rid="ref42">42</xref>].</p></sec><sec id="s4-2-3"><title>Renal Function and Metabolic Factors</title><p>The role of eGFR as a key predictor highlights the connection between renal function and CHD [<xref ref-type="bibr" rid="ref43">43</xref>]. Impaired kidney function has been increasingly recognized as a cardiovascular risk factor, particularly due to its association with hypertension and dyslipidemia [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. The results support incorporating kidney function markers in future CHD risk assessments. In addition, metabolic markers and body fat percentage were identified as important predictors, signaling the impact of obesity-related factors on cardiovascular health. These findings suggest that obesity-related measures beyond BMI should be considered in CHD risk assessments.</p></sec><sec id="s4-2-4"><title>Sex</title><p>The sex-specific analysis highlighted the protective effect of being female, consistent with existing research showing that premenopausal women are generally at a lower risk of developing CHD due to protective hormonal factors [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>]. These findings suggest the need for sex-specific strategies in managing CHD risk.</p></sec></sec><sec id="s4-3"><title>Potential Risk Factors</title><p>One of the strengths of this study is its ability to uncover novel predictors, such as white blood cell count, which serves as a marker of systemic inflammation. Inflammation is increasingly recognized as a key player in the development of atherosclerosis and cardiovascular events. Additionally, lower calcium levels were associated with a higher risk of CHD, highlighting the importance of mineral balance in cardiovascular health. Furthermore, body fat percentage and BMI were highlighted as significant predictors of CHD, further emphasizing the need for a comprehensive evaluation of obesity-related metrics in cardiovascular risk assessments. These novel insights could lead to more personalized prevention strategies for individuals who may not exhibit classic cardiovascular risk profiles.</p></sec><sec id="s4-4"><title>Limitations</title><p>Despite the promising results, several limitations of the study need to be considered. First, the quality of the data, particularly with respect to missing values, poses a challenge. Although feature selection techniques, such as least absolute shrinkage and selection operator regression and SHAP analysis, were used to mitigate this, the impact of missing data remains a potential limitation. Second, the generalizability of the findings is limited because the study relies on a specific population. The results may not fully apply to populations with different demographic and clinical characteristics. To address this, future research should focus on evaluating these ML models in real-world clinical settings, where variability in clinical practice, missing data, and other factors may affect model performance.</p></sec><sec id="s4-5"><title>Conclusions</title><p>This study demonstrates the potential of ML in predicting CHD. The SHAP method enhances the interpretability of the prediction model, aiding health care professionals in clinical practice by supporting effective risk management and intervention strategies.</p></sec></sec></body><back><ack><p>This article was supported by the Japan Science and Technology Agency COI-NEXT (grant JPMJPF2018) to MA.</p></ack><notes><sec><title>Data Availability</title><p>The dataset examined in this study is not available to the public due to the inclusion of individuals&#x2019; personal information but is available from the corresponding author at a reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>TV conceptualized and designed the study, conducted the data analysis and interpretation, and drafted the manuscript. Y Kokubo contributed to the study concept and design, curated the data, provided resources, and supervised the project. MA assisted in study design, data curation, and supervision. MI and MY contributed to data analysis and interpretation. RD, AMM, JTT, AA, MT, YMN, and TI provided critical feedback and revised the manuscript. All authors reviewed and approved the final version of the manuscript.</p></fn><fn fn-type="conflict"><p>YMN is employed by the Department of Digital Health and Epidemiology, Graduate School of Medicine and Public Health, Kyoto University, an Industry-Academia Collaboration Course supported by Eisai Co., Ltd. and Kyowa Kirin Co., Ltd. Additionally, YMN reports a study grant from Bayer outside the submitted work.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUC</term><def><p>area under the curve</p></def></def-item><def-item><term id="abb2">CCA</term><def><p>common carotid artery</p></def></def-item><def-item><term id="abb3">CHD</term><def><p>coronary heart disease</p></def></def-item><def-item><term id="abb4">DCA</term><def><p>decision curve analysis</p></def></def-item><def-item><term id="abb5">eGFR</term><def><p>estimated glomerular filtration rate</p></def></def-item><def-item><term id="abb6">HDL-c</term><def><p>high-density lipoprotein cholesterol</p></def></def-item><def-item><term id="abb7">IMT</term><def><p>intima-media thickness</p></def></def-item><def-item><term id="abb8">IMT_cMax</term><def><p>maximum intima-media thickness of common carotid arteries</p></def></def-item><def-item><term id="abb9">LightGBM</term><def><p>Light Gradient-Boosting Machine</p></def></def-item><def-item><term id="abb10">LR</term><def><p>logistic regression</p></def></def-item><def-item><term id="abb11">MI</term><def><p>myocardial infarction</p></def></def-item><def-item><term id="abb12">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb13">OE</term><def><p>observed-to-expected</p></def></def-item><def-item><term id="abb14">RF</term><def><p>random forest</p></def></def-item><def-item><term id="abb15">SBP</term><def><p>systolic blood pressure</p></def></def-item><def-item><term id="abb16">SHAP</term><def><p>Shapley Additive Explanation</p></def></def-item><def-item><term id="abb17">SVM</term><def><p>support vector machine</p></def></def-item><def-item><term id="abb18">TRIPOD+AI</term><def><p>Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis or Diagnosis and Artificial Intelligence</p></def></def-item><def-item><term id="abb19">XGBoost</term><def><p>Extreme Gradient Boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vos</surname><given-names>T</given-names> </name><name name-style="western"><surname>Lim</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Abbafati</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Global burden of 369 diseases and injuries in 204 countries and territories, 1990&#x2013;2019: a systematic analysis for the Global Burden of Disease Study 2019</article-title><source>Lancet</source><year>2020</year><month>10</month><volume>396</volume><issue>10258</issue><fpage>1204</fpage><lpage>1222</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(20)30925-9</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roth</surname><given-names>GA</given-names> </name><name name-style="western"><surname>Mensah</surname><given-names>GA</given-names> </name><name name-style="western"><surname>Johnson</surname><given-names>CO</given-names> </name><etal/></person-group><article-title>Global burden of cardiovascular diseases and risk factors, 1990&#x2013;2019</article-title><source>J Am Coll Cardiol</source><year>2020</year><month>12</month><volume>76</volume><issue>25</issue><fpage>2982</fpage><lpage>3021</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2020.11.010</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lim</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Burrell</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Brook</surname><given-names>R</given-names> </name><name name-style="western"><surname>Nandurkar</surname><given-names>HH</given-names> </name><name name-style="western"><surname>Donnan</surname><given-names>G</given-names> </name><name name-style="western"><surname>Ho</surname><given-names>P</given-names> </name></person-group><article-title>The need for individualized risk assessment in cardiovascular disease</article-title><source>J Pers Med</source><year>2022</year><month>07</month><day>14</day><volume>12</volume><issue>7</issue><fpage>1140</fpage><pub-id pub-id-type="doi">10.3390/jpm12071140</pub-id><pub-id pub-id-type="medline">35887637</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Matheson</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Kato</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Baba</surname><given-names>S</given-names> </name><name name-style="western"><surname>Cox</surname><given-names>C</given-names> </name><name name-style="western"><surname>Lima</surname><given-names>JAC</given-names> </name><name name-style="western"><surname>Ambale-Venkatesh</surname><given-names>B</given-names> </name></person-group><article-title>Cardiovascular risk prediction using machine learning in a large Japanese cohort</article-title><source>Circ Rep</source><year>2022</year><month>12</month><day>9</day><volume>4</volume><issue>12</issue><fpage>595</fpage><lpage>603</lpage><pub-id pub-id-type="doi">10.1253/circrep.CR-22-0101</pub-id><pub-id pub-id-type="medline">36530840</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weng</surname><given-names>SF</given-names> </name><name name-style="western"><surname>Reps</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kai</surname><given-names>J</given-names> </name><name name-style="western"><surname>Garibaldi</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Qureshi</surname><given-names>N</given-names> </name></person-group><article-title>Can machine-learning improve cardiovascular risk prediction using routine clinical data?</article-title><source>PLoS ONE</source><year>2017</year><volume>12</volume><issue>4</issue><fpage>e0174944</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0174944</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jiang</surname><given-names>T</given-names> </name><name name-style="western"><surname>Gradus</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Rosellini</surname><given-names>AJ</given-names> </name></person-group><article-title>Supervised machine learning: a brief primer</article-title><source>Behav Ther</source><year>2020</year><month>09</month><volume>51</volume><issue>5</issue><fpage>675</fpage><lpage>687</lpage><pub-id pub-id-type="doi">10.1016/j.beth.2020.05.002</pub-id><pub-id pub-id-type="medline">32800297</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Linardatos</surname><given-names>P</given-names> </name><name name-style="western"><surname>Papastefanopoulos</surname><given-names>V</given-names> </name><name name-style="western"><surname>Kotsiantis</surname><given-names>S</given-names> </name></person-group><article-title>Explainable AI: a review of machine learning interpretability methods</article-title><source>Entropy (Basel)</source><year>2020</year><month>12</month><day>25</day><volume>23</volume><issue>1</issue><fpage>18</fpage><pub-id pub-id-type="doi">10.3390/e23010018</pub-id><pub-id pub-id-type="medline">33375658</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Kokubo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Inoue</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Machine learning approaches for stroke risk prediction: findings from the Suita Study</article-title><source>J Cardiovasc Dev Dis</source><year>2024</year><month>07</month><day>1</day><volume>11</volume><issue>7</issue><fpage>207</fpage><pub-id pub-id-type="doi">10.3390/jcdd11070207</pub-id><pub-id pub-id-type="medline">39057627</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Martin-Morales</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yamamoto</surname><given-names>M</given-names> </name><name name-style="western"><surname>Inoue</surname><given-names>M</given-names> </name><name name-style="western"><surname>Vu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Dawadi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Araki</surname><given-names>M</given-names> </name></person-group><article-title>Predicting cardiovascular disease mortality: leveraging machine learning for comprehensive assessment of health and nutrition variables</article-title><source>Nutrients</source><year>2023</year><month>09</month><day>11</day><volume>15</volume><issue>18</issue><fpage>3937</fpage><pub-id pub-id-type="doi">10.3390/nu15183937</pub-id><pub-id pub-id-type="medline">37764721</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thanh</surname><given-names>NT</given-names> </name><name name-style="western"><surname>Luan</surname><given-names>VT</given-names> </name><name name-style="western"><surname>Viet</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Tung</surname><given-names>TH</given-names> </name><name name-style="western"><surname>Thien</surname><given-names>V</given-names> </name></person-group><article-title>A machine learning-based risk score for prediction of mechanical ventilation in children with dengue shock syndrome: a retrospective cohort study</article-title><source>PLoS ONE</source><year>2024</year><volume>19</volume><issue>12</issue><fpage>e0315281</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0315281</pub-id><pub-id pub-id-type="medline">39642139</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kumar</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Koul</surname><given-names>A</given-names> </name><name name-style="western"><surname>Singla</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ijaz</surname><given-names>MF</given-names> </name></person-group><article-title>Artificial intelligence in disease diagnosis: a systematic literature review, synthesizing framework and future research agenda</article-title><source>J Ambient Intell Humaniz Comput</source><year>2023</year><volume>14</volume><issue>7</issue><fpage>8459</fpage><lpage>8486</lpage><pub-id pub-id-type="doi">10.1007/s12652-021-03612-z</pub-id><pub-id pub-id-type="medline">35039756</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Forrest</surname><given-names>IS</given-names> </name><name name-style="western"><surname>Petrazzini</surname><given-names>BO</given-names> </name><name name-style="western"><surname>Duffy</surname><given-names>&#x00C1;</given-names> </name><etal/></person-group><article-title>Machine learning-based marker for coronary artery disease: derivation and validation in two longitudinal cohorts</article-title><source>The Lancet</source><year>2023</year><month>01</month><volume>401</volume><issue>10372</issue><fpage>215</fpage><lpage>225</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(22)02079-7</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bani Hani</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Ahmad</surname><given-names>MM</given-names> </name></person-group><article-title>Machine-learning algorithms for ischemic heart disease prediction: a systematic review</article-title><source>Curr Cardiol Rev</source><year>2023</year><volume>19</volume><issue>1</issue><fpage>e090622205797</fpage><pub-id pub-id-type="doi">10.2174/1573403X18666220609123053</pub-id><pub-id pub-id-type="medline">35692135</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alizadehsani</surname><given-names>R</given-names> </name><name name-style="western"><surname>Abdar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Roshanzamir</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Machine learning-based coronary artery disease diagnosis: a comprehensive review</article-title><source>Comput Biol Med</source><year>2019</year><month>08</month><volume>111</volume><fpage>103346</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2019.103346</pub-id><pub-id pub-id-type="medline">31288140</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Collins</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name><name name-style="western"><surname>Dhiman</surname><given-names>P</given-names> </name><etal/></person-group><article-title>TRIPOD+AI statement: updated guidance for reporting clinical prediction models that use regression or machine learning methods</article-title><source>BMJ</source><year>2024</year><month>04</month><day>16</day><volume>385</volume><fpage>e078378</fpage><pub-id pub-id-type="doi">10.1136/bmj-2023-078378</pub-id><pub-id pub-id-type="medline">38626948</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tunstall-Pedoe</surname><given-names>H</given-names> </name><name name-style="western"><surname>Kuulasmaa</surname><given-names>K</given-names> </name><name name-style="western"><surname>Amouyel</surname><given-names>P</given-names> </name><name name-style="western"><surname>Arveiler</surname><given-names>D</given-names> </name><name name-style="western"><surname>Rajakangas</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Pajak</surname><given-names>A</given-names> </name></person-group><article-title>Myocardial infarction and coronary deaths in the World Health Organization MONICA Project. Registration procedures, event rates, and case-fatality rates in 38 populations from 21 countries in four continents</article-title><source>Circulation</source><year>1994</year><month>07</month><volume>90</volume><issue>1</issue><fpage>583</fpage><lpage>612</lpage><pub-id pub-id-type="doi">10.1161/01.cir.90.1.583</pub-id><pub-id pub-id-type="medline">8026046</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kokubo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Kamide</surname><given-names>K</given-names> </name><name name-style="western"><surname>Okamura</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Impact of high-normal blood pressure on the risk of cardiovascular disease in a Japanese urban cohort: the Suita Study</article-title><source>Hypertension</source><year>2008</year><month>10</month><volume>52</volume><issue>4</issue><fpage>652</fpage><lpage>659</lpage><pub-id pub-id-type="doi">10.1161/HYPERTENSIONAHA.108.118273</pub-id><pub-id pub-id-type="medline">18725580</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kokubo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Watanabe</surname><given-names>M</given-names> </name><name name-style="western"><surname>Higashiyama</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Interaction of blood pressure and body mass index with risk of incident atrial fibrillation in a Japanese urban cohort: the Suita Study</article-title><source>Am J Hypertens</source><year>2015</year><month>11</month><volume>28</volume><issue>11</issue><fpage>1355</fpage><lpage>1361</lpage><pub-id pub-id-type="doi">10.1093/ajh/hpv038</pub-id><pub-id pub-id-type="medline">25845964</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Imai</surname><given-names>E</given-names> </name><name name-style="western"><surname>Horio</surname><given-names>M</given-names> </name><name name-style="western"><surname>Nitta</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Estimation of glomerular filtration rate by the MDRD study equation modified for Japanese patients with chronic kidney disease</article-title><source>Clin Exp Nephrol</source><year>2007</year><month>03</month><volume>11</volume><issue>1</issue><fpage>41</fpage><lpage>50</lpage><pub-id pub-id-type="doi">10.1007/s10157-006-0453-4</pub-id><pub-id pub-id-type="medline">17384997</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kokubo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Watanabe</surname><given-names>M</given-names> </name><name name-style="western"><surname>Higashiyama</surname><given-names>A</given-names> </name><name name-style="western"><surname>Nakao</surname><given-names>YM</given-names> </name><name name-style="western"><surname>Nakamura</surname><given-names>F</given-names> </name><name name-style="western"><surname>Miyamoto</surname><given-names>Y</given-names> </name></person-group><article-title>Impact of intima-media thickness progression in the common carotid arteries on the risk of incident cardiovascular disease in the Suita Study</article-title><source>J Am Heart Assoc</source><year>2018</year><month>06</month><day>1</day><volume>7</volume><issue>11</issue><fpage>e007720</fpage><pub-id pub-id-type="doi">10.1161/JAHA.117.007720</pub-id><pub-id pub-id-type="medline">29858361</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Christodoulou</surname><given-names>E</given-names> </name><name name-style="western"><surname>van Smeden</surname><given-names>M</given-names> </name><name name-style="western"><surname>Edlinger</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Adaptive sample size determination for the development of clinical prediction models</article-title><source>Diagn Progn Res</source><year>2021</year><month>03</month><day>22</day><volume>5</volume><issue>1</issue><fpage>6</fpage><pub-id pub-id-type="doi">10.1186/s41512-021-00096-5</pub-id><pub-id pub-id-type="medline">33745449</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Riley</surname><given-names>RD</given-names> </name><name name-style="western"><surname>Ensor</surname><given-names>J</given-names> </name><name name-style="western"><surname>Snell</surname><given-names>KIE</given-names> </name><etal/></person-group><article-title>Calculating the sample size required for developing a clinical prediction model</article-title><source>BMJ</source><year>2020</year><month>03</month><day>18</day><volume>368</volume><fpage>m441</fpage><pub-id pub-id-type="doi">10.1136/bmj.m441</pub-id><pub-id pub-id-type="medline">32188600</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bewick</surname><given-names>V</given-names> </name><name name-style="western"><surname>Cheek</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ball</surname><given-names>J</given-names> </name></person-group><article-title>Statistics review 14: logistic regression</article-title><source>Crit Care</source><year>2005</year><month>02</month><volume>9</volume><issue>1</issue><fpage>112</fpage><lpage>118</lpage><pub-id pub-id-type="doi">10.1186/cc3045</pub-id><pub-id pub-id-type="medline">15693993</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Su</surname><given-names>X</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>Prediction for cardiovascular diseases based on laboratory data: an analysis of random forest model</article-title><source>J Clin Lab Anal</source><year>2020</year><month>09</month><volume>34</volume><issue>9</issue><fpage>e23421</fpage><pub-id pub-id-type="doi">10.1002/jcla.23421</pub-id><pub-id pub-id-type="medline">32725839</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Unnikrishnan</surname><given-names>P</given-names> </name><name name-style="western"><surname>Kumar</surname><given-names>DK</given-names> </name><name name-style="western"><surname>Poosapadi Arjunan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kumar</surname><given-names>H</given-names> </name><name name-style="western"><surname>Mitchell</surname><given-names>P</given-names> </name><name name-style="western"><surname>Kawasaki</surname><given-names>R</given-names> </name></person-group><article-title>Development of health parameter model for risk prediction of CVD using SVM</article-title><source>Comput Math Methods Med</source><year>2016</year><volume>2016</volume><fpage>3016245</fpage><pub-id pub-id-type="doi">10.1155/2016/3016245</pub-id><pub-id pub-id-type="medline">27594895</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Son</surname><given-names>YJ</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>HG</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>EH</given-names> </name><name name-style="western"><surname>Choi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SK</given-names> </name></person-group><article-title>Application of support vector machine for prediction of medication adherence in heart failure patients</article-title><source>Healthc Inform Res</source><year>2010</year><month>12</month><volume>16</volume><issue>4</issue><fpage>253</fpage><lpage>259</lpage><pub-id pub-id-type="doi">10.4258/hir.2010.16.4.253</pub-id><pub-id pub-id-type="medline">21818444</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Dawadi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Yamamoto</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Prediction of depressive disorder using machine learning approaches: findings from the NHANES</article-title><source>BMC Med Inform Decis Mak</source><year>2025</year><month>02</month><day>17</day><volume>25</volume><issue>1</issue><fpage>83</fpage><pub-id pub-id-type="doi">10.1186/s12911-025-02903-1</pub-id><pub-id pub-id-type="medline">39962516</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vickers</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>van Calster</surname><given-names>B</given-names> </name><name name-style="western"><surname>Steyerberg</surname><given-names>EW</given-names> </name></person-group><article-title>A simple, step-by-step guide to interpreting decision curve analysis</article-title><source>Diagn Progn Res</source><year>2019</year><volume>3</volume><fpage>18</fpage><pub-id pub-id-type="doi">10.1186/s41512-019-0064-7</pub-id><pub-id pub-id-type="medline">31592444</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Rousson</surname><given-names>V</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>WC</given-names> </name><etal/></person-group><article-title>Decision curve analysis: a technical note</article-title><source>Ann Transl Med</source><year>2018</year><month>08</month><volume>6</volume><issue>15</issue><fpage>308</fpage><pub-id pub-id-type="doi">10.21037/atm.2018.07.02</pub-id><pub-id pub-id-type="medline">30211196</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bloch</surname><given-names>L</given-names> </name><name name-style="western"><surname>Friedrich</surname><given-names>CM</given-names> </name><collab>Alzheimer&#x2019;s Disease Neuroimaging Initiative</collab></person-group><article-title>Data analysis with Shapley values for automatic subject selection in Alzheimer&#x2019;s disease data sets using interpretable machine learning</article-title><source>Alzheimers Res Ther</source><year>2021</year><month>09</month><day>15</day><volume>13</volume><issue>1</issue><fpage>155</fpage><pub-id pub-id-type="doi">10.1186/s13195-021-00879-4</pub-id><pub-id pub-id-type="medline">34526114</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kawai</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ohishi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Takeya</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Carotid plaque score and intima media thickness as predictors of stroke and mortality in hypertensive patients</article-title><source>Hypertens Res</source><year>2013</year><month>10</month><volume>36</volume><issue>10</issue><fpage>902</fpage><lpage>909</lpage><pub-id pub-id-type="doi">10.1038/hr.2013.61</pub-id><pub-id pub-id-type="medline">23823172</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nambi</surname><given-names>V</given-names> </name><name name-style="western"><surname>Chambless</surname><given-names>L</given-names> </name><name name-style="western"><surname>Folsom</surname><given-names>AR</given-names> </name><etal/></person-group><article-title>Carotid intima-media thickness and presence or absence of plaque improves prediction of coronary heart disease risk: the ARIC (Atherosclerosis Risk In Communities) study</article-title><source>J Am Coll Cardiol</source><year>2010</year><month>04</month><day>13</day><volume>55</volume><issue>15</issue><fpage>1600</fpage><lpage>1607</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2009.11.075</pub-id><pub-id pub-id-type="medline">20378078</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ji</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>N</given-names> </name><name name-style="western"><surname>Shi</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Level of systolic blood pressure within the normal range and risk of cardiovascular events in the absence of risk factors in Chinese</article-title><source>J Hum Hypertens</source><year>2022</year><month>10</month><volume>36</volume><issue>10</issue><fpage>933</fpage><lpage>939</lpage><pub-id pub-id-type="doi">10.1038/s41371-021-00598-1</pub-id><pub-id pub-id-type="medline">34480099</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Whelton</surname><given-names>SP</given-names> </name><name name-style="western"><surname>McEvoy</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Shaw</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Association of normal systolic blood pressure level with cardiovascular disease in the absence of risk factors</article-title><source>JAMA Cardiol</source><year>2020</year><month>09</month><day>1</day><volume>5</volume><issue>9</issue><fpage>1011</fpage><lpage>1018</lpage><pub-id pub-id-type="doi">10.1001/jamacardio.2020.1731</pub-id><pub-id pub-id-type="medline">32936272</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Somers</surname><given-names>VK</given-names> </name><name name-style="western"><surname>Gao</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Evaluation of optimal diastolic blood pressure range among adults with treated systolic blood pressure less than 130 mm Hg</article-title><source>JAMA Netw Open</source><year>2021</year><month>02</month><day>1</day><volume>4</volume><issue>2</issue><fpage>e2037554</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2020.37554</pub-id><pub-id pub-id-type="medline">33595663</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guo</surname><given-names>LL</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>YQ</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>QZ</given-names> </name><etal/></person-group><article-title>Non-HDL-C Is more stable than LDL-C in assessing the percent attainment of non-fasting lipid for coronary heart disease patients</article-title><source>Front Cardiovasc Med</source><year>2021</year><volume>8</volume><fpage>649181</fpage><pub-id pub-id-type="doi">10.3389/fcvm.2021.649181</pub-id><pub-id pub-id-type="medline">33869310</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saito</surname><given-names>I</given-names> </name><name name-style="western"><surname>Yamagishi</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kokubo</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Non-high-density lipoprotein cholesterol and risk of stroke subtypes and coronary heart disease: The Japan Public Health Center-Based Prospective (JPHC) Study</article-title><source>JAT</source><year>2020</year><volume>27</volume><issue>4</issue><fpage>363</fpage><lpage>374</lpage><pub-id pub-id-type="doi">10.5551/jat.50385</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dong</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Zhuang</surname><given-names>Q</given-names> </name><etal/></person-group><article-title>The associations of lipid profiles with cardiovascular diseases and death in a 10-year prospective cohort study</article-title><source>Front Cardiovasc Med</source><year>2021</year><volume>8</volume><fpage>745539</fpage><pub-id pub-id-type="doi">10.3389/fcvm.2021.745539</pub-id><pub-id pub-id-type="medline">34901209</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhao</surname><given-names>X</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Qin</surname><given-names>L</given-names> </name></person-group><article-title>Lipid profile and prognosis in patients with coronary heart disease: a meta-analysis of prospective cohort studies</article-title><source>BMC Cardiovasc Disord</source><year>2021</year><month>02</month><day>3</day><volume>21</volume><issue>1</issue><fpage>69</fpage><pub-id pub-id-type="doi">10.1186/s12872-020-01835-0</pub-id><pub-id pub-id-type="medline">33535982</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Poznyak</surname><given-names>AV</given-names> </name><name name-style="western"><surname>Litvinova</surname><given-names>L</given-names> </name><name name-style="western"><surname>Poggio</surname><given-names>P</given-names> </name><name name-style="western"><surname>Sukhorukov</surname><given-names>VN</given-names> </name><name name-style="western"><surname>Orekhov</surname><given-names>AN</given-names> </name></person-group><article-title>Effect of glucose levels on cardiovascular risk</article-title><source>Cells</source><year>2022</year><month>09</month><day>28</day><volume>11</volume><issue>19</issue><fpage>3034</fpage><pub-id pub-id-type="doi">10.3390/cells11193034</pub-id><pub-id pub-id-type="medline">36230996</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Riise</surname><given-names>HKR</given-names> </name><name name-style="western"><surname>Igland</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sulo</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Casual blood glucose and subsequent cardiovascular disease and all-cause mortality among 159&#x2009;731 participants in Cohort of Norway (CONOR)</article-title><source>BMJ Open Diabetes Res Care</source><year>2021</year><month>02</month><volume>9</volume><issue>1</issue><fpage>e001928</fpage><pub-id pub-id-type="doi">10.1136/bmjdrc-2020-001928</pub-id><pub-id pub-id-type="medline">33622686</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Selvin</surname><given-names>E</given-names> </name><name name-style="western"><surname>Coresh</surname><given-names>J</given-names> </name><name name-style="western"><surname>Golden</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Brancati</surname><given-names>FL</given-names> </name><name name-style="western"><surname>Folsom</surname><given-names>AR</given-names> </name><name name-style="western"><surname>Steffes</surname><given-names>MW</given-names> </name></person-group><article-title>Glycemic control and coronary heart disease risk in persons with and without diabetes</article-title><source>Arch Intern Med</source><year>2005</year><month>09</month><day>12</day><volume>165</volume><issue>16</issue><fpage>1910</fpage><pub-id pub-id-type="doi">10.1001/archinte.165.16.1910</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Charoen</surname><given-names>P</given-names> </name><name name-style="western"><surname>Nitsch</surname><given-names>D</given-names> </name><name name-style="western"><surname>Engmann</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Mendelian randomisation study of the influence of eGFR on coronary heart disease</article-title><source>Sci Rep</source><year>2016</year><month>06</month><day>24</day><volume>6</volume><fpage>28514</fpage><pub-id pub-id-type="doi">10.1038/srep28514</pub-id><pub-id pub-id-type="medline">27338949</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jankowski</surname><given-names>J</given-names> </name><name name-style="western"><surname>Floege</surname><given-names>J</given-names> </name><name name-style="western"><surname>Fliser</surname><given-names>D</given-names> </name><name name-style="western"><surname>B&#x00F6;hm</surname><given-names>M</given-names> </name><name name-style="western"><surname>Marx</surname><given-names>N</given-names> </name></person-group><article-title>Cardiovascular disease in chronic kidney disease</article-title><source>Circulation</source><year>2021</year><month>03</month><day>16</day><volume>143</volume><issue>11</issue><fpage>1157</fpage><lpage>1172</lpage><pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.120.050686</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brugts</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Knetsch</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Mattace-Raso</surname><given-names>FUS</given-names> </name><name name-style="western"><surname>Hofman</surname><given-names>A</given-names> </name><name name-style="western"><surname>Witteman</surname><given-names>JCM</given-names> </name></person-group><article-title>Renal function and risk of myocardial infarction in an elderly population: the Rotterdam Study</article-title><source>Arch Intern Med</source><year>2005</year><volume>165</volume><issue>22</issue><fpage>2659</fpage><lpage>2665</lpage><pub-id pub-id-type="doi">10.1001/archinte.165.22.2659</pub-id><pub-id pub-id-type="medline">16344425</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Maas</surname><given-names>A</given-names> </name><name name-style="western"><surname>Appelman</surname><given-names>YEA</given-names> </name></person-group><article-title>Gender differences in coronary heart disease</article-title><source>Neth Heart J</source><year>2010</year><month>12</month><volume>18</volume><issue>12</issue><fpage>598</fpage><lpage>602</lpage><pub-id pub-id-type="doi">10.1007/s12471-010-0841-y</pub-id><pub-id pub-id-type="medline">21301622</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shah</surname><given-names>T</given-names> </name><name name-style="western"><surname>Palaskas</surname><given-names>N</given-names> </name><name name-style="western"><surname>Ahmed</surname><given-names>A</given-names> </name></person-group><article-title>An update on gender disparities in coronary heart disease care</article-title><source>Curr Atheroscler Rep</source><year>2016</year><month>05</month><volume>18</volume><issue>5</issue><fpage>28</fpage><pub-id pub-id-type="doi">10.1007/s11883-016-0574-5</pub-id><pub-id pub-id-type="medline">27029220</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Percentage of missing data across all variables prior to imputation (Japanese participants, aged 30-84 years, Suita Study).</p><media xlink:href="cardio_v9i1e68066_app1.png" xlink:title="PNG File, 93 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Correlation Coefficients for variables used in CHD Incidence prediction (Japanese participants, aged 30-84 years, Suita Study).</p><media xlink:href="cardio_v9i1e68066_app2.png" xlink:title="PNG File, 260 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>List of variables included in the CHD Incidence prediction model (Japanese participants, aged 30-84 years, Suita Study).</p><media xlink:href="cardio_v9i1e68066_app3.docx" xlink:title="DOCX File, 19 KB"/></supplementary-material><supplementary-material id="app4"><label>Checklist 1</label><p>TRIPOD + AI (Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis or Diagnosis and Artificial Intelligence) checklist</p><media xlink:href="cardio_v9i1e68066_app4.pdf" xlink:title="PDF File, 1663 KB"/></supplementary-material></app-group></back></article>