<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JCARD</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Cardio</journal-id>
      <journal-title>JMIR Cardio</journal-title>
      <issn pub-type="epub">2561-1011</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i1e47736</article-id>
      <article-id pub-id-type="pmid">37494080</article-id>
      <article-id pub-id-type="doi">10.2196/47736</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Comparing Explainable Machine Learning Approaches With Traditional Statistical Methods for Evaluating Stroke Risk Models: Retrospective Cohort Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhang</surname>
            <given-names>Yonglai</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Bao</surname>
            <given-names>Bokan</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Lolak</surname>
            <given-names>Sermkiat</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6379-523X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Attia</surname>
            <given-names>John</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9800-1308</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>McKay</surname>
            <given-names>Gareth J</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8197-6280</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Thakkinstian</surname>
            <given-names>Ammarin</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Clinical Epidemiology and Biostatistics, Faculty of Medicine</institution>
            <institution>Ramathibodi Hospital</institution>
            <institution>Mahidol University</institution>
            <addr-line>4th Floor, Sukho Place Building</addr-line>
            <addr-line>218/11 Sukhothai Road, Suan Chitlada, Dusit</addr-line>
            <addr-line>Bangkok, 10300</addr-line>
            <country>Thailand</country>
            <phone>66 2 201 1269</phone>
            <email>ammarin.tha@mahidol.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9991-386X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Clinical Epidemiology and Biostatistics, Faculty of Medicine</institution>
        <institution>Ramathibodi Hospital</institution>
        <institution>Mahidol University</institution>
        <addr-line>Bangkok</addr-line>
        <country>Thailand</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Centre for Clinical Epidemiology and Biostatistics, School of Medicine and Public Health</institution>
        <institution>Hunter Medical Research Institute</institution>
        <institution>University of Newcastle</institution>
        <addr-line>New South Wales</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Centre for Public Health, School of Medicine</institution>
        <institution>Dentistry and Biomedical Sciences</institution>
        <institution>Queen's University Belfast</institution>
        <addr-line>Belfast</addr-line>
        <country>United Kingdom</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Ammarin Thakkinstian <email>ammarin.tha@mahidol.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>26</day>
        <month>7</month>
        <year>2023</year>
      </pub-date>
      <volume>7</volume>
      <elocation-id>e47736</elocation-id>
      <history>
        <date date-type="received">
          <day>30</day>
          <month>3</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>11</day>
          <month>5</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>22</day>
          <month>5</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>15</day>
          <month>6</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Sermkiat Lolak, John Attia, Gareth J McKay, Ammarin Thakkinstian. Originally published in JMIR Cardio (https://cardio.jmir.org), 26.07.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Cardio, is properly cited. The complete bibliographic information, a link to the original publication on https://cardio.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://cardio.jmir.org/2023/1/e47736" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Stroke has multiple modifiable and nonmodifiable risk factors and represents a leading cause of death globally. Understanding the complex interplay of stroke risk factors is thus not only a scientific necessity but a critical step toward improving global health outcomes.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aim to assess the performance of explainable machine learning models in predicting stroke risk factors using real-world cohort data by comparing explainable machine learning models with conventional statistical methods.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>This retrospective cohort included high-risk patients from Ramathibodi Hospital in Thailand between January 2010 and December 2020. We compared the performance and explainability of logistic regression (LR), Cox proportional hazard, Bayesian network (BN), tree-augmented Naïve Bayes (TAN), extreme gradient boosting (XGBoost), and explainable boosting machine (EBM) models. We used multiple imputation by chained equations for missing data and discretized continuous variables as needed. Models were evaluated using C-statistics and <italic>F</italic><sub>1</sub>-scores.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Out of 275,247 high-risk patients, 9659 (3.5%) experienced a stroke. XGBoost demonstrated the highest performance with a C-statistic of 0.89 and an <italic>F</italic><sub>1</sub>-score of 0.80 followed by EBM and TAN with C-statistics of 0.87 and 0.83, respectively; LR and BN had similar C-statistics of 0.80. Significant factors associated with stroke included atrial fibrillation (AF), hypertension (HT), antiplatelets, HDL, and age. AF, HT, and antihypertensive medication were common significant factors across most models, with AF being the strongest factor in LR, XGBoost, BN, and TAN models.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our study developed stroke prediction models to identify crucial predictive factors such as AF, HT, or systolic blood pressure or antihypertensive medication, anticoagulant medication, HDL, age, and statin use in high-risk patients. The explainable XGBoost was the best model in predicting stroke risk, followed by EBM.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>stroke</kwd>
        <kwd>machine learning</kwd>
        <kwd>risk prediction model</kwd>
        <kwd>explainable artificial Intelligence</kwd>
        <kwd>risk factor</kwd>
        <kwd>cohort study</kwd>
        <kwd>high-risk patient</kwd>
        <kwd>hypertension</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Cardiovascular disease, especially stroke, is a major cause of death globally. Many risk factors for stroke include nonmodifiable (eg, ethnicity, age, and sex) and modifiable risk factors (eg, hypertension [HT], diabetes mellitus [DM], dyslipidemia [DLP], smoking, and alcohol consumption) [<xref ref-type="bibr" rid="ref1">1</xref>]. Improved understanding of disease prediction and risk stratification are active epidemiological research areas to help clinicians target preventive treatment to those most likely to benefit.</p>
      <p>The American Heart Association or American Stroke Association defines ischemic and hemorrhagic stroke [<xref ref-type="bibr" rid="ref2">2</xref>]. Ischemic stroke is defined as an episode of neurological dysfunction caused by focal cerebral, spinal, or retinal infarction. A hemorrhagic stroke is characterized by an intracerebral hemorrhage, which involves bleeding within the brain tissue (parenchyma) or ventricular system. This condition, which is not caused by trauma, encompasses instances of spontaneous parenchymal hemorrhages or those occurring following a brain infarction. The rapid development of neurological dysfunction symptoms is a defining consequence of this internal bleeding.</p>
      <p>There are 2 common sources of ischemic stroke: atherosclerotic stroke and cerebral embolism [<xref ref-type="bibr" rid="ref3">3</xref>], with the former being more common. Atherosclerosis within a significant cerebral blood vessel can vary in severity from small changes in diameter to severe stenosis that can cause clotting at the site of the atherosclerotic plaque leading to blood flow obstruction, causing a stroke [<xref ref-type="bibr" rid="ref4">4</xref>]. While a cerebral embolism can originate from other regions of the body, sometimes as a consequence of atrial fibrillation (AF), the emboli travel and obstruct the distal cerebral arteries preventing brain tissue perfusion leading to ischemia.</p>
      <p>There are multiple risk factors for stroke given the various pathological pathways involved [<xref ref-type="bibr" rid="ref5">5</xref>]. The Framingham Stroke Risk Profile is a composite vascular risk score that predicts 10-year stroke risk based on 8 risk factors, that is, age, systolic blood pressure (SBP), antihypertensive therapy, DM, cigarette smoking, cardiovascular disease, AF, and left ventricular hypertrophy [<xref ref-type="bibr" rid="ref6">6</xref>]. The INTERSTROKE consortia identified 10 modifiable risk factors associated with 90% of the stroke population-attributable risk [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. HT is regarded as the most important modifiable risk factor for hemorrhagic stroke, while recent smoking, DM, apolipoproteins, and cardiac causes are more critical factors associated with ischemic stroke.</p>
      <p>Risk or prognostic prediction models of stroke have been developed using conventional statistical methods (such as multiple logistic regression [LR] or Cox proportion hazard [CPH] models) based on linear relationships with the outcome measure, allowing for 2-way interactions between risk factors [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. In reality, the interaction between risk factors may be more complex, of a higher order, or nonlinear. Machine learning (ML) models free from prior hypotheses have been recently used for disease prediction given their ability to better consider the interactions present, including nonlinear relationships [<xref ref-type="bibr" rid="ref12">12</xref>]. However, the causal inference of these methods remains questionable, in particular, whether these ML models actually reflect the underlying relevant biology or simply improve prognostic performance.</p>
      <p>Many ML models (eg, decision tree, tree ensembles, support vector machines, and neural networks) and deep learning approaches have been compared to conventional statistical models to assess their ability to detect nonlinear associations and multifaceted interactions [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. Deep learning models are composed of multiple hidden layers that include millions of parameters without clear mechanistic meaning, representing “black-box” models with little transparency [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. To address this shortcoming, explainable ML approaches have become popular by improving features such as understandability, comprehensibility, interpretability, explainability, and transparency [<xref ref-type="bibr" rid="ref18">18</xref>]. Explainable models include Bayesian network (BN) and tree-augmented Naïve Bayes (TAN) models, both of which are probabilistic graphical models [<xref ref-type="bibr" rid="ref20">20</xref>]. An explainable boosting machine (EBM) is based on a generalized additive model and is considered a ”glass-box” model given its improved transparency and interpretability [<xref ref-type="bibr" rid="ref21">21</xref>]. These models excel in capturing complex relationships and dependencies among features, providing a more comprehensive understanding of the data structure and interplay between different risk factors when compared with the traditional statistical LR model. Furthermore, extreme gradient boosting (XGBoost) is considered a state-of-the-art approach for evaluating tabular data [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
      <p>Therefore, this study used real-world cohort data and explainable ML models to identify risk factors for stroke occurrence in high-risk patients. The importance and ranking of risk factors were used as a proxy for explainability.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>This study is a retrospective cohort analysis of high-risk patients with stroke treated at Ramathibodi Hospital in Bangkok, Thailand, from January 2010 to December 2020. The study included patients aged 18 years or older with at least 1 diagnosis of HT, AF, DM, or DLP. Participants were excluded if they had a prior stroke at the initial hospital visit or had only 1 visit during the study period.</p>
        <p>The patient cohort was identified from Ramathibodi Hospital's electronic database using the International Classification of Diseases, 10th Revision (ICD-10) codes for risk factors and clinical features, such as HT (I10-I16), DM (E08-E13), AF (I48), and DLP (E78). The primary end points of interest were the development of ischemic stroke (I63) and hemorrhagic stroke (I61), as indicated by their respective ICD-10 codes. The features and criteria used in this study can be found in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
      <sec>
        <title>Predictive Features and Outcome</title>
        <p>Each patient was followed up until stroke occurrence, loss to follow-up, or censoring at study end (December 31, 2020). The latter 2 events were censored on their final visit or study end date, respectively.</p>
        <p>Baseline study predictive features included age, sex, AF, HT, DM, DLP, SBP, plasma glucose (PG), serum creatinine, BMI, low-density lipoprotein and high-density lipoprotein (HDL), triglyceride level, and medications (antihypertensives, antiplatelets, oral hypoglycemics and insulin, statin and nonstatin lipid-lowering drugs, and anticoagulants). These baseline features were identified and retrieved when patients were first identified in our electronic medical records. The missing data in this study, assumed to be missing at random, were filled in using multiple imputation by chained equations via scikit-learn’s IterativeImputer [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. The percentage of missing data and features used in multiple imputation by chained equations for each imputed variable are detailed in Table S1-S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Continuous data were categorized on the basis of previous literature to improve interpretation and as a requirement of the BN model [<xref ref-type="bibr" rid="ref25">25</xref>]. Details of discretization are provided in Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. We randomly separated the data by hospital numbers into development and test sets with a ratio of 80:20; each patient appeared in only 1 data set to maintain independence between the data sets. Characteristics of patients between the 2 data sets are comparable, see Table S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
      <sec>
        <title>Model Construction</title>
        <p>We compared model performance and explainability between LR, CPH, BN, TAN, XGBoost, and EBM. We normalized continuous variables and used recursive feature elimination to select features in the LR model, whereas feature selection in XGBoost and EBM included self-selecting features during node splitting [<xref ref-type="bibr" rid="ref26">26</xref>]. We manually selected features in the BN and TAN based on stroke pathophysiology and considered the appropriate network structure.</p>
        <p>Scikit-learn served as the ML library for LR and XGBoost, with hyperparameter tuning using grid and random searches with successive halving (HalvingGridSearchCV and HalvingRandomSearchCV) and assigned imbalance ratio as weights to counter imbalanced class effects. We extracted LR coefficients and XGBoost’s features’ importance together with Shapley Additive Explanations (SHAP) to represent their explainability [<xref ref-type="bibr" rid="ref27">27</xref>]. We constructed EBM using the open-source package <italic>InterpretML</italic> (Microsoft) [<xref ref-type="bibr" rid="ref21">21</xref>]. Variable and interaction effects were plotted to determine their impact on the outcome.</p>
        <p>We built a BN using GeNIe Modeler (BayesFusion, LLC) software based on the known causal pathways of disease [<xref ref-type="bibr" rid="ref28">28</xref>] and trained it using discretized data. TAN structures were also determined using the training data and GeNIe (BayesFusion, LLC) software. The architectural details of the BN and TAN are shown in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>. Models were evaluated with C-statistics and <italic>F</italic><sub>1</sub>-scores. C-statistics, or area under receiver operating characteristics curve (AUC-ROC), provide a measure of a models’ ability to accurately distinguish between positive and negative classes (0.5 being no predictive ability beyond chance and 1 being perfect prediction), while the <italic>F</italic><sub>1</sub>-score represents a measurement of the balance between precision and recall in binary classification, which computes by harmonic mean between precision and recall.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>The data were anonymized to ensure confidentiality and privacy protection. This study was approved by Human Research Ethics Committee, Faculty of Medicine Ramathibodi Hospital, Mahidol University (COA. MURA2021/255). The committee waived the need to obtain consent for the collection, analysis, and publication of the retrospectively obtained and anonymized data for this noninterventional study.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>A total of 275,247 high-risk patients were included in this cohort, of whom 9659 (3.5%) experienced a stroke. Specifically, 7874 patients had an ischemic stroke, and 2427 patients had a hemorrhagic stroke. The patient cohort included 19,324 (7%) patients with AF, 98,836 (36%) with DM, 228,055 (83%) with DLP, and 211,430 (77%) with HT. <xref ref-type="table" rid="table1">Table 1</xref> presents the baseline characteristics, revealing significant differences between the stroke and nonstroke groups for almost all variables, except for DLP (<italic>P</italic>=.70). The data set was divided into development and validation sets, comprising 220,198 and 55,049 patients, respectively.</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Cohort summary statistics.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="30"/>
          <col width="300"/>
          <col width="0"/>
          <col width="270"/>
          <col width="0"/>
          <col width="270"/>
          <col width="0"/>
          <col width="0"/>
          <col width="100"/>
          <thead>
            <tr valign="top">
              <td colspan="4">
                <break/>
              </td>
              <td colspan="2">Stroke (N=9659)</td>
              <td colspan="2">Nonstroke (N=265,588)</td>
              <td colspan="2"><italic>P</italic> value</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="4">Age (years), mean (SD)</td>
              <td colspan="2">64.7 (13)</td>
              <td colspan="2">58 (14.1)</td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td colspan="9">
                <bold>Sex</bold>
              </td>
              <td>&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Male, n (%)</td>
              <td colspan="2">5107 (0.05)</td>
              <td colspan="2">101,700 (0.95)</td>
              <td colspan="2">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Female, n (%)</td>
              <td colspan="2">4552 (0.03)</td>
              <td colspan="2">168,440 (0.97)</td>
              <td colspan="2">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="10">
                <bold>Medication,</bold>
                <bold>n (%)</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="7">
                <bold>Antihypertensive medication</bold>
              </td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Yes</td>
              <td colspan="2">4096 (0.03)</td>
              <td colspan="2">141,188 (0.97)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>No</td>
              <td colspan="2">5563 (0.04)</td>
              <td colspan="2">124,400 (0.96)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="7">
                <bold>Hypoglycemic medication</bold>
              </td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Yes</td>
              <td colspan="2">1659 (0.03)</td>
              <td colspan="2">59,150 (0.97)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>No</td>
              <td colspan="2">8000 (0.04)</td>
              <td colspan="2">206,438 (0.96)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="7">
                <bold>Lipid-lowering medication (nonstatin)</bold>
              </td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Yes</td>
              <td colspan="2">913 (0.02)</td>
              <td colspan="2">38,580 (0.98)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>No</td>
              <td colspan="2">8746 (0.04)</td>
              <td colspan="2">227,008 (0.96)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="7">
                <bold>Statin medication</bold>
              </td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Yes</td>
              <td colspan="2">3369 (0.03)</td>
              <td colspan="2">126,508 (0.97)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>No</td>
              <td colspan="2">6290 (0.04)</td>
              <td colspan="2">145,370 (0.96)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="7">
                <bold>Antiplatelet medication</bold>
              </td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Yes</td>
              <td colspan="2">2868 (0.05)</td>
              <td colspan="2">54,992 (0.95)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>No</td>
              <td colspan="2">6791 (0.03)</td>
              <td colspan="2">217,387 (0.97)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="7">
                <bold>Anticoagulant medication</bold>
              </td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Yes</td>
              <td colspan="2">622 (0.06)</td>
              <td colspan="2">10,015 (0.94)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>No</td>
              <td colspan="2">9037 (0.03)</td>
              <td colspan="2">255,573 (0.97)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="10">
                <bold>Vital signs, mean (SD)</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Systolic blood pressure (mm Hg)</td>
              <td colspan="2">138 (22.7)</td>
              <td colspan="2">133.6 (20.9)</td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Diastolic blood pressure (mm Hg)</td>
              <td colspan="2">77.5 (11.1)</td>
              <td colspan="2">78 (10)</td>
              <td colspan="2">.002</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">BMI (kg/m<sup>2</sup>)</td>
              <td colspan="2">25.2 (4.4)</td>
              <td colspan="2">25.5 (4.8)</td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td colspan="10">
                <bold>Risk factors,</bold>
                <bold>n (%)</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="7">
                <bold>Atrial fibrillation</bold>
              </td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Present</td>
              <td colspan="2">2591 (0.13)</td>
              <td colspan="2">16,733 (0.87)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Absent</td>
              <td colspan="2">7068 (0.02)</td>
              <td colspan="2">248,855 (0.98)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="7">
                <bold>Dyslipidemia</bold>
              </td>
              <td colspan="2">.70</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Present</td>
              <td colspan="2">8017 (0.04)</td>
              <td colspan="2">220,038 (0.96)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Absent</td>
              <td colspan="2">1642 (0.03)</td>
              <td colspan="2">45,550 (0.97)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="7">
                <bold>Hypertension</bold>
              </td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Present</td>
              <td colspan="2">8936 (0.04)</td>
              <td colspan="2">202,494 (0.96)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Absent</td>
              <td colspan="2">723 (0.01)</td>
              <td colspan="2">63,094 (0.99)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="7">
                <bold>Diabetes mellitus</bold>
              </td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Present</td>
              <td colspan="2">4202 (0.04)</td>
              <td colspan="2">94,634 (0.96)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>
                <break/>
              </td>
              <td>Absent</td>
              <td colspan="2">5457 (0.03)</td>
              <td colspan="2">170,954 (0.97)</td>
              <td colspan="3">
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="10">
                <bold>Laboratory values,</bold>
                <bold>mean (SD)</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Plasma creatinine (mg/dL)</td>
              <td colspan="2">1.2 (1.4)</td>
              <td colspan="2">1.14 (1.7)</td>
              <td colspan="2">.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Blood sugar (mg/dL)</td>
              <td colspan="2">128.3 (64.2)</td>
              <td colspan="2">111.6 (46)</td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Hemoglobin A<sub>1c</sub> (%)</td>
              <td colspan="2">6.7 (1.7)</td>
              <td colspan="2">6.4 (1.5)</td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Low-density lipoprotein (LDL) (mg/dL)</td>
              <td colspan="2">119.9 (43.2)</td>
              <td colspan="2">128.3 (41.1)</td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">High-density lipoprotein (HDL) (mg/dL)</td>
              <td colspan="2">45.7 (13.5)</td>
              <td colspan="2">50.9 (14)</td>
              <td colspan="2">&#60;.001</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td colspan="3">Triglyceride (md/dL)</td>
              <td colspan="2">142 (96.7)</td>
              <td colspan="2">136.1 (94.8)</td>
              <td colspan="2">&#60;.001</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>In terms of discriminative performance, the XGBoost model yielded the highest C-statistic (0.89, 95% CI 0.88-0.90) and <italic>F</italic><sub>1</sub>-score (0.80), followed by EBM and TAN with C-statistics of 0.87 (95% CI 0.86-0.87) and 0.83 (95% CI 0.82-0.83), respectively. LR and BN models demonstrated similar performances, with C-statistics of 0.80 (95% CI 0.79-0.81). These results are presented in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Model performance of stroke risk prediction over a 10-year period.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="340"/>
          <col width="330"/>
          <col width="330"/>
          <thead>
            <tr valign="top">
              <td>Model</td>
              <td>C-statistics (95% CI)</td>
              <td><italic>F</italic><sub>1</sub>-score</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Logistic regression</td>
              <td>0.80 (0.79-0.81)</td>
              <td>0.73</td>
            </tr>
            <tr valign="top">
              <td>Bayesian network</td>
              <td>0.80 (0.79-0.81)</td>
              <td>0.73</td>
            </tr>
            <tr valign="top">
              <td>Explainable boosting machine</td>
              <td>0.87 (0.86-0.87)</td>
              <td>0.78</td>
            </tr>
            <tr valign="top">
              <td>XGBoost<sup>a</sup></td>
              <td>0.89 (0.88-0.90)</td>
              <td>0.80</td>
            </tr>
            <tr valign="top">
              <td>Tree-augmented Naïve Bayes</td>
              <td>0.83 (0.82-0.83)</td>
              <td>0.73</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup>XGBoost: extreme gradient boosting.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>The LR model identified several factors significantly associated with stroke including AF (odds ratio [OR] 5.93, 95% CI 5.86-5.99), HT (OR 5.14, 95% CI 5.1-5.18), antihypertensive medication (OR 0.3, 95% CI 0.24-0.35), antiplatelets (OR 3.01, 95% CI 2.96-3.07), HDL (OR 0.76, 95% CI 0.74-0.78), and age (OR 1.31, 95% CI 1.29-1.33) as shown in <xref ref-type="table" rid="table3">Table 3</xref>. Based on feature importance ranking and SHA<italic>P</italic> values, the XGBoost model identified AF, SBP, HDL, PG, antihypertensive medication, HT, and antiplatelets as significant factors associated with stroke occurrence (Figure S1 in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). The EBM model identified PG, antihypertensive medication, SBP, HDL, HT, and AF as significant features, with interaction terms providing no additional predictive power (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). For the BN and TAN models, advanced age (&#62;75 years) combined with AF were the strongest factors. Overall, AF, HT, and antihypertensive medication emerged as common significant factors across most models. Notably, AF was the strongest factor in the LR, XGBoost, BN, and TAN models. Receiver operating characteristic and precision-recall curves of each model are provided in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Odds ratio (OR) of variables from multivariate logistic regression model.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="500"/>
          <col width="0"/>
          <col width="470"/>
          <thead>
            <tr valign="top">
              <td colspan="3">
                <break/>
              </td>
              <td>OR (95% CI)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="4">
                <bold>Categorical variable</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>AF<sup>a</sup></td>
              <td colspan="2">5.93 (5.86-5.99)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>HT<sup>b</sup></td>
              <td colspan="2">5.14 (5.1-5.18)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>antiHT<sup>c</sup></td>
              <td colspan="2">0.3 (0.24-0.35)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>antiPL<sup>d</sup></td>
              <td colspan="2">3.01 (2.96-3.07)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>antiDM<sup>e</sup></td>
              <td colspan="2">0.51 (0.43-0.6)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>DLP<sup>f</sup></td>
              <td colspan="2">1.86 (1.78-1.93)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Statin</td>
              <td colspan="2">0.61 (0.56-0.67)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>antiDLP<sup>g</sup></td>
              <td colspan="2">0.67 (0.59-0.75)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>antiCoag<sup>h</sup></td>
              <td colspan="2">0.68 (0.58-0.79)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>isMale<sup>i</sup></td>
              <td colspan="2">1.4 (1.36-1.44)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>DM<sup>j</sup></td>
              <td colspan="2">1.31 (1.25-1.36)</td>
            </tr>
            <tr valign="top">
              <td colspan="4">
                <bold>Continuous variable</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>HDL<sup>k</sup> (mg/dL)</td>
              <td colspan="2">0.76 (0.74-0.78)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Age (years)</td>
              <td colspan="2">1.31 (1.29-1.33)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>PG<sup>l</sup> (mg/dL)</td>
              <td colspan="2">1.31 (1.29-1.32)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Cr<sup>m</sup> (mg/dL)</td>
              <td colspan="2">0.89 (0.87-0.91)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>SBP<sup>n</sup> (mmHg)</td>
              <td colspan="2">1.11 (1.09-1.13)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>BMIcalc<sup>o</sup> (kg/m<sup>2</sup>)</td>
              <td colspan="2">0.94 (0.92-0.96)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>LDL<sup>p</sup> (mg/dL)</td>
              <td colspan="2">1.04 (1.02-1.07)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>TG<sup>q</sup> (mg/dL)</td>
              <td colspan="2">0.97 (0.95-0.99)</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table3fn1">
            <p><sup>a</sup>AF: atrial fibrillation.</p>
          </fn>
          <fn id="table3fn2">
            <p><sup>b</sup>HT: hypertension.</p>
          </fn>
          <fn id="table3fn3">
            <p><sup>c</sup>antiHT: antihypertensive medication.</p>
          </fn>
          <fn id="table3fn4">
            <p><sup>d</sup>antiPL: antiplatelet medication.</p>
          </fn>
          <fn id="table3fn5">
            <p><sup>e</sup>antiDM: hypoglycemic medication.</p>
          </fn>
          <fn id="table3fn6">
            <p><sup>f</sup>DLP: dyslipidemia.</p>
          </fn>
          <fn id="table3fn7">
            <p><sup>g</sup>antiDLP: nonstatin lipid-lowering medication.</p>
          </fn>
          <fn id="table3fn8">
            <p><sup>h</sup>antiCoag: anticoagulant medication.</p>
          </fn>
          <fn id="table3fn9">
            <p><sup>i</sup>isMale: male.</p>
          </fn>
          <fn id="table3fn10">
            <p><sup>j</sup>DM: diabetes mellitus.</p>
          </fn>
          <fn id="table3fn11">
            <p><sup>k</sup>HDL: high-density lipoprotein.</p>
          </fn>
          <fn id="table3fn12">
            <p><sup>l</sup>PG: plasma glucose.</p>
          </fn>
          <fn id="table3fn13">
            <p><sup>m</sup>Cr: serum creatinine.</p>
          </fn>
          <fn id="table3fn14">
            <p><sup>n</sup>SBP: systolic blood pressure.</p>
          </fn>
          <fn id="table3fn15">
            <p><sup>o</sup>BMIcalc: body mass index.</p>
          </fn>
          <fn id="table3fn16">
            <p><sup>p</sup>LDL: low-density lipoprotein.</p>
          </fn>
          <fn id="table3fn17">
            <p><sup>q</sup>TG: triglycerides.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>We investigated a retrospective cohort of patients at high risk of developing stroke to develop prediction models for stroke occurrence. The models identified AF, HT, or SBP or antihypertensive medication, anticoagulant medication, HDL, age, and statin use as important features in predicting stroke using both conventional LR and ML models. Our findings provide robust, transparent, and explainable ML models for stroke risk prediction using routinely collected clinical data accessible in general health care settings.</p>
      </sec>
      <sec>
        <title>Explainability</title>
        <p>Explainability and transparency of risk prediction models are important for facilitating the prescribing of individualized treatments (precision medicine) in real-world clinical settings [<xref ref-type="bibr" rid="ref29">29</xref>]. Improved patient understanding also leads to empowerment and improved medication or treatment adherence [<xref ref-type="bibr" rid="ref30">30</xref>]. Improved understanding and use of ML models in both prehoc and post hoc analyses are growing. According to Arrieta et al [<xref ref-type="bibr" rid="ref18">18</xref>], LR, CPH, BN, TAN, and EBM models are considered transparent and understandable in themselves, while XGBoost requires post hoc analysis to improve explainability, including local interpretable model-agnostic explanations [<xref ref-type="bibr" rid="ref31">31</xref>], SHAP, partial dependence plots, feature importance [<xref ref-type="bibr" rid="ref32">32</xref>], or DeepLIFT [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. Explainability can be classified into 3 types: application-grounded, human-grounded, and functionality-grounded [<xref ref-type="bibr" rid="ref34">34</xref>]. Application- and human-grounded categories involve human interpretability, that is, models that are easily comprehensible to a layperson, without the need for specialized technical knowledge or expertise; functionality grounded refers to the methods or algorithms used and their quantitative evaluation.</p>
        <p>Some studies have explored the benefits of white-box ML prediction models, such as BN and EBM. For example, Park et al [<xref ref-type="bibr" rid="ref35">35</xref>] used BN with a TAN algorithm to predict 3-month functional outcomes after stroke with an AUC-ROC of 0.889. Kanwar et al [<xref ref-type="bibr" rid="ref36">36</xref>] used a BN-derived risk prediction model that improved the prediction of 1-year survival in patients with pulmonary arterial HT compared to the Kaplan-Meier method in REVEAL (version 2.0), with an AUC-ROC of 0.8 versus 0.76 [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. Lou et al [<xref ref-type="bibr" rid="ref39">39</xref>] showed that EBM approaches could achieve accuracy close to that provided by random forest models while providing good interpretability. White-box EBM approaches are also known as “glass-box” models that allow for interaction terms between variables within the model. All of these models performed well, and their white-box nature enables transparency, making them useful for clinicians to explain and translate medical knowledge for a more confident application in clinical settings. A previous study compared multiple ML models to predict stroke and address the class imbalance problem using a multilayer perceptron classifier to achieve the lowest false-negative rate (18.60%) and SHAP to investigate the impact of risk factors on stroke prediction [<xref ref-type="bibr" rid="ref40">40</xref>]. However, this approach was considered a post hoc analysis and not representative of a white-box model.</p>
        <p>To date, investigation of the predictive capabilities of multiple explainable models in the context of stroke risk assessment using real-world data has been limited. Our study addresses this knowledge gap through a novel approach that compares the performance metrics for several explainable models, resulting in significantly improved predictive accuracy, further informing the existing literature. ML models generally outperform traditional statistical methods, supported by AUC-ROCs that represent sufficient improvement to be clinically actionable, that is, AUC-ROCs over 0.80-0.85. This does not mean that all ML methods are superior to traditional statistical methods in all applications, and users should keep an open mind. Another benefit of transparent and explainable models is the rational and selective approach to the choice of predictors. Data mining methods used without regard to causative pathways can include variables that cause collider bias and reduce model performance or may lead to embedded bias within the observational data.</p>
        <p>We seek to further contextualize our study findings in relation to the existing literature while also acknowledging the unique characteristics of our study population. The significant features we identified as contributing to stroke risks, such as AF and HT, have been extensively reported previously, providing validation of our findings [<xref ref-type="bibr" rid="ref41">41</xref>]. However, it is important to note that our study offers additional insight into the strength and interaction of these risk factors to improve our understanding of stroke risk. They also show the potential to improve model performance over traditional approaches even when starting with an identical data set.</p>
        <p>The integration of these models into clinical workflows could provide real-time, personalized risk assessments, guiding clinicians toward more targeted and effective interventions. For instance, a patient identified as high risk could be prioritized for aggressive preventive measures, such as rigorous lifestyle modification, counseling, or intensified medication regimens. Conversely, if a patient is predicted to have a lower stroke risk, they may avoid unnecessary treatments and potential side effects, or they might require less intensive follow-up within the hospital setting. This individualized approach would enhance the personalization of stroke prevention strategies, potentially improving patient outcomes.</p>
        <p>In addition, the interpretability of the models used helps health care professionals to better understand the key drivers of the predicted stroke risk. This transparency could facilitate more informed and confident decision-making, bridging the gap between complex ML algorithms and their practical application in a clinical setting. Ultimately, these advances could lead to more efficient and effective personalized health care, underpinned by evidence-based, data-driven decisions.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>There were several limitations to our study. First, other important epidemiological factors, such as smoking status, education, and alcohol consumption, were not included within our risk prediction models as the information was not recorded in the electronic medical records. Many variables rely on the accuracy of ICD-10 coding, which may be subject to miscoding or misdiagnosis that would reduce model performance. Our study cohort encompassed a somewhat narrow demographic range of an “at-risk” population. We recognize that stroke risk factors may vary across different populations, highlighting the need for externally validating our stroke prediction model in the future before wider application.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Our study demonstrates predictive accuracy and explainability for stroke risk prediction models in high-risk patients. The key findings highlight the impact of AF, HT, and blood pressure control as significant risk factors for stroke emphasizing the potential benefits of screening and early detection, especially within patients for whom these risk factors are prominent. Furthermore, our findings confirm the robustness and interpretability of ML models such as XGBoost, EBM, and BN in handling complex, real-world health data and the potential to improve model performance even when starting with the same data set as traditional approaches.</p>
        <p>Looking ahead, we anticipate significant opportunities for further research using these approaches. The continued evolution of ML techniques provides an avenue for refining prediction models, possibly by incorporating additional or alternative feature sets. Moreover, future studies could explore the effects of different interventions on stroke risk, such as lifestyle modifications or novel therapeutic agents. In doing so, our understanding of stroke prevention and management may be enhanced, potentially improving patient outcomes. By pushing the boundaries of explainable ML in health care, these findings hold the potential to revolutionize clinical practice, empowering physicians and patients with clear, actionable insights for better health outcomes.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Data management.</p>
        <media xlink:href="cardio_v7i1e47736_app1.docx" xlink:title="DOCX File , 27 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Bayesian network and tree-augmented Naïve Bayes.</p>
        <media xlink:href="cardio_v7i1e47736_app2.docx" xlink:title="DOCX File , 723 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Extreme gradient boosting.</p>
        <media xlink:href="cardio_v7i1e47736_app3.docx" xlink:title="DOCX File , 61 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Explainable boosting machine.</p>
        <media xlink:href="cardio_v7i1e47736_app4.docx" xlink:title="DOCX File , 60 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Receiver operating characteristic curve and precision-recall curve from baseline models.</p>
        <media xlink:href="cardio_v7i1e47736_app5.docx" xlink:title="DOCX File , 110 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AF</term>
          <def>
            <p>atrial fibrillation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUC-ROC</term>
          <def>
            <p>area under receiver operating characteristics curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BN</term>
          <def>
            <p>Bayesian network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CPH</term>
          <def>
            <p>Cox proportional hazard</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">DLP</term>
          <def>
            <p>dyslipidemia</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">DM</term>
          <def>
            <p>diabetes mellitus</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">EBM</term>
          <def>
            <p>explainable boosting machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">HDL</term>
          <def>
            <p>high-density lipoprotein</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">HT</term>
          <def>
            <p>hypertension</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ICD-10</term>
          <def>
            <p>International Classification of Diseases, 10th Revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">LR</term>
          <def>
            <p>logistic regression</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">OR</term>
          <def>
            <p>odds ratio</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">PG</term>
          <def>
            <p>plasma glucose</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">SBP</term>
          <def>
            <p>systolic blood pressure</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">SHAP</term>
          <def>
            <p>Shapley Additive Explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">TAN</term>
          <def>
            <p>tree-augmented Naïve Bayes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">XGBoost</term>
          <def>
            <p>extreme gradient boosting</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was funded by the National Research Council of Thailand (N42A640323). The grant agency was not involved in review methods (selection of studies, risk of bias assessment, data extraction, data analysis, and interpretation of findings), paper writing, and did not impose any restriction regarding paper publication.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>Further use of data can be requested from the corresponding author.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>GBD 2017 Causes of Death Collaborators</collab>
          </person-group>
          <article-title>Global, regional, and national age-sex-specific mortality for 282 causes of death in 195 countries and territories, 1980-2017: a systematic analysis for the Global Burden of Disease Study 2017</article-title>
          <source>Lancet</source>
          <year>2018</year>
          <month>11</month>
          <day>10</day>
          <volume>392</volume>
          <issue>10159</issue>
          <fpage>1736</fpage>
          <lpage>1788</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0140-6736(18)32203-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(18)32203-7</pub-id>
          <pub-id pub-id-type="medline">30496103</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(18)32203-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC6227606</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sacco</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Kasner</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Broderick</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Caplan</surname>
              <given-names>LR</given-names>
            </name>
            <name name-style="western">
              <surname>Connors</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Culebras</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Elkind</surname>
              <given-names>MSV</given-names>
            </name>
            <name name-style="western">
              <surname>George</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Hamdan</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Higashida</surname>
              <given-names>RT</given-names>
            </name>
            <name name-style="western">
              <surname>Hoh</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Janis</surname>
              <given-names>LS</given-names>
            </name>
            <name name-style="western">
              <surname>Kase</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Kleindorfer</surname>
              <given-names>DO</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Moseley</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Turan</surname>
              <given-names>TN</given-names>
            </name>
            <name name-style="western">
              <surname>Valderrama</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Vinters</surname>
              <given-names>HV</given-names>
            </name>
            <collab>American Heart Association Stroke Council</collab>
            <collab>Council on Cardiovascular Surgery and Anesthesia</collab>
            <collab>Council on Cardiovascular Radiology and Intervention</collab>
            <collab>Council on Cardiovascular and Stroke Nursing</collab>
            <collab>Council on Epidemiology and Prevention</collab>
            <collab>Council on Peripheral Vascular Disease</collab>
            <collab>Council on Nutrition‚ Physical Activity and Metabolism</collab>
          </person-group>
          <article-title>An updated definition of stroke for the 21st century: a statement for healthcare professionals from the American Heart Association/American Stroke Association</article-title>
          <source>Stroke</source>
          <year>2013</year>
          <volume>44</volume>
          <issue>7</issue>
          <fpage>2064</fpage>
          <lpage>2089</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ahajournals.org/doi/10.1161/STR.0b013e318296aeca"/>
          </comment>
          <pub-id pub-id-type="doi">10.1161/STR.0b013e318296aeca</pub-id>
          <pub-id pub-id-type="medline">23652265</pub-id>
          <pub-id pub-id-type="pii">STR.0b013e318296aeca</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>Atherosclerosis and stroke</article-title>
          <source>American Stroke Association</source>
          <year>2018</year>
          <access-date>2023-06-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.stroke.org/en/about-stroke/stroke-risk-factors/atherosclerosis-and-stroke">https://www.stroke.org/en/about-stroke/stroke-risk-factors/atherosclerosis-and-stroke</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chimowitz</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Stroke caused by atherosclerosis of the major intracranial arteries</article-title>
          <source>Circ Res</source>
          <year>2017</year>
          <volume>120</volume>
          <issue>3</issue>
          <fpage>502</fpage>
          <lpage>513</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ahajournals.org/doi/10.1161/CIRCRESAHA.116.308441"/>
          </comment>
          <pub-id pub-id-type="doi">10.1161/CIRCRESAHA.116.308441</pub-id>
          <pub-id pub-id-type="medline">28154100</pub-id>
          <pub-id pub-id-type="pii">CIRCRESAHA.116.308441</pub-id>
          <pub-id pub-id-type="pmcid">PMC5312775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boehme</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Esenwa</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Elkind</surname>
              <given-names>MSV</given-names>
            </name>
          </person-group>
          <article-title>Stroke Risk Factors, Genetics, and Prevention</article-title>
          <source>Circ Res</source>
          <year>2017</year>
          <month>02</month>
          <day>03</day>
          <volume>120</volume>
          <issue>3</issue>
          <fpage>472</fpage>
          <lpage>495</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28154098"/>
          </comment>
          <pub-id pub-id-type="doi">10.1161/CIRCRESAHA.116.308398</pub-id>
          <pub-id pub-id-type="medline">28154098</pub-id>
          <pub-id pub-id-type="pii">CIRCRESAHA.116.308398</pub-id>
          <pub-id pub-id-type="pmcid">PMC5321635</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>D'Agostino</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Belanger</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kannel</surname>
              <given-names>WB</given-names>
            </name>
          </person-group>
          <article-title>Stroke risk profile: adjustment for antihypertensive medication. The Framingham study</article-title>
          <source>Stroke</source>
          <year>1994</year>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>40</fpage>
          <lpage>43</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ahajournals.org/doi/10.1161/01.STR.25.1.40"/>
          </comment>
          <pub-id pub-id-type="doi">10.1161/01.str.25.1.40</pub-id>
          <pub-id pub-id-type="medline">8266381</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Donnell</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Xavier</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chin</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Rao-Melacini</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rangarajan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pais</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>McQueen</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mondo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Damasceno</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lopez-Jaramillo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hankey</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dans</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Yusoff</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Truelsen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Diener</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Sacco</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Ryglewicz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Czlonkowska</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weimar</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yusuf</surname>
              <given-names>S</given-names>
            </name>
            <collab>INTERSTROKE investigators</collab>
          </person-group>
          <article-title>Risk factors for ischaemic and intracerebral haemorrhagic stroke in 22 countries (the INTERSTROKE study): a case-control study</article-title>
          <source>Lancet</source>
          <year>2010</year>
          <volume>376</volume>
          <issue>9735</issue>
          <fpage>112</fpage>
          <lpage>123</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(10)60834-3</pub-id>
          <pub-id pub-id-type="medline">20561675</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(10)60834-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Donnell</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chin</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Rangarajan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Xavier</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rao-Melacini</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Pais</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Agapay</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lopez-Jaramillo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Damasceno</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Langhorne</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>McQueen</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rosengren</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dehghan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hankey</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dans</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Elsayed</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Avezum</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mondo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Diener</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Ryglewicz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Czlonkowska</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pogosova</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Weimar</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Iqbal</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Diaz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yusoff</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yusufali</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Oguz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Penaherrera</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lanas</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ogah</surname>
              <given-names>OS</given-names>
            </name>
            <name name-style="western">
              <surname>Ogunniyi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Iversen</surname>
              <given-names>HK</given-names>
            </name>
            <name name-style="western">
              <surname>Malaga</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rumboldt</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Oveisgharan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Al Hussain</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Magazi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nilanont</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ferguson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pare</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yusuf</surname>
              <given-names>S</given-names>
            </name>
            <collab>INTERSTROKE investigators</collab>
          </person-group>
          <article-title>Global and regional effects of potentially modifiable risk factors associated with acute stroke in 32 countries (INTERSTROKE): a case-control study</article-title>
          <source>Lancet</source>
          <year>2016</year>
          <volume>388</volume>
          <issue>10046</issue>
          <fpage>761</fpage>
          <lpage>775</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(16)30506-2</pub-id>
          <pub-id pub-id-type="medline">27431356</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(16)30506-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dufouil</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Beiser</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McLure</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Tzourio</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Howard</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Westwood</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Himali</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Aparicio</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kelly-Hayes</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ritchie</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kase</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Pikula</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Romero</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>D'Agostino</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Samieri</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Vasan</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Chêne</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Howard</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Seshadri</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Revised framingham stroke risk profile to reflect temporal trends</article-title>
          <source>Circulation</source>
          <year>2017</year>
          <volume>135</volume>
          <issue>12</issue>
          <fpage>1145</fpage>
          <lpage>1159</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ahajournals.org/doi/10.1161/CIRCULATIONAHA.115.021275"/>
          </comment>
          <pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.115.021275</pub-id>
          <pub-id pub-id-type="medline">28159800</pub-id>
          <pub-id pub-id-type="pii">CIRCULATIONAHA.115.021275</pub-id>
          <pub-id pub-id-type="pmcid">PMC5504355</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boysen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Nyboe</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Appleyard</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sørensen</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Boas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Somnier</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Schnohr</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Stroke incidence and risk factors for stroke in Copenhagen, Denmark</article-title>
          <source>Stroke</source>
          <year>1988</year>
          <volume>19</volume>
          <issue>11</issue>
          <fpage>1345</fpage>
          <lpage>1353</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ahajournals.org/doi/10.1161/01.STR.19.11.1345"/>
          </comment>
          <pub-id pub-id-type="doi">10.1161/01.str.19.11.1345</pub-id>
          <pub-id pub-id-type="medline">3188119</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gage</surname>
              <given-names>BF</given-names>
            </name>
            <name name-style="western">
              <surname>Waterman</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Shannon</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Boechler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rich</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Radford</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Validation of clinical classification schemes for predicting stroke: results from the National Registry of Atrial Fibrillation</article-title>
          <source>JAMA</source>
          <year>2001</year>
          <volume>285</volume>
          <issue>22</issue>
          <fpage>2864</fpage>
          <lpage>2870</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jamanetwork.com/journals/jama/fullarticle/193912"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.285.22.2864</pub-id>
          <pub-id pub-id-type="medline">11401607</pub-id>
          <pub-id pub-id-type="pii">joc01974</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khosla</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>CCY</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>HK</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>An integrated machine learning approach to stroke prediction</article-title>
          <year>2010</year>
          <conf-name>Proceedings of the 16th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>July 25-28, 2010</conf-date>
          <conf-loc>Washington DC, USA</conf-loc>
          <publisher-loc>New York, NY, United States</publisher-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <fpage>183</fpage>
          <lpage>192</lpage>
          <pub-id pub-id-type="doi">10.1145/1835804.1835830</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sirsat</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Fermé</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Câmara</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for brain stroke: a review</article-title>
          <source>J Stroke Cerebrovasc Dis</source>
          <year>2020</year>
          <volume>29</volume>
          <issue>10</issue>
          <fpage>105162</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jstrokecerebrovasdis.2020.105162</pub-id>
          <pub-id pub-id-type="medline">32912543</pub-id>
          <pub-id pub-id-type="pii">S1052-3057(20)30580-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huysmans</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dejaeger</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mues</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Vanthienen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Baesens</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>An empirical evaluation of the comprehensibility of decision table, tree and rule based predictive models</article-title>
          <source>Decis Support Syst</source>
          <year>2011</year>
          <volume>51</volume>
          <issue>1</issue>
          <fpage>141</fpage>
          <lpage>154</lpage>
          <pub-id pub-id-type="doi">10.1016/j.dss.2010.12.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Freitas</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>Comprehensible classification models</article-title>
          <source>SIGKDD Explor Newsl</source>
          <year>2014</year>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1145/2594473.2594475</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Castelvecchi</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Can we open the black box of AI?</article-title>
          <source>Nature</source>
          <year>2016</year>
          <volume>538</volume>
          <issue>7623</issue>
          <fpage>20</fpage>
          <lpage>23</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nature.com/news/can-we-open-the-black-box-of-ai-1.20731"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/538020a</pub-id>
          <pub-id pub-id-type="medline">27708329</pub-id>
          <pub-id pub-id-type="pii">538020a</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guidotti</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Monreale</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ruggieri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Turini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Giannotti</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Pedreschi</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A survey of methods for explaining black box models</article-title>
          <source>ACM Comput Surv</source>
          <year>2018</year>
          <volume>51</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <lpage>42</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/abs/10.1145/3236009"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3236009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arrieta</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Díaz-Rodríguez</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Del Ser</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bennetot</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tabik</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Barbado</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gil-Lopez</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Molina</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Benjamins</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chatila</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Herrera</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Explainable artificial intelligence (XAI): concepts, taxonomies, opportunities and challenges toward responsible AI</article-title>
          <source>Inf Fusion</source>
          <year>2020</year>
          <volume>58</volume>
          <fpage>82</fpage>
          <lpage>115</lpage>
          <pub-id pub-id-type="doi">10.1016/j.inffus.2019.12.012</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Unbox the black-box for the medical explainable AI via multi-modal and multi-centre data fusion: a mini-review, two showcases and beyond</article-title>
          <source>Inf Fusion</source>
          <year>2022</year>
          <volume>77</volume>
          <fpage>29</fpage>
          <lpage>52</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/pii/S1566253521001597?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.inffus.2021.07.016</pub-id>
          <pub-id pub-id-type="medline">34980946</pub-id>
          <pub-id pub-id-type="pii">S1566-2535(21)00159-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC8459787</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Geiger</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Goldszmidt</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Bayesian network classifiers</article-title>
          <source>Mach Learn</source>
          <year>1997</year>
          <volume>29</volume>
          <fpage>131</fpage>
          <lpage>163</lpage>
          <pub-id pub-id-type="doi">10.1023/A:1007465528199</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nori</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jenkins</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Koch</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Caruana</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Interpretml: a unified framework for machine learning interpretability</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on September 19, 2019</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1909.09223"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shwartz-Ziv</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Armon</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Tabular data: deep learning is not all you need</article-title>
          <source>Inf Fusion</source>
          <year>2022</year>
          <volume>81</volume>
          <fpage>84</fpage>
          <lpage>90</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/pii/S1566253521002360"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.inffus.2021.11.011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>White</surname>
              <given-names>IR</given-names>
            </name>
            <name name-style="western">
              <surname>Royston</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Multiple imputation using chained equations: issues and guidance for practice</article-title>
          <source>Stat Med</source>
          <year>2011</year>
          <volume>30</volume>
          <issue>4</issue>
          <fpage>377</fpage>
          <lpage>399</lpage>
          <pub-id pub-id-type="doi">10.1002/sim.4067</pub-id>
          <pub-id pub-id-type="medline">21225900</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Michel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Grisel</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Blondel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Prettenhofer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dubourg</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vanderplas</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn: machine learning in Python</article-title>
          <source>J Mach Learn Res</source>
          <year>2011</year>
          <volume>12</volume>
          <fpage>2825</fpage>
          <lpage>2830</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Whelton</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Carey</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Aronow</surname>
              <given-names>WS</given-names>
            </name>
            <name name-style="western">
              <surname>Casey</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Himmelfarb</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>DePalma</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Gidding</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jamerson</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>MacLaughlin</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Muntner</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ovbiagele</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Spencer</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Stafford</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Taler</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Williamson</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>2017 ACC/AHA/AAPA/ABC/ACPM/AGS/APhA/ASH/ASPC/NMA/PCNA guideline for the prevention, detection, evaluation, and management of high blood pressure in adults: a report of the American College of Cardiology/American Heart Association Task Force on clinical practice guidelines</article-title>
          <source>J Am Coll Cardiol</source>
          <year>2018</year>
          <volume>71</volume>
          <issue>19</issue>
          <fpage>e127</fpage>
          <lpage>e248</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0735-1097(17)41519-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jacc.2017.11.006</pub-id>
          <pub-id pub-id-type="medline">29146535</pub-id>
          <pub-id pub-id-type="pii">S0735-1097(17)41519-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guyon</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Weston</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Barnhill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vapnik</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Gene selection for cancer classification using support vector machines</article-title>
          <source>Mach Learn</source>
          <year>2002</year>
          <volume>46</volume>
          <issue>1-3</issue>
          <fpage>389</fpage>
          <lpage>422</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/article/10.1023/A:1012487302797"/>
          </comment>
          <pub-id pub-id-type="doi">10.1023/A:1012487302797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SI</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to interpreting model predictions</article-title>
          <year>2017</year>
          <conf-name>31st Conference on Neural Information Processing Systems (NIPS 2017)</conf-name>
          <conf-date>December 4-9, 2017</conf-date>
          <conf-loc>Long Beach, CA, USA</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://proceedings.neurips.cc/paper_files/paper/2017/file/8a20a8621978632d76c43dfd28b67767-Paper.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>BayesFusion, LLC</collab>
          </person-group>
          <article-title>GeNie</article-title>
          <source>BayesFusion Downloads for Academia</source>
          <year>2016</year>
          <access-date>2023-06-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://download.bayesfusion.com/files.html">https://download.bayesfusion.com/files.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Holzinger</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Biemann</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pattichis</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Kell</surname>
              <given-names>DB</given-names>
            </name>
          </person-group>
          <article-title>What do we need to build explainable AI systems for the medical domain?</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on December 28, 2017</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1712.09923"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1712.09923</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tjoa</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A survey on explainable artificial intelligence (XAI): toward medical XAI</article-title>
          <source>IEEE Trans Neural Netw Learn Syst</source>
          <year>2021</year>
          <volume>32</volume>
          <issue>11</issue>
          <fpage>4793</fpage>
          <lpage>4813</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ieeexplore.ieee.org/document/9233366"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/TNNLS.2020.3027314</pub-id>
          <pub-id pub-id-type="medline">33079674</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ribeiro</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>"Why should I trust you?": explaining the predictions of any classifier</article-title>
          <year>2016</year>
          <conf-name>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>August 13-17, 2016</conf-date>
          <conf-loc>San Francisco, California, USA</conf-loc>
          <publisher-loc>New York, NY, United States</publisher-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <fpage>1135</fpage>
          <lpage>1144</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/abs/10.1145/2939672.2939778"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2939672.2939778</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Breiman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stone</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Olshen</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <source>Classification and Regression Trees</source>
          <year>1984</year>
          <publisher-loc>Boca Raton, FL</publisher-loc>
          <publisher-name>Chapman &#38; Hall/CRC</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shrikumar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Greenside</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kundaje</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Learning important features through propagating activation differences</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on October 12, 2019</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1704.02685"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doshi-Velez</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Towards a rigorous science of interpretable machine learning</article-title>
          <source>ArXiv.</source>
          <comment>Preprint posted online on March 2, 2017</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1702.08608"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Nam</surname>
              <given-names>HS</given-names>
            </name>
          </person-group>
          <article-title>A Bayesian network model for predicting post-stroke outcomes with available risk factors</article-title>
          <source>Front Neurol</source>
          <year>2018</year>
          <volume>9</volume>
          <fpage>699</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.frontiersin.org/articles/10.3389/fneur.2018.00699/full"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fneur.2018.00699</pub-id>
          <pub-id pub-id-type="medline">30245663</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kanwar</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Gomberg-Maitland</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hoeper</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pausch</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pittrow</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Strange</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>JV</given-names>
            </name>
            <name name-style="western">
              <surname>Druzdzel</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kraisangka</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lohmueller</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Antaki</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Benza</surname>
              <given-names>RL</given-names>
            </name>
          </person-group>
          <article-title>Risk stratification in pulmonary arterial hypertension using Bayesian analysis</article-title>
          <source>Eur Respir J</source>
          <year>2020</year>
          <volume>56</volume>
          <issue>2</issue>
          <fpage>2000008</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://erj.ersjournals.com/cgi/pmidlookup?view=long&#38;pmid=32366491"/>
          </comment>
          <pub-id pub-id-type="doi">10.1183/13993003.00008-2020</pub-id>
          <pub-id pub-id-type="medline">32366491</pub-id>
          <pub-id pub-id-type="pii">13993003.00008-2020</pub-id>
          <pub-id pub-id-type="pmcid">PMC7495922</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benza</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Gomberg-Maitland</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elliott</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Farber</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Foreman</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Frost</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>McGoon</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Pasta</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Selej</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Burger</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Frantz</surname>
              <given-names>RP</given-names>
            </name>
          </person-group>
          <article-title>Predicting survival in patients with pulmonary arterial hypertension: the REVEAL risk score calculator 2.0 and comparison with ESC/ERS-based risk assessment strategies</article-title>
          <source>Chest</source>
          <year>2019</year>
          <volume>156</volume>
          <issue>2</issue>
          <fpage>323</fpage>
          <lpage>337</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0012-3692(19)30152-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.chest.2019.02.004</pub-id>
          <pub-id pub-id-type="medline">30772387</pub-id>
          <pub-id pub-id-type="pii">S0012-3692(19)30152-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>D'Alonzo</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Barst</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ayres</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Bergofsky</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Brundage</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Detre</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Fishman</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Goldring</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Groves</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Kernis</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Pietra</surname>
              <given-names>GG</given-names>
            </name>
            <name name-style="western">
              <surname>Reid</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Reeves</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Rich</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vreim</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Survival in patients with primary pulmonary hypertension</article-title>
          <source>Ann Intern Med</source>
          <year>1991</year>
          <volume>115</volume>
          <issue>5</issue>
          <fpage>343</fpage>
          <lpage>349</lpage>
          <pub-id pub-id-type="doi">10.7326/0003-4819-115-5-343</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Caruana</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gehrke</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Intelligible models for classification and regression</article-title>
          <year>2012</year>
          <conf-name>KDD '12: Proceedings of the 18th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>August 12-16, 2012</conf-date>
          <conf-loc>Beijing China</conf-loc>
          <publisher-loc>New York, NY, United States</publisher-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <pub-id pub-id-type="doi">10.1145/2339530.2339556</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kokkotis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Giarmatzis</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Giannakou</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Moustakidis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tsatalas</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tsiptsios</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Vadikolias</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Aggelousis</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>An explainable machine learning pipeline for stroke prediction on imbalanced data</article-title>
          <source>Diagnostics (Basel)</source>
          <year>2022</year>
          <volume>12</volume>
          <issue>10</issue>
          <fpage>2392</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=diagnostics12102392"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/diagnostics12102392</pub-id>
          <pub-id pub-id-type="medline">36292081</pub-id>
          <pub-id pub-id-type="pii">diagnostics12102392</pub-id>
          <pub-id pub-id-type="pmcid">PMC9600473</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kleindorfer</surname>
              <given-names>DO</given-names>
            </name>
            <name name-style="western">
              <surname>Towfighi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chaturvedi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cockroft</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lombardi-Hill</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kamel</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kernan</surname>
              <given-names>WN</given-names>
            </name>
            <name name-style="western">
              <surname>Kittner</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Leira</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Lennon</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Meschia</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>TN</given-names>
            </name>
            <name name-style="western">
              <surname>Pollak</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Santangeli</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sharrief</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Turan</surname>
              <given-names>TN</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>LS</given-names>
            </name>
          </person-group>
          <article-title>2021 Guideline for the prevention of stroke in patients with stroke and transient ischemic attack: a guideline from the American Heart Association/American Stroke Association</article-title>
          <source>Stroke</source>
          <year>2021</year>
          <volume>52</volume>
          <issue>7</issue>
          <fpage>e364</fpage>
          <lpage>e467</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ahajournals.org/doi/abs/10.1161/STR.0000000000000375?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1161/STR.0000000000000375</pub-id>
          <pub-id pub-id-type="medline">34024117</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
