<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Cardio</journal-id><journal-id journal-id-type="publisher-id">cardio</journal-id><journal-id journal-id-type="index">26</journal-id><journal-title>JMIR Cardio</journal-title><abbrev-journal-title>JMIR Cardio</abbrev-journal-title><issn pub-type="epub">2561-1011</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e50627</article-id><article-id pub-id-type="doi">10.2196/50627</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Application of Dragonnet and Conformal Inference for Estimating Individualized Treatment Effects for Personalized Stroke Prevention: Retrospective Cohort Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Lolak</surname><given-names>Sermkiat</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Attia</surname><given-names>John</given-names></name><degrees>MD, Prof Dr, PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>McKay</surname><given-names>Gareth J</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Thakkinstian</surname><given-names>Ammarin</given-names></name><degrees>PhD, Prof Dr</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Clinical Epidemiology and Biostatistics, Faculty of Medicine, Ramathibodi Hospital, Mahidol University</institution><addr-line>4th Floor, Sukho Place Building, 218/11 Sukhothai Road</addr-line><addr-line>Suan Chitlada, Dusit</addr-line><country>Thailand</country></aff><aff id="aff2"><institution>Centre for Clinical Epidemiology and Biostatistics, School of Medicine and Public Health, Hunter Medical Research Institute, University of Newcastle</institution><addr-line>New Lambton, New South Wales</addr-line><country>Australia</country></aff><aff id="aff3"><institution>Centre for Public Health, School of Medicine, Dentistry and Biomedical Sciences, Queen&#x2019;s University Belfast</institution><addr-line>Belfast</addr-line><country>United Kingdom</country></aff><aff id="aff4"><institution>Department of Clinical Epidemiology and Biostatistics, Faculty of Medicine, Ramathibodi Hospital, Mahidol University</institution><addr-line>Bangkok</addr-line><country>Thailand</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Rivers</surname><given-names>John</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Wright</surname><given-names>Marcia</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Kakaletsis</surname><given-names>Nikolaos</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Jaroszewicz</surname><given-names>Szymon</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Sermkiat Lolak, MD, PhD, Department of Clinical Epidemiology and Biostatistics, Faculty of Medicine, Ramathibodi Hospital, Mahidol University, 4th Floor, Sukho Place Building, 218/11 Sukhothai Road, Suan Chitlada, Dusit, 10300, Thailand, 66 955073078; <email>macsermkiat@yahoo.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>8</day><month>1</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e50627</elocation-id><history><date date-type="received"><day>07</day><month>07</month><year>2023</year></date><date date-type="rev-recd"><day>23</day><month>11</month><year>2024</year></date><date date-type="accepted"><day>24</day><month>11</month><year>2024</year></date></history><copyright-statement>&#x00A9; Sermkiat Lolak, John Attia, Gareth J McKay, Ammarin Thakkinstian. Originally published in JMIR Cardio (<ext-link ext-link-type="uri" xlink:href="https://cardio.jmir.org">https://cardio.jmir.org</ext-link>), 8.1.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Cardio, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://cardio.jmir.org">https://cardio.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://cardio.jmir.org/2025/1/e50627"/><abstract><sec><title>Background</title><p>Stroke is a major cause of death and disability worldwide. Identifying individuals who would benefit most from preventative interventions, such as antiplatelet therapy, is critical for personalized stroke prevention. However, traditional methods for estimating treatment effects often focus on the average effect across a population and do not account for individual variations in risk and treatment response.</p></sec><sec><title>Objective</title><p>This study aimed to estimate the individualized treatment effects (ITEs) for stroke prevention using a novel combination of Dragonnet, a causal neural network, and conformal inference. The study also aimed to determine and validate the causal effects of known stroke risk factors&#x2014;hypertension (HT), diabetes mellitus (DM), dyslipidemia (DLP), and atrial fibrillation (AF)&#x2014;using both a conventional causal model and machine learning models.</p></sec><sec sec-type="methods"><title>Methods</title><p>A retrospective cohort study was conducted using data from 275,247 high-risk patients treated at Ramathibodi Hospital, Thailand, between 2010 and 2020. Patients aged &#x003E;18 years with HT, DM, DLP, or AF were eligible. The main outcome was ischemic or hemorrhagic stroke, identified using <italic>International Classification of Diseases, 10th Revision</italic> (<italic>ICD-10</italic>) codes. Causal effects of the risk factors were estimated using a range of methods, including: (1) propensity score&#x2013;based methods, such as stratified propensity scores, inverse probability weighting, and doubly robust estimation; (2) structural causal models; (3) double machine learning; and (4) Dragonnet, a causal neural network, which was used together with weighted split-conformal quantile regression to estimate ITEs.</p></sec><sec sec-type="results"><title>Results</title><p>AF, HT, and DM were identified as significant stroke risk factors. Average causal risk effect estimates for these risk factors ranged from 0.075 to 0.097 for AF, 0.017 to 0.025 for HT, and 0.006 to 0.010 for DM, depending on the method used. Dragonnet yielded causal risk ratios of 4.56 for AF, 2.44 for HT, and 1.41 for DM, which is comparable to other causal models and the standard epidemiological case-control study. Mean ITE analysis indicated that several patients with DM or DM with HT, who were not receiving antiplatelet treatment at the time of data collection, showed reductions in total risk of &#x2212;0.015 and &#x2212;0.016, respectively.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study provides a comprehensive evaluation of stroke risk factors and demonstrates the feasibility of using Dragonnet and conformal inference to estimate ITEs of antiplatelet therapy for stroke prevention. The mean ITE analysis suggested that those with DM or DM with HT, who were not receiving antiplatelet treatment at the time of data collection, could potentially benefit from this therapy. The findings highlight the potential of these advanced techniques to inform personalized treatment strategies for stroke, enabling clinicians to identify individuals who are most likely to benefit from specific interventions.</p></sec></abstract><kwd-group><kwd>stroke</kwd><kwd>causal effect</kwd><kwd>ITE</kwd><kwd>individual treatment effect</kwd><kwd>Dragonnet</kwd><kwd>conformal inference</kwd><kwd>mortality</kwd><kwd>hospital records</kwd><kwd>hypertension</kwd><kwd>risk factor</kwd><kwd>diabetes</kwd><kwd>dyslipidemia</kwd><kwd>atrial fibrillation</kwd><kwd>machine learning</kwd><kwd>treatment</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Stroke is a leading cause of death and disability, presenting both personal and economic burdens [<xref ref-type="bibr" rid="ref1">1</xref>]. Astonishingly, many epidemiological studies have identified important risk factors of stroke occurrence, especially through the use of cohort studies [<xref ref-type="bibr" rid="ref2">2</xref>], and randomized controlled trials (RCTs) have identified the impact of treating these risk factors. While RCTs control for confounding factors through study design, cohort studies attempt to address these factors using statistical methods. However, the possibility of residual confounding remains, highlighting the need for improved analysis approaches [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>Frameworks of causal effect have largely been confined to Pearl&#x2019;s [<xref ref-type="bibr" rid="ref4">4</xref>] structural causal models (SCMs) and Rubin&#x2019;s [<xref ref-type="bibr" rid="ref5">5</xref>] potential outcome models (POMs) [<xref ref-type="bibr" rid="ref6">6</xref>]. SCMs evaluate causal relationships between variables using a directed acyclic graph defined by a set of structural equations, which consider the influence of each variable by its parents, or causes, along with its probability distribution. In addition, SCMs can also assess the effect of interventions by estimating how changing one unit of treatment (or risk) leads to a change in outcome [<xref ref-type="bibr" rid="ref7">7</xref>]. Conversely, POMs focus on the concept of counterfactuals, specifically what would have happened if an individual had been exposed to a different treatment or risk [<xref ref-type="bibr" rid="ref8">8</xref>]. Consequently, this approach estimates 2 potential outcomes (POs) for each individual: if the individual had received the treatment and if they had not. Subsequently, Rosenbaum and Rubin [<xref ref-type="bibr" rid="ref9">9</xref>] developed propensity scores to reflect the probability of an individual being assigned to a certain treatment group. Therefore, these estimates are only considered valid if the 2 specific conditions&#x2014;strong ignorability and positivity&#x2014;are met. Statistical methods have been developed based on POMs and propensity scores, including matching [<xref ref-type="bibr" rid="ref10">10</xref>], stratified propensity score (SPS) [<xref ref-type="bibr" rid="ref11">11</xref>], inverse probability weighting (IPW) [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], and doubly robust estimation (DRE) [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. Recently, nonconventional statistical models such as double machine learning (DML), meta-learners, and neural networks have also been developed to estimate unbiased causal effects without requiring strong underlying assumptions [<xref ref-type="bibr" rid="ref14">14</xref>]. Causal neural networks (NNs), including TARNet and Dragonnet, learn by sharing input data to estimate both factual and counterfactual outcomes. This approach is currently an active area of research [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref19">19</xref>]. Dragonnet also uses &#x201C;learned data&#x201D; to predict propensity scores by tradeoff with prediction quality, which yields better average treatment effect (ATE) estimates [<xref ref-type="bibr" rid="ref18">18</xref>].</p><p>Current causal modeling has shifted its focus from the ATE, which measures the treatment effect averaged across the entire study population, to the conditional average treatment effect (CATE), which assesses the ATE conditional on particular variables, such as sex, age, and other covariates. More recently, the focus has further evolved to the individualized treatment effect (ITE), which estimates the treatment effect for a particular individual. CATE has inherent variability depending on which covariate the model is conditioned on [<xref ref-type="bibr" rid="ref20">20</xref>]. However, estimating ITEs is challenging because it requires making assumptions about the underlying individual data-generating process and the model used to estimate the ITEs [<xref ref-type="bibr" rid="ref17">17</xref>]. A statistical technique called conformal inference may appropriately estimate the confidence intervals of ITEs by accounting for the uncertainty in their estimation. Despite being a novel technique, it has shown promise [<xref ref-type="bibr" rid="ref20">20</xref>]. Conformal inference uses nonconformity scores that measure the degree of disagreement between the estimated and observed outcomes, to provide a confidence interval or a precision of estimation [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref23">23</xref>]. Therefore, we conducted this study to estimate the CATE of stroke occurrence based on real-world clinical data using Dragonnet NN models. Additionally, ITE was estimated to identify individuals at high risk of stroke who may benefit from lowering risk factors by combining the strengths of Dragonnet and conformal inference approaches. To the best of our knowledge, no prior studies have employed these methods in combination to estimate causal effects in a clinical setting.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>The study population included a retrospective cohort of patients who were at high risk for stroke and had been treated and followed up at Ramathibodi Hospital, Thailand, between 2010 and 2020. Hospital records and the <italic>International Classification of Diseases, 10th Revision</italic> (<italic>ICD-10</italic>) classification system were used to identify patients. Patients were eligible if they were aged &#x003E;18 years and had one or more of the following conditions: hypertension (HT; <italic>ICD-10</italic> code I10-I16), diabetes mellitus (DM; <italic>ICD-10</italic> code E08-E13), dyslipidemia (DLP; <italic>ICD-10</italic> code E78), and atrial fibrillation (AF; <italic>ICD-10</italic> code I48). Patients were excluded if they had a stroke on their first visit or only had one visit during the study period. The main outcome measured in the study was the occurrence of ischemic or hemorrhagic stroke, which was identified using the <italic>ICD-10</italic> codes I63 and I61, respectively.</p><p>Patients were followed up from their index date (i.e., the date they were identified as high-risk patients) until they progressed to stroke, were lost to follow-up, or were stroke-free at the end of the study (December 31, 2020). Patients who were lost to follow-up or stroke-free at the end of the study period were censored on their last visit date or at the end of the study. A causal diagram was constructed (<xref ref-type="fig" rid="figure1">Figure 1</xref>), and potential predictors of stroke were collected, including age, sex, BMI, chronic kidney disease (CKD), AF, HT, DM, and DLP. HT, AF, and DM were considered as mediators, whereas the remaining variables were covariates in the models. A software library called DoWhy, now incorporated into PyWhy (Python Software Foundation), was used to construct models for stratification, IPW, DRE, and DML [<xref ref-type="bibr" rid="ref24">24</xref>]. Parameters of all estimators were set by default in the DoWhy package. The number of strata in the stratification method was automatically determined [<xref ref-type="bibr" rid="ref25">25</xref>]. The weighting scheme in IPW was set to default inverse propensity score. For DRE, the regression and propensity models were specified as lasso and logistic regression, respectively. For DML, linear and nonlinear cross-fitted models were applied to the outcome model (lasso and Extreme Gradient Boosting [XGBoost]), propensity model (logistic regression and XGBoost), and final model (linear regression and lasso). Estimands of each risk pathway were defined by PyWhy from the input causal graph. Graphical causal model&#x2013;based inferences from the DoWhy library were used for medication analysis to quantify the causal effects of direct and indirect pathways, termed natural direct effect (NDE) and natural indirect effect (NIE), respectively [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. NDE <inline-formula><mml:math id="ieqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msubsup><mml:mi>Y</mml:mi><mml:mrow><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mi>M</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mn>0</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:msubsup><mml:mo>&#x2212;</mml:mo><mml:msubsup><mml:mi>Y</mml:mi><mml:mrow><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mi>M</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mn>0</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> refers to the change in the outcome of an individual when they are exposed to a specific treatment <inline-formula><mml:math id="ieqn2"><mml:msub><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:math></inline-formula>, compared to another treatment <inline-formula><mml:math id="ieqn3"><mml:msub><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub></mml:math></inline-formula>, while keeping the mediator variable constant at the baseline value or reference treatment <italic>M(0</italic>). In contrast, NIE <inline-formula><mml:math id="ieqn4"><mml:mo>(</mml:mo><mml:msubsup><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mi>M</mml:mi><mml:mo>(</mml:mo><mml:mn>1</mml:mn><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:msubsup><mml:mo>-</mml:mo><mml:mi> </mml:mi><mml:msubsup><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mi>M</mml:mi><mml:mo>(</mml:mo><mml:mn>0</mml:mn><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:msubsup><mml:mo>)</mml:mo></mml:math></inline-formula> refers to the difference between the counterfactual outcome value when treatment <inline-formula><mml:math id="ieqn5"><mml:msub><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:math></inline-formula> is fixed and the mediator assumes a certain value at a particular treatment <italic>M(1</italic>) and the counterfactual outcome value when the mediator assumes the same value at the baseline <italic>M(0</italic>) [<xref ref-type="bibr" rid="ref27">27</xref>].</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Causal diagram of patients at risk of stroke occurrence. AF: atrial fibrillation; CKD: chronic kidney disease; DLP: dyslipidemia; DM: diabetes mellitus; HT: hypertension.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e50627_fig01.png"/></fig><p>The Dragonnet NN was used to estimate PO and propensity scores. The architecture of Dragonnet was based on previous work (<xref ref-type="fig" rid="figure2">Figure 2</xref>) [<xref ref-type="bibr" rid="ref18">18</xref>]. It employs a deep net to create a representation layer <italic>ɸ(X</italic>) &#x2208; &#x211D;&#x1D3E;, which is used to forecast outcomes for both the treatment <italic>&#x0176;(1</italic>) and control groups <italic>&#x0176;(0</italic>). It utilizes 2 hidden layers for each outcome model while a basic fully connected layer with a sigmoid function is used for the propensity score (&#x1D73A;). CATE was estimated by subtracting treatment (risk) and control PO for each risk factor <inline-formula><mml:math id="ieqn6"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msubsup><mml:mi>Y</mml:mi><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:msubsup><mml:mo>&#x2212;</mml:mo><mml:msubsup><mml:mi>Y</mml:mi><mml:mrow><mml:mn>0</mml:mn></mml:mrow><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:msubsup><mml:mo>&#x2223;</mml:mo><mml:mi>Z</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> and risk ratios were estimated by division of PO (<inline-formula><mml:math id="ieqn7"><mml:mfrac><mml:mrow><mml:msubsup><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mrow><mml:msubsup><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:mfrac><mml:mo>|</mml:mo><mml:mi> </mml:mi><mml:mi>Z</mml:mi></mml:math></inline-formula>); <italic>Y&#x2081;</italic> is the PO for the risk group, <italic>Y&#x2080;</italic> is the PO for the control group, <italic>x</italic> is an interested factor, and <italic>Z</italic> are other covariates.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Dragonnet architecture. <italic>X</italic> is the covariates, <italic>ɸ(X)</italic> is a learned representation of <italic>X</italic>. <italic>&#x0176;(1)</italic> is the predicted outcome of the treatment (risked) group. <italic>&#x0176;(0)</italic> is the predicted outcome of the control group. <italic>&#x03B5;</italic> is the estimated propensity score. C&#x00C2;TE is the conditional average treatment effect computed by <italic>&#x0176;(1)&#x2013;&#x0176;(0)</italic>.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e50627_fig02.png"/></fig><p>To accurately estimate the ITE, it is mandatory for the conditional independence assumption to hold, especially considering the unequal distribution of covariates between factual and counterfactual outcomes of the treatment and control groups, commonly known as covariate shift. To address this challenge, we employed a nested method of weighted split-conformal quantile regression (CQR) to estimate the ITE [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>] by incorporating antiplatelet medications as a treatment for stroke prevention. POs were estimated using quantile loss setting &#x03B1; at .05. The dataset was split evenly into training and evaluation sets; <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> shows the entire algorithm. All risk factors and covariates were similar between models, considering antiplatelet medication as a treatment and stratified by risk factor  <inline-formula><mml:math id="ieqn8"><mml:mo>(</mml:mo><mml:msubsup><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>p</mml:mi><mml:mi>l</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>e</mml:mi><mml:mi>l</mml:mi><mml:mi>e</mml:mi><mml:mi>t</mml:mi><mml:mi>s</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:msubsup><mml:mo>-</mml:mo><mml:mi> </mml:mi><mml:msubsup><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mi>t</mml:mi><mml:mi>i</mml:mi><mml:mi>p</mml:mi><mml:mi>l</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>e</mml:mi><mml:mi>l</mml:mi><mml:mi>e</mml:mi><mml:mi>t</mml:mi><mml:mi>s</mml:mi><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:msubsup><mml:mo>|</mml:mo><mml:mi> </mml:mi><mml:mi>Z</mml:mi><mml:mo>)</mml:mo><mml:mo>,</mml:mo></mml:math></inline-formula> with <italic>x</italic> representing the risk factors of interest (i.e., HT, DM, and DLP) and Z representing other covariates. AF was not included as a stratum for the estimation of ITE in this example since it is not an indication for the prescription of antiplatelet therapy, but it remained a covariate.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>The data were anonymized to ensure confidentiality and privacy protection. This study was approved by the Human Research Ethics Committee, Faculty of Medicine Ramathibodi Hospital, Mahidol University (COA. MURA2021/255). The committee waived the need to obtain consent for the collection, analysis, and publication of the retrospectively obtained and anonymized data for this noninterventional study.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>A total of 275,247 high-risk patients were included in the cohort. Among them, 9659 patients developed stroke, resulting in an incidence of 3.5% (95% CI 3.4-3.6). The follow-up rate for the study population was 80% (7752/9659).</p><p>Baseline demographic and risk factors were compared between 9659 stroke patients and 265,588 nonstroke patients (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). Stroke patients had a mean age of 64.7 years and were more likely to be male. Stratification by risk indicated that 13% of AF patients, 4% of HT patients, 4% of DM patients, and 4% of DLP patients experienced stroke in contrast to only 2% of non-AF patients, 1% of non-HT patients, 3% of non-DM patients, and 3% of non-DLP patients, who developed stroke.</p><p>Causal effects of mediators including HT, DM, CKD, and AF on stroke were estimated based on the causal diagram in <xref ref-type="fig" rid="figure1">Figure 1</xref>. The estimands report as probability of stroke given the risk factors, <italic>P</italic>(<italic>Stroke</italic> | <italic>risk factors</italic>), are as follows: <italic>P</italic>(<italic>Stroke</italic> | <italic>HT, age, DM, DLP</italic>) for HT; <italic>P</italic>(<italic>Stroke</italic> | <italic>AF, age, HT</italic>) for AF<italic>; P</italic>(<italic>Stroke</italic> | <italic>age, DLP</italic>) for DLP; and <italic>P</italic>(<italic>Stroke</italic> | <italic>age, DM, BMI</italic>) for DM (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). For the POM approach, the SPS estimator showed AF as the highest risk of stroke, followed by HT, DM, and DLP with risk estimates of 0.084 (95% CI 0.079-0.088), 0.019 (95% CI 0.015-0.020), 0.010 (95% CI 0.008-0.010), and 0.0015 (95% CI &#x2212;0.0002 to 0.0027), respectively. IPW yielded similar, albeit slightly higher, corresponding risks of 0.092 (95% CI 0.089-0.096), 0.024 (95% CI 0.022-0.025), 0.010 (95% CI 0.008-0.010), and 0.001 (95% CI &#x2212;0.0005 to 0.0025), respectively. Comparable results were observed in the DRE analysis, with a similar trend of risk effect estimates of 0.082 (95% CI 0.0849-0.0871), 0.025 (95% CI 0.0243-0.0257), 0.008 (95% CI 0.0057-0.0063), and 0.0006 (95% CI 0.0001-0.0011), respectively.</p><p>The SCM estimation also yielded similar trends to the POM approach, in which the risk of stroke was 0.096 (95% CI 0.0948-0.0972), 0.021 (95% CI 0.0204-0.0216), 0.007 (95% CI 0.0067-0.0073), and 0.0005 (95% CI 0.0004-0.0006) for AF, HT, DM, and DLP, respectively. Mediation analysis indicated the NDE of HT to be 0.020 (95% CI 0.019-0.021) and the NIE to be 0.0027 (95% CI 0.0025-0.0029). NDE and NIE for DM and DLP were both modest and consistent with the findings from other models. <xref ref-type="fig" rid="figure1">Figure 1</xref> illustrates the pathways through which the mediators act: HT mediates through CKD and AF, DM mediates through HT and CKD, while DLP mediates through HT.</p><p>In the context of DML, the nonparametric model estimates were slightly smaller than those for the linear model, with risks of 0.086 (95% CI 0.0849-0.0871), 0.015 (95% CI 0.0145-0.0155), 0.006 (95% CI 0.0057-0.0063), and 0.0 (95% CI &#x2212;0.0001 to 0.001) for AF, HT, DM, and DLP, respectively, whereas the corresponding linear model estimate risks were 0.097 (95% CI 0.096-0.098), 0.023 (95% CI 0.0223-0.0236), 0.009 (95% CI 0.0087-0.0093), and 0.002 (95% CI 0.0018-0.0022).</p><p>Dragonnet estimated the causal effects of AF, HT, DM, and DLP on stroke as 0.075 (95% CI 0.074-0.076), 0.017 (95% CI 0.0169-0.0170), 0.01 (95% CI 0.009-0.010), and &#x2212;0.002 (95% CI &#x2212;0.0022 to 0.0021), with causal ratios of 4.56 (95% CI 4.56-4.57), 2.44 (95% CI 2.41-2.46), 1.41 (95% CI 1.21-1.60), and 0.856 (95% CI 0.855-0.858), respectively. The odds ratios from the logistic regression models were respectively 3.34 (95% CI 2.68-3.75), 2.56 (95% CI 2.33-2.80), 1.16 (95% CI 1.05-1.30), and 1.00 (95% CI 0.8-1.4). Details are provided in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> for comparison.</p><p>The influence of risk reduction for individual patients who did not receive antiplatelet therapy, had they been given the medication (counterfactuals of nontreatment ITEs), was examined using weighted split-CQR. As shown in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>, three of the samples (3/50, 6%) appear to have potentially benefited from antiplatelet treatment, indicating that a considerable number of patients might have experienced a positive impact on their stroke risk reduction had they received the medication. The mean ITEs indicated that several patients with DM or DM with HT were not currently receiving antiplatelet treatment and would be more likely to benefit if they had received it, with reduction of total risk as &#x2212;0.015 (IQR &#x2212;0.011 to &#x2212;0.018) and &#x2212;0.016 (IQR &#x2212;0.015 to 0.022) among each group, respectively (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Box plot representing the mean individual treatment effect for patients with different risk factors who had not been taking antiplatelet medication, illustrating the potential impact on stroke risk reduction if they had received antiplatelet therapy. DLP: dyslipidemia; DM: diabetes mellitus; HT: hypertension; ITE: individual treatment effect.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e50627_fig03.png"/></fig></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>We estimated the causal influences of risk factors associated with stroke outcomes using multiple approaches that included SPS, IPW, DRE, SCM, and mediation analysis, in addition to DML and Dragonnet NNs. Our findings indicate strong positive causal effects associated with AF and HT on stroke development, with DM exerting a weaker effect. DLP, in contrast, had little effect. Furthermore, our analysis suggests that patients with both DM and HT not currently in receipt of antiplatelet treatments would be the most likely beneficiaries of antiplatelet therapy based on the mean ITEs.</p><p>The results from the different estimators generally demonstrated consistency, although there were slight variations in specific point estimates and confidence intervals varied slightly. The estimated causal effect derived from various methods using real-world observational data is comparable with standard cohort epidemiological studies using more traditional logistic regression approaches [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>].</p></sec><sec id="s4-2"><title>Comparison to Prior Works</title><p>SPS is a widely used method that minimizes confounding bias by adjusting baseline covariates and confounding factors and estimating treatment effects by stratum. However, SPS is sensitive to the number of strata and features that affect both treatment and outcome (confounding factors), which can lead to bias in the causal effect estimate [<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]. In addition, some strata may be sparsely populated, making the ATE hard to define and more prone to bias [<xref ref-type="bibr" rid="ref34">34</xref>]. Rosenbaum and Rubin [<xref ref-type="bibr" rid="ref9">9</xref>] originally proposed dividing the strata into 5 levels and then subsequently automatically splitting the strata until the balance in the numbers of treated and control observations was achieved [<xref ref-type="bibr" rid="ref25">25</xref>].</p><p>IPW attempts to reduce confounding of the ATE by weighting the sample with the inverse propensity score and by balancing the distribution of the covariates between the treated and untreated groups [<xref ref-type="bibr" rid="ref35">35</xref>], thereby avoiding the problem of data sparsity that may be present in SPS, particularly with small sample sizes. However, there is a reliance on the assumption that the propensity score model correctly captures all confounding factors, which, if incorrect, may bias the ATE. Additionally, IPW is more sensitive to the model and variable selection for estimating the propensity scores, with small differences in estimated propensity scores potentially leading to large differences in estimated causal effects [<xref ref-type="bibr" rid="ref36">36</xref>]. Finally, IPW may imprecisely estimate treatment effects if a sample size is small, leading to a propensity score close to 0 or 1 [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>].</p><p>DRE combines propensity score and outcome regression models [<xref ref-type="bibr" rid="ref38">38</xref>], which can lead to improvements in the robustness of model specification by allowing one of the two treatment and outcome models to be miss-specified but still provide a consistent estimation [<xref ref-type="bibr" rid="ref39">39</xref>]. The challenge is to validly model either the propensity score or the outcome model; it may be tempting to use modern machine learning approaches or nonparametric models in DRE, but this may lead to bias if the functions are too complex, leading to overfitting [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. DML was developed to address the bias from regularization and overfitting in estimating the parameter of interest, which arises when naively inserting machine learning estimators into the estimation equation. This approach consists of two critical components: (1) the use of Neyman-orthogonal moments or scores to estimate the parameters and (2) the application of cross-fitting, which provides an efficient form of data-splitting. By using both elements, DML minimizes the impact of regularization bias and overfitting on parameter estimation; this also extends to nonparametric models [<xref ref-type="bibr" rid="ref14">14</xref>].</p><p>Applying POMs (eg, SPS, IPW, DRE) relies heavily on the assumption that the treatment assignment is independent of the PO given the observed covariates, which is known as &#x201C;unconfoundedness&#x201D; or the conditional independence assumption. If this assumption does not hold, the estimated causal effect will be biased. In contrast, SCMs facilitate the modeling of complex relationships between multiple causes and effects in the presence of latent or unobserved variables [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. In addition, SCMs can be considered as counterfactual predictions of interventions, which can be useful in applications such as causal inference in experimental or observational studies [<xref ref-type="bibr" rid="ref43">43</xref>-<xref ref-type="bibr" rid="ref46">46</xref>]. However, SCMs are limited by the assumption of independence between variables and may require conceptualized causal relationship mechanisms.</p><p>The benefit of using NNs to estimate causal effects is their flexibility and power to handle high-dimensional and complex data. Shalit et al [<xref ref-type="bibr" rid="ref17">17</xref>] introduced TARNet by sharing information between the PO of treatment and control groups, which is different from the previous model that separated the training data. More recently, Dragonnet was developed by combining propensity scores with targeted regularization, resulting in more accurate inference [<xref ref-type="bibr" rid="ref18">18</xref>]. Dragonnet is considered more robust with very low or high propensity scores but has several limitations including sensitivity to choice of architecture and hyperparameters, dealing with only a single set of features at a time, and difficulty of interpretation [<xref ref-type="bibr" rid="ref18">18</xref>]. Despite some limitations, Dragonnet&#x2019;s benefits surpass these drawbacks, making it an attractive approach for estimating causal effects in complex real-world data.</p></sec><sec id="s4-3"><title>Strengths and Limitations</title><p>A critical aspect of causal inference, particularly in estimating CATE, involves certain assumptions, notably ignorability and positivity. Strong ignorability necessitates the observation and adjustment for all confounding variables that influence both the treatment and the outcome, while positivity ensures that every patient has a nonzero probability of receiving each treatment. In our study, we believe these assumptions are reasonably satisfied. We included a comprehensive set of covariates, such as age, sex, BMI, chronic kidney disease, and relevant comorbidities (HT, DM, DLP, and AF), which are well-documented factors influencing stroke risk and treatment decisions. However, we acknowledge that there might be unmeasured confounders not captured in our dataset. Regarding the decision on antiplatelet drug administration, we utilized detailed patient records from Ramathibodi Hospital, ensuring a thorough assessment of factors influencing treatment. Nonetheless, we recognize the potential for residual confounding and the inherent limitations of observational data. Future studies could benefit from incorporating more granular clinical data and leveraging advanced causal discovery methods to further validate these assumptions.</p><p>Causal effects can vary between individuals, which necessitates the estimation of ITEs. Treatment effects can vary between individual patients; therefore, applying a single treatment effect as CATE to all individual patients is inappropriate [<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref48">48</xref>] as some patients may gain more or less benefit from treatments. Thus, the estimation of ITE to identify at-risk patients most likely to benefit from treatment is a major goal for stratified and precision medicine approaches. Estimating ITEs requires larger sample sizes, as individual-level estimates are less precise than aggregate-level estimates [<xref ref-type="bibr" rid="ref49">49</xref>]. A covariate shift may result from unobserved counterfactual data but this is minimized using a weighted split-CQR approach [<xref ref-type="bibr" rid="ref23">23</xref>].</p><p>We believe that the clinical implications of our study are significant, as understanding the causal relationships and individual treatment effects of stroke risk factors can directly influence patient care by providing more precise and personalized risk assessments. Additionally, we can conduct reviews and quality assessments of current patients in the clinic to determine who should receive further treatment. These methods enable clinicians to identify high-risk patients who would benefit most from targeted interventions, like antiplatelet therapy, thereby optimizing treatment strategies and improving patient outcomes. The use of real-world data ensures that our findings apply to everyday clinical practice.</p><p>Our study has some limitations. First, we used real-world data rather than RCT data, thus some important covariates were not previously planned, measured, and collected as part of routine clinical evaluation and were therefore unavailable for ITE estimation. Second, we acknowledge the possibility of unmeasured confounders in the observational dataset. Future studies could benefit from incorporating more granular clinical data, such as detailed medication records, laboratory results, and lifestyle factors, to mitigate potential confounding. Third, the models used for estimating ITEs were trained and validated in only a single setting, thereby limiting their generalizability. Future research should focus on validating the models in diverse settings with different patient populations or hospitals. This external validation would help to determine whether the models&#x2019; predictive performance and the estimated ITEs hold true across various contexts.</p></sec><sec id="s4-4"><title>Conclusion</title><p>This study provides comprehensive causal estimates of AF, HT, DLP, and DM on stroke using various advanced statistical and machine learning methodologies. The consistent results across multiple analytical approaches and this study&#x2019;s alignment with a standard cohort study reinforce the robustness of our findings. AF and HT emerged as significant risk factors for stroke, with DM showing a moderate effect, while DLP had minimal impact. Notably, the use of Dragonnet and conformal inference techniques allowed us to accurately estimate ITEs, highlighting that several high-risk patients who did not take antiplatelets at the time of data recorded, particularly those with DM or DM combined with HT, could potentially benefit from antiplatelet therapy. This suggests that personalized treatment strategies could be pivotal in reducing stroke risk among these patients.</p><p>The findings underscore the significance of individualized risk assessment and treatment personalization in clinical settings. Future research should focus on integrating these advanced causal inference models into routine clinical practice to enhance treatment outcomes for high-risk stroke patients. Additionally, the use of real-world data provides valuable insights but also presents challenges related to unmeasured confounding and data quality. Addressing these challenges in future studies will be crucial for advancing our understanding and improving stroke management strategies.</p></sec></sec></body><back><notes><sec><title>Data Availability</title><p>The data that support the findings of this study are available from the corresponding author upon reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>This study has been conceptualized by SL and AT. SL performed data management, model construction, and analysis. The manuscript was drafted by SL and revised by GJM, JA, and AT. All authors approved the final version of this manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AF</term><def><p>atrial fibrillation</p></def></def-item><def-item><term id="abb2">ATE</term><def><p>average treatment effect</p></def></def-item><def-item><term id="abb3">CATE</term><def><p>conditional average treatment effect</p></def></def-item><def-item><term id="abb4">CKD</term><def><p>chronic kidney disease</p></def></def-item><def-item><term id="abb5">CQR</term><def><p>conformal quantile regression</p></def></def-item><def-item><term id="abb6">DLP</term><def><p>dyslipidemia</p></def></def-item><def-item><term id="abb7">DM</term><def><p>diabetes mellitus</p></def></def-item><def-item><term id="abb8">DRE</term><def><p>doubly robust estimation</p></def></def-item><def-item><term id="abb9">HT</term><def><p>hypertension</p></def></def-item><def-item><term id="abb10"><italic>ICD-10</italic></term><def><p><italic>International Classification of Diseases, 10th Revision</italic></p></def></def-item><def-item><term id="abb11">IPW</term><def><p>inverse probability weighting</p></def></def-item><def-item><term id="abb12">ITE</term><def><p>individualized treatment effect</p></def></def-item><def-item><term id="abb13">NDE</term><def><p>natural direct effect</p></def></def-item><def-item><term id="abb14">NIE</term><def><p>natural indirect effect</p></def></def-item><def-item><term id="abb15">NN</term><def><p>neural network</p></def></def-item><def-item><term id="abb16">PO</term><def><p>potential outcome</p></def></def-item><def-item><term id="abb17">POM</term><def><p>potential outcome model</p></def></def-item><def-item><term id="abb18">RCT</term><def><p>randomized controlled trial</p></def></def-item><def-item><term id="abb19">SCM</term><def><p>structural causal model</p></def></def-item><def-item><term id="abb20">SPS</term><def><p>stratified propensity score</p></def></def-item><def-item><term id="abb21">XGBoost</term><def><p>Extreme Gradient Boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Krishnamurthi</surname><given-names>RV</given-names> </name><name name-style="western"><surname>Ikeda</surname><given-names>T</given-names> </name><name name-style="western"><surname>Feigin</surname><given-names>VL</given-names> </name></person-group><article-title>Global, regional and country-specific burden of ischaemic stroke, intracerebral haemorrhage and subarachnoid haemorrhage: a systematic analysis of the global burden of disease study 2017</article-title><source>Neuroepidemiology</source><year>2020</year><volume>54</volume><issue>2</issue><fpage>171</fpage><lpage>179</lpage><pub-id pub-id-type="doi">10.1159/000506396</pub-id><pub-id pub-id-type="medline">32079017</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Boehme</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Esenwa</surname><given-names>C</given-names> </name><name name-style="western"><surname>Elkind</surname><given-names>MSV</given-names> </name></person-group><article-title>Stroke risk factors, genetics, and prevention</article-title><source>Circ Res</source><year>2017</year><month>02</month><day>3</day><volume>120</volume><issue>3</issue><fpage>472</fpage><lpage>495</lpage><pub-id pub-id-type="doi">10.1161/CIRCRESAHA.116.308398</pub-id><pub-id pub-id-type="medline">28154098</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Austin</surname><given-names>PC</given-names> </name></person-group><article-title>An introduction to propensity score methods for reducing the effects of confounding in observational studies</article-title><source>Multivariate Behav Res</source><year>2011</year><month>05</month><volume>46</volume><issue>3</issue><fpage>399</fpage><lpage>424</lpage><pub-id pub-id-type="doi">10.1080/00273171.2011.568786</pub-id><pub-id pub-id-type="medline">21818162</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Pearl</surname><given-names>J</given-names> </name></person-group><source>Causality</source><year>2009</year><publisher-name>Cambridge University Press</publisher-name></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rubin</surname><given-names>DB</given-names> </name></person-group><article-title>Causal inference using potential outcomes</article-title><source>J Am Stat Assoc</source><year>2005</year><month>03</month><volume>100</volume><issue>469</issue><fpage>322</fpage><lpage>331</lpage><pub-id pub-id-type="doi">10.1198/016214504000001880</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Markus</surname><given-names>KA</given-names> </name></person-group><article-title>Causal effects and counterfactual conditionals: contrasting Rubin, Lewis and Pearl</article-title><source>Econ Philos</source><year>2021</year><month>11</month><volume>37</volume><issue>3</issue><fpage>441</fpage><lpage>461</lpage><pub-id pub-id-type="doi">10.1017/S0266267120000437</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pearl</surname><given-names>J</given-names> </name></person-group><article-title>An introduction to causal inference</article-title><source>Int J Biostat</source><year>2010</year><month>02</month><day>26</day><volume>6</volume><issue>2</issue><pub-id pub-id-type="doi">10.2202/1557-4679.1203</pub-id><pub-id pub-id-type="medline">20305706</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rubin</surname><given-names>DB</given-names> </name></person-group><article-title>Estimating causal effects of treatments in randomized and nonrandomized studies</article-title><source>J Educ Psychol</source><year>1974</year><volume>66</volume><issue>5</issue><fpage>688</fpage><lpage>701</lpage><pub-id pub-id-type="doi">10.1037/h0037350</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rosenbaum</surname><given-names>PR</given-names> </name><name name-style="western"><surname>Rubin</surname><given-names>DB</given-names> </name></person-group><article-title>The central role of the propensity score in observational studies for causal effects</article-title><source>Biometrika</source><year>1983</year><volume>70</volume><issue>1</issue><fpage>41</fpage><lpage>55</lpage><pub-id pub-id-type="doi">10.1093/biomet/70.1.41</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rosenbaum</surname><given-names>PR</given-names> </name><name name-style="western"><surname>Rubin</surname><given-names>DB</given-names> </name></person-group><article-title>Constructing a control group using multivariate matched sampling methods that incorporate the propensity score</article-title><source>Am Stat</source><year>1985</year><month>02</month><volume>39</volume><issue>1</issue><fpage>33</fpage><lpage>38</lpage><pub-id pub-id-type="doi">10.1080/00031305.1985.10479383</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rosenbaum</surname><given-names>PR</given-names> </name><name name-style="western"><surname>Rubin</surname><given-names>DB</given-names> </name></person-group><article-title>Reducing bias in observational studies using subclassification on the propensity score</article-title><source>J Am Stat Assoc</source><year>1984</year><month>09</month><volume>79</volume><issue>387</issue><fpage>516</fpage><lpage>524</lpage><pub-id pub-id-type="doi">10.1080/01621459.1984.10478078</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rosenbaum</surname><given-names>PR</given-names> </name></person-group><article-title>Model-based direct adjustment</article-title><source>J Am Stat Assoc</source><year>1987</year><month>06</month><volume>82</volume><issue>398</issue><fpage>387</fpage><lpage>394</lpage><pub-id pub-id-type="doi">10.1080/01621459.1987.10478441</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hern&#x00E1;n</surname><given-names>M&#x00C1;</given-names> </name><name name-style="western"><surname>Brumback</surname><given-names>B</given-names> </name><name name-style="western"><surname>Robins</surname><given-names>JM</given-names> </name></person-group><article-title>Marginal structural models to estimate the causal effect of zidovudine on the survival of HIV-positive men</article-title><source>Epidemiology</source><year>2000</year><month>09</month><volume>11</volume><issue>5</issue><fpage>561</fpage><lpage>570</lpage><pub-id pub-id-type="doi">10.1097/00001648-200009000-00012</pub-id><pub-id pub-id-type="medline">10955409</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chernozhukov</surname><given-names>V</given-names> </name><name name-style="western"><surname>Chetverikov</surname><given-names>D</given-names> </name><name name-style="western"><surname>Demirer</surname><given-names>M</given-names> </name><name name-style="western"><surname>Duflo</surname><given-names>E</given-names> </name><name name-style="western"><surname>Hansen</surname><given-names>C</given-names> </name><name name-style="western"><surname>Newey</surname><given-names>W</given-names> </name></person-group><article-title>Double/debiased/Neyman machine learning of treatment effects</article-title><source>Am Econ Rev</source><year>2017</year><month>05</month><day>1</day><volume>107</volume><issue>5</issue><fpage>261</fpage><lpage>265</lpage><pub-id pub-id-type="doi">10.1257/aer.p20171038</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Robins</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Rotnitzky</surname><given-names>A</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>LP</given-names> </name></person-group><article-title>Estimation of regression coefficients when some regressors are not always observed</article-title><source>J Am Stat Assoc</source><year>1994</year><month>09</month><volume>89</volume><issue>427</issue><fpage>846</fpage><lpage>866</lpage><pub-id pub-id-type="doi">10.1080/01621459.1994.10476818</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Funk</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Westreich</surname><given-names>D</given-names> </name><name name-style="western"><surname>Wiesen</surname><given-names>C</given-names> </name><name name-style="western"><surname>St&#x00FC;rmer</surname><given-names>T</given-names> </name><name name-style="western"><surname>Brookhart</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Davidian</surname><given-names>M</given-names> </name></person-group><article-title>Doubly robust estimation of causal effects</article-title><source>Am J Epidemiol</source><year>2011</year><month>04</month><day>1</day><volume>173</volume><issue>7</issue><fpage>761</fpage><lpage>767</lpage><pub-id pub-id-type="doi">10.1093/aje/kwq439</pub-id><pub-id pub-id-type="medline">21385832</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Shalit</surname><given-names>U</given-names> </name><name name-style="western"><surname>Johansson</surname><given-names>FD</given-names> </name><name name-style="western"><surname>Sontag</surname><given-names>D</given-names> </name></person-group><article-title>Estimating individual treatment effect: generalization bounds and algorithms</article-title><conf-name>The 34th International Conference on Machine Learning</conf-name><conf-date>Aug 8-11, 2017</conf-date><conf-loc>Sydney, Australia</conf-loc></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Shi</surname><given-names>C</given-names> </name><name name-style="western"><surname>Blei</surname><given-names>D</given-names> </name><name name-style="western"><surname>Veitch</surname><given-names>V</given-names> </name></person-group><article-title>Adapting neural networks for the estimation of treatment effects</article-title><conf-name>Advances in Neural Information Processing Systems 32 (NeurIPS 2019)</conf-name><conf-date>Dec 8-14, 2019</conf-date><conf-loc>Vancouver, Canada</conf-loc></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Curth</surname><given-names>A</given-names> </name><name name-style="western"><surname>Schaar</surname><given-names>M</given-names> </name></person-group><article-title>Nonparametric estimation of heterogeneous treatment effects: from theory to learning algorithms</article-title><conf-name>The 24th International Conference on Artificial Intelligence and Statistics</conf-name><conf-date>Apr 13-15, 2021</conf-date></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>Lei</surname><given-names>L</given-names> </name><name name-style="western"><surname>Cand&#x00E8;s</surname><given-names>EJ</given-names> </name></person-group><article-title>Conformal inference of counterfactuals and individual treatment effects</article-title><source>arXiv</source><comment>Preprint posted online on  Jun 11, 2020</comment><pub-id pub-id-type="doi">10.48550/arXiv.2006.06138</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Vovk</surname><given-names>V</given-names> </name><name name-style="western"><surname>Gammerman</surname><given-names>A</given-names> </name><name name-style="western"><surname>Shafer</surname><given-names>G</given-names> </name></person-group><source>Algorithmic Learning in a Random World</source><year>2005</year><publisher-name>Springer</publisher-name></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shafer</surname><given-names>G</given-names> </name><name name-style="western"><surname>Vovk</surname><given-names>V</given-names> </name></person-group><article-title>A tutorial on conformal prediction</article-title><source>J Mach Learn Res</source><year>2008</year><volume>9</volume><issue>3</issue><fpage>371</fpage><lpage>421</lpage><pub-id pub-id-type="doi">10.1145/1390681.1390693</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Tibshirani</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Foygel Barber</surname><given-names>R</given-names> </name><name name-style="western"><surname>Candes</surname><given-names>E</given-names> </name><name name-style="western"><surname>Ramdas</surname><given-names>A</given-names> </name></person-group><article-title>Conformal prediction under covariate shift</article-title><conf-name>Advances in Neural Information Processing Systems 32 (NeurIPS 2019)</conf-name><conf-date>Dec 8-14, 2019</conf-date><conf-loc>Vancouver, Canada</conf-loc></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>Sharma</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kiciman</surname><given-names>E</given-names> </name></person-group><article-title>DoWhy: an end-to-end library for causal inference</article-title><source>arXiv</source><comment>Preprint posted online on  Nov 9, 2020</comment><pub-id pub-id-type="doi">10.48550/arXiv.2011.04216</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Imbens</surname><given-names>GW</given-names> </name><name name-style="western"><surname>Rubin</surname><given-names>DB</given-names> </name></person-group><source>Causal Inference in Statistics, Social, and Biomedical Sciences</source><year>2015</year><publisher-name>Cambridge University Press</publisher-name><pub-id pub-id-type="doi">10.1017/CBO9781139025751</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>Bl&#x00F6;baum</surname><given-names>P</given-names> </name><name name-style="western"><surname>G&#x00F6;tz</surname><given-names>P</given-names> </name><name name-style="western"><surname>Budhathoki</surname><given-names>K</given-names> </name><name name-style="western"><surname>Mastakouri</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Janzing</surname><given-names>D</given-names> </name></person-group><article-title>DoWhy-GCM: an extension of dowhy for causal inference in graphical causal models</article-title><source>arXiv</source><comment>Preprint posted online on  Jun 14, 2022</comment><pub-id pub-id-type="doi">10.48550/arXiv.2206.06821</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Richiardi</surname><given-names>L</given-names> </name><name name-style="western"><surname>Bellocco</surname><given-names>R</given-names> </name><name name-style="western"><surname>Zugna</surname><given-names>D</given-names> </name></person-group><article-title>Mediation analysis in epidemiology: methods, interpretation and bias</article-title><source>Int J Epidemiol</source><year>2013</year><month>10</month><volume>42</volume><issue>5</issue><fpage>1511</fpage><lpage>1519</lpage><pub-id pub-id-type="doi">10.1093/ije/dyt127</pub-id><pub-id pub-id-type="medline">24019424</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>O&#x2019;Donnell</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Chin</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Rangarajan</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Global and regional effects of potentially modifiable risk factors associated with acute stroke in 32 countries (INTERSTROKE): a case-control study</article-title><source>Lancet</source><year>2016</year><month>08</month><volume>388</volume><issue>10046</issue><fpage>761</fpage><lpage>775</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(16)30506-2</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tirschwell</surname><given-names>DL</given-names> </name><name name-style="western"><surname>Smith</surname><given-names>NL</given-names> </name><name name-style="western"><surname>Heckbert</surname><given-names>SR</given-names> </name><name name-style="western"><surname>Lemaitre</surname><given-names>RN</given-names> </name><name name-style="western"><surname>Longstreth</surname><given-names>WT</given-names>  <suffix>Jr</suffix></name><name name-style="western"><surname>Psaty</surname><given-names>BM</given-names> </name></person-group><article-title>Association of cholesterol with stroke risk varies in stroke subtypes and patient subgroups</article-title><source>Neurology</source><year>2004</year><month>11</month><day>23</day><volume>63</volume><issue>10</issue><fpage>1868</fpage><lpage>1875</lpage><pub-id pub-id-type="doi">10.1212/01.wnl.0000144282.42222.da</pub-id><pub-id pub-id-type="medline">15557504</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Imai</surname><given-names>K</given-names> </name><name name-style="western"><surname>Dyk</surname><given-names>DA</given-names> </name></person-group><article-title>Causal inference with general treatment regimes: generalizing the propensity score</article-title><source>J Am Stat Assoc</source><year>2004</year><volume>99</volume><issue>467</issue><fpage>854</fpage><lpage>866</lpage><pub-id pub-id-type="doi">10.1198/016214504000001187</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Harder</surname><given-names>VS</given-names> </name><name name-style="western"><surname>Stuart</surname><given-names>EA</given-names> </name><name name-style="western"><surname>Anthony</surname><given-names>JC</given-names> </name></person-group><article-title>Propensity score techniques and the assessment of measured covariate balance to test causal associations in psychological research</article-title><source>Psychol Methods</source><year>2010</year><month>09</month><volume>15</volume><issue>3</issue><fpage>234</fpage><lpage>249</lpage><pub-id pub-id-type="doi">10.1037/a0019623</pub-id><pub-id pub-id-type="medline">20822250</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hullsiek</surname><given-names>KH</given-names> </name><name name-style="western"><surname>Louis</surname><given-names>TA</given-names> </name></person-group><article-title>Propensity score modeling strategies for the causal analysis of observational data</article-title><source>Biostatistics</source><year>2002</year><month>06</month><volume>3</volume><issue>2</issue><fpage>179</fpage><lpage>193</lpage><pub-id pub-id-type="doi">10.1093/biostatistics/3.2.179</pub-id><pub-id pub-id-type="medline">12933612</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Adelson</surname><given-names>JL</given-names> </name><name name-style="western"><surname>McCoach</surname><given-names>DB</given-names> </name><name name-style="western"><surname>Rogers</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Adelson</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Sauer</surname><given-names>TM</given-names> </name></person-group><article-title>Developing and applying the propensity score to make causal inferences: variable selection and stratification</article-title><source>Front Psychol</source><year>2017</year><volume>8</volume><fpage>1413</fpage><pub-id pub-id-type="doi">10.3389/fpsyg.2017.01413</pub-id><pub-id pub-id-type="medline">28861028</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Morgan</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Winship</surname><given-names>C</given-names> </name></person-group><source>Counterfactuals and Causal Inference: Methods and Principles for Social Research</source><year>2014</year><publisher-name>Cambridge University Press</publisher-name></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brookhart</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Wyss</surname><given-names>R</given-names> </name><name name-style="western"><surname>Layton</surname><given-names>JB</given-names> </name><name name-style="western"><surname>St&#x00FC;rmer</surname><given-names>T</given-names> </name></person-group><article-title>Propensity score methods for confounding control in nonexperimental research</article-title><source>Circ Cardiovasc Qual Outcomes</source><year>2013</year><month>09</month><day>1</day><volume>6</volume><issue>5</issue><fpage>604</fpage><lpage>611</lpage><pub-id pub-id-type="doi">10.1161/CIRCOUTCOMES.113.000359</pub-id><pub-id pub-id-type="medline">24021692</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chesnaye</surname><given-names>NC</given-names> </name><name name-style="western"><surname>Stel</surname><given-names>VS</given-names> </name><name name-style="western"><surname>Tripepi</surname><given-names>G</given-names> </name><etal/></person-group><article-title>An introduction to inverse probability of treatment weighting in observational research</article-title><source>Clin Kidney J</source><year>2021</year><month>08</month><volume>15</volume><issue>1</issue><fpage>14</fpage><lpage>20</lpage><pub-id pub-id-type="doi">10.1093/ckj/sfab158</pub-id><pub-id pub-id-type="medline">35035932</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cole</surname><given-names>SR</given-names> </name><name name-style="western"><surname>Hern&#x00E1;n</surname><given-names>MA</given-names> </name></person-group><article-title>Constructing inverse probability weights for marginal structural models</article-title><source>Am J Epidemiol</source><year>2008</year><month>09</month><day>15</day><volume>168</volume><issue>6</issue><fpage>656</fpage><lpage>664</lpage><pub-id pub-id-type="doi">10.1093/aje/kwn164</pub-id><pub-id pub-id-type="medline">18682488</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Robins</surname><given-names>JM</given-names> </name></person-group><article-title>Doubly robust estimation in missing data and causal inference models</article-title><source>Biometrics</source><year>2005</year><month>12</month><volume>61</volume><issue>4</issue><fpage>962</fpage><lpage>973</lpage><pub-id pub-id-type="doi">10.1111/j.1541-0420.2005.00377.x</pub-id><pub-id pub-id-type="medline">16401269</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Robins</surname><given-names>J</given-names> </name><name name-style="western"><surname>Rotnitzky</surname><given-names>A</given-names> </name></person-group><article-title>Comment on the Bickel and Kwon article, 'Inference for semiparametric models: Some questions and an answer'</article-title><source>Stat Sin</source><year>2001</year><volume>11</volume><fpage>920</fpage><lpage>936</lpage></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Benkeser</surname><given-names>D</given-names> </name><name name-style="western"><surname>Carone</surname><given-names>M</given-names> </name><name name-style="western"><surname>Laan</surname><given-names>MJVD</given-names> </name><name name-style="western"><surname>Gilbert</surname><given-names>PB</given-names> </name></person-group><article-title>Doubly robust nonparametric inference on the average treatment effect</article-title><source>Biometrika</source><year>2017</year><month>12</month><volume>104</volume><issue>4</issue><fpage>863</fpage><lpage>880</lpage><pub-id pub-id-type="doi">10.1093/biomet/asx053</pub-id><pub-id pub-id-type="medline">29430041</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zivich</surname><given-names>PN</given-names> </name><name name-style="western"><surname>Breskin</surname><given-names>A</given-names> </name></person-group><article-title>Machine learning for causal inference: on the use of cross-fit estimators</article-title><source>Epidemiology</source><year>2021</year><month>05</month><day>1</day><volume>32</volume><issue>3</issue><fpage>393</fpage><lpage>401</lpage><pub-id pub-id-type="doi">10.1097/EDE.0000000000001332</pub-id><pub-id pub-id-type="medline">33591058</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pearl</surname><given-names>J</given-names> </name></person-group><article-title>Causal diagrams for empirical research</article-title><source>Biometrika</source><year>1995</year><month>12</month><volume>82</volume><issue>4</issue><fpage>669</fpage><lpage>688</lpage><pub-id pub-id-type="doi">10.2307/2337329</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Pearl</surname><given-names>J</given-names> </name></person-group><article-title>Causal and counterfactual inference</article-title><source>The Handbook of Rationality</source><year>2021</year><publisher-name>MIT Press</publisher-name><fpage>427</fpage><lpage>438</lpage><pub-id pub-id-type="doi">10.7551/mitpress/11252.003.0044</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Pawlowski</surname><given-names>N</given-names> </name><name name-style="western"><surname>Castro</surname><given-names>D</given-names> </name><name name-style="western"><surname>Glocker</surname><given-names>B</given-names> </name></person-group><article-title>Deep structural causal models for tractable counterfactual inference</article-title><conf-name>Advances in Neural Information Processing Systems 33 (NeurIPS 2020)</conf-name><conf-date>Dec 6-12, 2020</conf-date></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>Xia</surname><given-names>K</given-names> </name><name name-style="western"><surname>Pan</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Bareinboim</surname><given-names>E</given-names> </name></person-group><article-title>Neural causal models for counterfactual identification and estimation</article-title><source>arXiv</source><comment>Preprint posted online on  Sep 30, 2022</comment><pub-id pub-id-type="doi">10.48550/arXiv.2210.00035</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Tian</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bareinboim</surname><given-names>E</given-names> </name></person-group><article-title>Partial counterfactual identification from observational and experimental data</article-title><conf-name>The 39th International Conference on Machine Learning</conf-name><conf-date>Jul 17-23, 2022</conf-date><conf-loc>Baltimore, MD</conf-loc></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nguyen</surname><given-names>TL</given-names> </name><name name-style="western"><surname>Collins</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Landais</surname><given-names>P</given-names> </name><name name-style="western"><surname>Le Manach</surname><given-names>Y</given-names> </name></person-group><article-title>Counterfactual clinical prediction models could help to infer individualized treatment effects in randomized controlled trials-an illustration with the International Stroke Trial</article-title><source>J Clin Epidemiol</source><year>2020</year><month>09</month><volume>125</volume><fpage>47</fpage><lpage>56</lpage><pub-id pub-id-type="doi">10.1016/j.jclinepi.2020.05.022</pub-id><pub-id pub-id-type="medline">32464321</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sperrin</surname><given-names>M</given-names> </name><name name-style="western"><surname>Martin</surname><given-names>GP</given-names> </name><name name-style="western"><surname>Pate</surname><given-names>A</given-names> </name><name name-style="western"><surname>Van Staa</surname><given-names>T</given-names> </name><name name-style="western"><surname>Peek</surname><given-names>N</given-names> </name><name name-style="western"><surname>Buchan</surname><given-names>I</given-names> </name></person-group><article-title>Using marginal structural models to adjust for treatment drop-in when developing clinical prediction models</article-title><source>Stat Med</source><year>2018</year><month>12</month><day>10</day><volume>37</volume><issue>28</issue><fpage>4142</fpage><lpage>4154</lpage><pub-id pub-id-type="doi">10.1002/sim.7913</pub-id><pub-id pub-id-type="medline">30073700</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hoogland</surname><given-names>J</given-names> </name><name name-style="western"><surname>IntHout</surname><given-names>J</given-names> </name><name name-style="western"><surname>Belias</surname><given-names>M</given-names> </name><etal/></person-group><article-title>A tutorial on individualized treatment effect prediction from randomized trials with a binary endpoint</article-title><source>Stat Med</source><year>2021</year><month>11</month><day>20</day><volume>40</volume><issue>26</issue><fpage>5961</fpage><lpage>5981</lpage><pub-id pub-id-type="doi">10.1002/sim.9154</pub-id><pub-id pub-id-type="medline">34402094</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Nested approach for interval estimates of individual treatment effect algorithm. &#x03B1;=.05 to cover 95% confidence interval.</p><media xlink:href="cardio_v9i1e50627_app1.docx" xlink:title="DOCX File, 21 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Descriptive analysis of features between stroke and nonstroke.</p><media xlink:href="cardio_v9i1e50627_app2.docx" xlink:title="DOCX File, 23 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Estimated causal effect from estimators. Numbers indicate conditional average treatment (risk) effect (CATE) with 95% confidence interval. * Heart disease ** top quintile low-density lipoprotein (LDL).</p><media xlink:href="cardio_v9i1e50627_app3.docx" xlink:title="DOCX File, 22 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Sample of 50 individual treatment effects with 95% confidence intervals and stroke risk reduction who had not received antiplatelet treatment, demonstrating the potential benefits had they been given the medication. In this plot, 3 of the samples (6%) demonstrate that a considerable number of patients could have experienced a positive impact on their stroke risk reduction had they received the antiplatelet treatment. The y-axis displays the treatment effect, while the x-axis represents each individual patient in the sample.</p><media xlink:href="cardio_v9i1e50627_app4.docx" xlink:title="DOCX File, 59 KB"/></supplementary-material></app-group></back></article>