<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Cardio</journal-id><journal-id journal-id-type="publisher-id">cardio</journal-id><journal-id journal-id-type="index">26</journal-id><journal-title>JMIR Cardio</journal-title><abbrev-journal-title>JMIR Cardio</abbrev-journal-title><issn pub-type="epub">2561-1011</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e77380</article-id><article-id pub-id-type="doi">10.2196/77380</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Predicting Atrial Fibrillation Ablation Outcomes: Machine Learning Model Development and Validation Using a Large Administrative Claims Database</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Liu</surname><given-names>Yijun</given-names></name><degrees>BS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Oloko-Oba</surname><given-names>Mustapha</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Wood</surname><given-names>Kathryn A</given-names></name><degrees>RN, PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lloyd</surname><given-names>Michael S</given-names></name><degrees>MD</degrees><xref 
ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Ho</surname><given-names>Joyce C</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Hertzberg</surname><given-names>Vicki Stover</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Data and Decision Sciences, Emory University</institution><addr-line>36 Eagle Row</addr-line><addr-line>Atlanta</addr-line><addr-line>GA</addr-line><country>United States</country></aff><aff id="aff2"><institution>Nell Hodgson Woodruff School of Nursing, Emory University</institution><addr-line>1520 Clifton Road NE</addr-line><addr-line>Atlanta</addr-line><addr-line>GA</addr-line><country>United States</country></aff><aff id="aff3"><institution>Division of Cardiology, Department of Medicine, Emory University</institution><addr-line>100 Woodruff Circle</addr-line><addr-line>Atlanta</addr-line><addr-line>GA</addr-line><country>United States</country></aff><aff id="aff4"><institution>Department of Computer Science, Emory University</institution><addr-line>400 Dowman Drive</addr-line><addr-line>Atlanta</addr-line><addr-line>GA</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Gissel</surname><given-names>Christian</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Yogeshappa</surname><given-names>Vedamurthy Gejjegondanahalli</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Joyce C Ho, PhD, Department of Computer Science, Emory 
University, 400 Dowman Drive, Atlanta, GA, 30322, United States; <email>joyce.c.ho@emory.edu</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>31</day><month>12</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e77380</elocation-id><history><date date-type="received"><day>12</day><month>05</month><year>2025</year></date><date date-type="rev-recd"><day>04</day><month>12</month><year>2025</year></date><date date-type="accepted"><day>04</day><month>12</month><year>2025</year></date></history><copyright-statement>&#x00A9; Yijun Liu, Mustapha Oloko-Oba, Kathryn A Wood, Michael S Lloyd, Joyce C Ho, Vicki Stover Hertzberg. Originally published in JMIR Cardio (<ext-link ext-link-type="uri" xlink:href="https://cardio.jmir.org">https://cardio.jmir.org</ext-link>), 31.12.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Cardio, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://cardio.jmir.org">https://cardio.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://cardio.jmir.org/2025/1/e77380"/><abstract><sec><title>Background</title><p>Atrial fibrillation (AF) ablation is an effective treatment for reducing episodes and improving quality of life in patients with AF. 
However, long-term AF-free rates after AF ablation are inconsistent across the population, ranging from 50% to 75%. Patient selection relies on individual clinical assessment, highlighting a critical gap in population-level predictive analytics. While existing risk scores (eg, CHADS<sub>2</sub> [congestive heart failure, hypertension, age &#x2265;75 years, diabetes mellitus, and stroke], CHA<sub>2</sub>DS<sub>2</sub>-VASc [congestive heart failure, hypertension, age &#x2265;75 years, diabetes mellitus, stroke, vascular disease, age, and sex category], and CAAP-AF [coronary artery disease, left atrial diameter, age, AF, antiarrhythmic drugs, and female sex category]) have been applied to predict AF ablation outcomes, their performance in administrative claims data remains unclear. Leveraging large administrative claims databases represents an opportunity to develop standardized, scalable prediction models that could inform population health management and resource allocation at a national level.</p></sec><sec><title>Objective</title><p>This study utilizes machine learning (ML) models on claims data to explore if integrating <italic>International Classification of Diseases</italic> (<italic>ICD</italic>) billing codes outperforms traditional stroke and AF risk scores in predicting 1-year AF ablation outcomes.</p></sec><sec sec-type="methods"><title>Methods</title><p>We analyzed claims data from the Merative MarketScan Research Medicare database (2013&#x2010;2020) to identify 14,521 patients who underwent AF ablation. To predict 1-year AF-free outcomes, we developed logistic regression and extreme gradient boosting (XGBoost) models using demographic characteristics, comorbidity indices, and <italic>ICD</italic> diagnostic codes from the 2 years preceding ablation. 
Model predictions were compared with claims-based implementations of established risk scores&#x2014;CHADS<sub>2</sub>, CHA<sub>2</sub>DS<sub>2</sub>-VASc, and a modified CAAP-AF (without left atrial diameter and the number of failed antiarrhythmic drugs). The ML models were also assessed on subgroups of patients with paroxysmal AF, persistent AF, and both AF and atrial flutter from October 2015 onward.</p></sec><sec sec-type="results"><title>Results</title><p>Among 14,521 patients (mean age 71.5, SD 5.31 y; n=5800, 39.94% female), AF ablation success occurred in 54.01% (n=7843). XGBoost achieved areas under the receiver operating characteristic curve (AUCs) of 0.528, 0.521, and 0.529 for the whole, female, and male AF ablation groups, respectively, and better discrimination than CHADS<sub>2</sub>, CHA<sub>2</sub>DS<sub>2</sub>-VASc, and the modified CAAP-AF in all AF ablation groups (whole population, female, and male). While CHA<sub>2</sub>DS<sub>2</sub>-VASc and the modified CAAP-AF showed higher recall (&#x003E;0.798), their precision (&#x003C;0.540) was lower than that of XGBoost (0.552&#x2010;0.556). In subgroup analyses of <italic>International Classification of Diseases, Tenth Revision</italic> (<italic>ICD-10</italic>) patients (n=7646), the models incorporating <italic>ICD</italic> codes demonstrated better performance than those using only demographic and comorbidity data across most AF subtypes, with the highest AUC (0.544) observed in patients with paroxysmal AF.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>While the ML models achieved statistically significant improvements over claims-based implementations of established clinical risk scores (AUC 0.528&#x2010;0.544 vs 0.498&#x2010;0.505), the modest predictive performance highlights challenges in predicting procedural outcomes using administrative data that lack key clinical variables (eg, left atrial size and medication details). 
Our findings establish that while standardized outcome prediction using nationally available administrative data is technically feasible, current performance is insufficient for clinical decision-making and better suited for health system quality monitoring and comparative effectiveness research applications.</p></sec></abstract><kwd-group><kwd>administrative claims data</kwd><kwd>atrial fibrillation</kwd><kwd>atrial fibrillation ablation</kwd><kwd>machine learning</kwd><kwd>XGBoost</kwd><kwd>extreme gradient boosting</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Although there is currently no cure for atrial fibrillation (AF), a major public health concern in the United States, AF ablation is the most effective treatment to restore normal sinus rhythm and decrease symptoms in episodes of paroxysmal or persistent AF, thereby reducing AF burden and improving quality of life [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. AF is associated with an increased risk of cardiovascular events that may affect treatment outcomes. While various clinical risk factors are well understood, existing risk scores have shown inconsistent effectiveness in predicting AF ablation outcomes.</p><p>Existing risk scores, such as CHADS<sub>2</sub> (congestive heart failure, hypertension, age &#x2265;75 years, diabetes mellitus, and stroke) and CHA<sub>2</sub>DS<sub>2</sub>-VASc (congestive heart failure, hypertension, age &#x2265;75 years, diabetes mellitus, stroke, vascular disease, age, and sex category), have traditionally been applied to predict stroke risk and are now also utilized in predicting outcomes following COVID-19, heart surgery, and AF ablation [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. 
One risk prediction scale specifically designed to predict outcomes from AF ablation, the CAAP-AF (coronary artery disease, left atrial diameter, age, AF, antiarrhythmic drugs, and female sex category) risk score, addresses the presence or absence of coronary artery disease, the left atrial diameter, the presence of persistent AF, the number of antiarrhythmic drugs that have failed, and female sex [<xref ref-type="bibr" rid="ref12">12</xref>].</p><p>Success rates for AF ablation from the literature vary based on individual clinical variables, such as the type of AF, left atrial size, or volume index [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], yet these variables are often difficult to access in large electronic health record (EHR) datasets. Patients can continue to experience episodes of AF following initial AF ablation with long-term AF-free rates after de novo AF ablation reported as 50%-75% [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Additionally, the chance of developing any complication after AF ablation is approximately 6%, with 0.1%-0.9% of patients experiencing complications that could result in death [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. Given the modest success rates of AF ablation, the prediction of outcomes could be personalized to more easily identify those who would be most likely to benefit from AF ablation.</p><p>Machine learning (ML) has emerged as a powerful approach that leverages increased computational power with large datasets to help make complex decisions to guide clinical practice [<xref ref-type="bibr" rid="ref18">18</xref>]. 
Artificial intelligence and ML have been used in the field of electrophysiology since the 1970s for automated electrocardiogram interpretation [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. More recently, innovations in algorithms, development and labeling of large databases, and improvements in hardware and software have rapidly increased the role of ML in cardiac electrophysiology and cardiovascular imaging to identify predictors of patient outcomes [<xref ref-type="bibr" rid="ref20">20</xref>]. Recent studies have demonstrated the potential for ML approaches in cardiovascular medicine, from achieving impressive diagnostic performance using novel data sources such as mobile phone acoustics for heart failure detection [<xref ref-type="bibr" rid="ref21">21</xref>] to identifying practice gaps in stroke care guidelines [<xref ref-type="bibr" rid="ref22">22</xref>] and showing predictive accuracy across various cardiovascular disease predictions [<xref ref-type="bibr" rid="ref23">23</xref>]. ML has already been used to improve the prediction of AF ablation outcomes, primarily via EHRs. Nevertheless, health systems are not widely interoperable [<xref ref-type="bibr" rid="ref24">24</xref>]; thus, extending these prognostic tools across multiple health systems is both costly and challenging. Studies utilizing EHR data have often been limited to datasets from 1 to 2 hospitals, limiting the generalizability of the models and hindering broad adoption [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>].</p><p>Health insurance claims data, in comparison, are commonly collected, more readily available, and usually collected on a large national scale [<xref ref-type="bibr" rid="ref27">27</xref>]. 
Although EHR data, which can include medications, laboratory data, and radiology reports, are more granular than claims data and can offer more accurate predictions, claims data&#x2019;s breadth and consistency across health systems can potentially provide stronger external validity [<xref ref-type="bibr" rid="ref28">28</xref>] and more cost-effective scaling. A recent study applied ML models on health insurance data for cardiovascular outcome prediction and achieved area under the receiver operating characteristic curve (AUC) of 0.68&#x2010;0.69 for heart failure readmission prediction [<xref ref-type="bibr" rid="ref29">29</xref>], illustrating the potential for population-level insights using administrative databases. This wider coverage across patient populations and care settings may yield models that generalize more effectively, reducing the need for labor-intensive data extraction and curation that often blocks EHR-based projects. Furthermore, claims-based prognostic models can be used to enhance health care resource allocation by reducing unnecessary procedures in patients unlikely to benefit and increasing access to this effective therapy for appropriate candidates in resource-constrained regions. Thus, claims-based prognostic models represent a promising avenue for more accessible and large-scale prediction of AF ablation outcomes.</p><p>In this study, we propose to develop ML-based predictive models for outcomes of de novo AF ablation procedures using national-level claims data in the United States. Our goal is to evaluate an ML-derived risk prediction model for AF ablation patient outcomes. We hypothesize that ML models will be comparable to or exceed claim-based implementations of existing AF risk scores with respect to predictive power. 
Existing risk scores, including CHADS<sub>2</sub> and CHA<sub>2</sub>DS<sub>2</sub>-VASc, have achieved nontrivial improvements in predicting the outcomes of AF procedures (AUCs of 0.785 and 0.830, respectively, in a dataset consisting of 565 patients) [<xref ref-type="bibr" rid="ref28">28</xref>]. Thus, in this study, we utilize CHADS<sub>2</sub> and CHA<sub>2</sub>DS<sub>2</sub>-VASc as a baseline to compare with our ML approaches. In addition, we compare the performance of our ML models with a claims-based approximation of the CAAP-AF (modified CAAP-AF), a risk score specifically designed to predict AF ablation outcomes [<xref ref-type="bibr" rid="ref12">12</xref>]. We also characterize outcomes by AF subtypes and sex and use different sets of parameters in the ML models to understand the contribution of individual factors to ML prediction performance.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><p>This research leveraged deidentified claims data sourced from the Merative MarketScan Research Medicare Databases (Merative, Inc.) between January 1, 2011, and December 31, 2021. MarketScan contains claims for individuals with Medicare Supplemental and Medicare Advantage plans.</p><sec id="s2-1"><title>Patient Population</title><p>We analyzed Medicare claims data from January 1, 2011, to December 31, 2021, to identify patients who underwent AF ablation. Patients were included if they had a <italic>Current Procedural Terminology</italic> (<italic>CPT</italic>) code for AF ablation (93656) in any of the inpatient admission, inpatient services, or outpatient services tables in MarketScan. 
To ensure the accurate identification of AF ablation procedures, we required patients to have both <italic>CPT</italic> and a concurrent diagnosis of AF (<italic>International Classification of Diseases, Ninth Revision</italic> [<italic>ICD-9</italic>] code of &#x201C;427.31&#x201D; or <italic>International Statistical Classification of Diseases, Tenth Revision</italic> [<italic>ICD-10</italic>] code of &#x201C;I48.X&#x201D;). Each patient&#x2019;s medical history included all <italic>ICD</italic> codes from visits within 2 years before the initial occurrence of AF ablation within our dataset. While the 2-year lookback period captures baseline characteristics, claims data do not allow definitive confirmation that these represent truly de novo ablations, as patients may have undergone prior ablations before their enrollment period or outside the MarketScan database. Therefore, our cohort represents the best approximation of first-time AF ablation procedures available from administrative claims data.</p><p>We focused exclusively on Medicare beneficiaries for several reasons. First, the MarketScan database maintains separate patient identifiers for Medicare and commercial claims datasets, preventing integration of these patients. Second, the typical age for the first AF ablation is between 55 and 62 years [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], which is commonly covered by Medicare. Moreover, the substantial absence of postoperative outcomes for patients in the commercial database rendered it unsuitable for this study. The final cohort included 14,521 Medicare patients.</p></sec><sec id="s2-2"><title>Outcome and Subgroup Definitions</title><p>Our study&#x2019;s objective was to predict the binary outcome, success or failure, of AF ablation using patient demographics and prior medical history. 
Although the outpatient services table clearly documents the operation date for AF ablation, the inpatient admission and inpatient services tables only provide admission and discharge dates. To integrate the information across the 3 tables, we designated the admission date from the inpatient admission and inpatient services datasets as a surrogate for the AF ablation operation date in our analysis to maintain temporal coherence. Success was then defined as the absence of AF recurrence or repeat AF ablation between 6 and 12 months after the initial AF ablation procedure date, which is the standard interval before repeating an AF ablation according to current clinical practices [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. To ensure the accurate identification of successful cases, we verified that all patients had at least 1 clinical follow-up visit within the first year after ablation.</p><p>The study also employed subgroup analysis by stratifying patients into 3 groups based on AF type: paroxysmal AF, persistent AF, and AF with flutter. This analysis was only possible after October 1, 2015, as <italic>ICD-10</italic> codes provide more detailed AF type distinctions compared to earlier <italic>ICD-9</italic> codes. We defined persistent AF as patients with <italic>ICD-10</italic> codes I48.1, I48.11, I48.19, I48.2, or I48.21. Note that this reflects current changes in the terminology of types of AF as it combines persistent AF and chronic AF. We defined paroxysmal AF as patients with an <italic>ICD-10</italic> code of I48.0 or I48.20 who were free of persistent AF. We defined AF with atrial flutter as patients with any atrial flutter code (<italic>ICD-10</italic>: I48.3 or I48.4).</p></sec><sec id="s2-3"><title>Data Processing</title><p>We constructed a comprehensive 2-year historical patient snapshot by linking records across the inpatient admission, inpatient services, and outpatient services tables using unique patient identifiers. 
For each patient, we extracted demographic variables (age, sex, region, and industry) at the time of the index ablation, along with the ablation date, failure date (if applicable), and all <italic>ICD</italic> codes within the 2 years preceding the index procedure. To standardize diagnostic codes across our study period, we used the <italic>ICD-10</italic> Lookup tool [<xref ref-type="bibr" rid="ref30">30</xref>] to convert post-October 2015 <italic>ICD-10</italic> codes to their <italic>ICD-9</italic> equivalents. For computational efficiency and feature set manageability, we truncated all <italic>ICD-9</italic> codes to their first 3 digits, resulting in 785 <italic>ICD</italic> features and 19 demographic features. We used a binary measurement to denote whether or not a patient had the specific code within the 2 years prior to the initial ablation, thus avoiding extensive missing data.</p><p>We also calculated 2 established indices, the Charlson comorbidity index and the Elixhauser comorbidity index, to capture patients&#x2019; comorbid conditions [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. These indices used a weighted system based on specific conditions to provide a score, with higher values indicating more severe comorbidities.</p><p>For the subgroup analysis, we utilized three distinct datasets: (1) all the simplified 3-digit <italic>ICD</italic> codes, demographic information, and 2 established indices; (2) demographic data and 2 established indices; and (3) solely demographic information.</p></sec><sec id="s2-4"><title>Modeling</title><p>We used 2 popular supervised ML classifiers: logistic regression and extreme gradient boosting (XGBoost) [<xref ref-type="bibr" rid="ref33">33</xref>]. Logistic regression computes the probability of a binary outcome by employing a logistic function (sigmoid curve) to transform the linear combination of input features into probabilities. 
This model is particularly advantageous due to its simplicity and interpretability, especially in scenarios where the relationship between input variables and the outcome is expected to be linear. To tune the logistic regression model, we implemented grid search with 5-fold stratified cross-validation AUC as the primary evaluation metric. We explored regularization strengths (C values) on a logarithmic scale (0.001, 0.01, 0.1, 1, 10, 100) to address potential overfitting concerns. Both L1 (Lasso) and L2 (Ridge) regularization penalties were investigated to determine the optimal feature selection. We evaluated multiple solvers (&#x201C;liblinear,&#x201D; &#x201C;lbfgs,&#x201D; &#x201C;newton-cg,&#x201D; &#x201C;sag,&#x201D; &#x201C;saga&#x201D;) to identify the most computationally efficient optimization algorithm.</p><p>XGBoost represents a more sophisticated ML approach. XGBoost constructs multiple decision trees in a sequential manner, with each subsequent tree focusing on addressing the errors made by its predecessors. This method does not presuppose a linear relationship between input and output variables, offering greater flexibility and efficacy in dealing with larger and more intricate datasets. Despite its computational intensity, XGBoost is celebrated for its high efficiency and versatility, making it a potent tool in predictive modeling, especially in situations where the complexity of the data surpasses the capabilities of simpler models like logistic regression [<xref ref-type="bibr" rid="ref27">27</xref>]. To tune the XGBoost hyperparameters, we implemented grid search with 5-fold stratified cross-validation with AUC as the primary evaluation metric. We explored a range of maximum depth values (3, 6, 9, 12, 15) to adequately capture complex feature interactions while avoiding overfitting. 
The learning rate varied across 0.01, 0.05, 0.1, and 0.2 to balance convergence speed and model accuracy, while the number of estimators was tested at 100, 200, 300, and 500 to determine the optimal number of boosting rounds.</p><p>The CHADS<sub>2</sub> and CHA<sub>2</sub>DS<sub>2</sub>-VASc risk scores have been widely used to predict stroke risk in patients with AF [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. CHADS<sub>2</sub> is calculated using congestive heart failure, hypertension, age &#x2265;75 years, diabetes, and stroke (doubled), while CHA<sub>2</sub>DS<sub>2</sub>-VASc is computed using congestive heart failure, hypertension, age &#x2265;75 years (doubled), diabetes, stroke (doubled), vascular disease, age 65-74 years, and sex category (female). These risk scores have more recently been used to predict outcomes in patients with AF, heart failure, coronary artery disease, and postoperative AF undergoing cardiovascular surgical procedures [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. CHADS<sub>2</sub> and CHA<sub>2</sub>DS<sub>2</sub>-VASc risk scores were shown to be useful predictors of adverse events after AF ablation [<xref ref-type="bibr" rid="ref10">10</xref>]. In addition to CHADS<sub>2</sub> and CHA<sub>2</sub>DS<sub>2</sub>-VASc, we also evaluated a modified CAAP-AF, a risk score specifically designed to estimate the likelihood of remaining AF-free after ablation [<xref ref-type="bibr" rid="ref12">12</xref>]. Due to the limitations of claims data, we only have information on coronary artery disease, age, AF type (persistent or longstanding, available only for patients after October 2015 using <italic>ICD-10</italic>), and sex. 
Left atrial diameter and the number of failed antiarrhythmic drugs are unavailable in MarketScan, which may impact our CAAP-AF comparison.</p></sec><sec id="s2-5"><title>Statistical Analysis</title><p>We compared patient characteristics between the groups using the Student <italic>t</italic> test for continuous variables and chi-square tests for categorical variables. Continuous variables were reported as mean (SD), while categorical variables were expressed as percentages.</p><p>We assessed the performance of the ML models and baseline risk scores using 5 metrics: AUC, area under the precision recall curve (AUPRC), precision, recall, and <italic>F</italic><sub>1</sub>-score (the harmonic mean of precision and recall). Optimal hyperparameters for the ML models were first identified through 5-fold cross-validation on the full dataset. To measure performance, we then employed bootstrap resampling with 500 iterations. In each iteration, the ML model was trained on a bootstrap sample (drawn with replacement from the full dataset) using these optimal hyperparameters and then evaluated on the out-of-bag observations (samples not included in that bootstrap sample). This procedure was used to generate performance distributions and 95% CIs. Statistical significance was assessed using 1-tailed paired <italic>t</italic> tests on the bootstrap distributions to test whether ML outperformed the clinical scores (H&#x2080;: XGBoost&#x2264;clinical score).</p></sec><sec id="s2-6"><title>Ethical Considerations</title><p>This study used commercially available data that have been deidentified. As such, the study was deemed exempt by Emory University Institutional Review Board.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>We leveraged the Merative MarketScan Research Medicare Databases (Merative, Inc.) between January 1, 2011, and December 31, 2021. 
To allow for a 2-year medical history and 1-year outcome assessment, the analytic cohort included patients observed between January 1, 2013, and December 31, 2020.</p><p>The demographic and clinical profiles of the patients with AF are detailed in <xref ref-type="table" rid="table1">Tables 1 and 2</xref>. Our study cohort consisted of 14,521 patients, with an average age of 71.5 years (SD 5.31). Successful outcomes from AF ablation procedures were observed in 54.01% (n=7843) of the patients. Female patients constituted 39.94% (n=5800) of the study population. Clinically, 24.73% (n=3591) of the patients were diagnosed with concomitant atrial flutter. As shown in <xref ref-type="table" rid="table2">Table 2</xref>, the Elixhauser comorbidity index showed limited variance, with 92.89% (n=13,488) of the patients in the &#x201C;&#x2265;2&#x201D; category. The precise identification of patients with paroxysmal and persistent AF was limited, relative to the total cohort, due to the use of <italic>ICD-9</italic> instead of <italic>ICD-10</italic> prior to October 2015. A total of 7646 patients were identified using <italic>ICD-10</italic> codes for AF ablation, demonstrating a slightly reduced AF ablation success rate of 53.28% in comparison to the broader patient population. A subset of 6983 patients was categorized as having paroxysmal or persistent AF. Of the 7646 patients identified using <italic>ICD-10</italic> codes, 37.63% (n=2877) were diagnosed with paroxysmal AF, while 53.70% (n=4106) had persistent AF. 
The AF ablation success rates for paroxysmal and persistent AF were 52.55% and 53.90%, respectively.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Baseline demographic characteristics of patients undergoing AF<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> ablation.<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Demographic variable</td><td align="left" valign="bottom">Overall (N=14,521)</td><td align="left" valign="bottom">AF ablation success (n=7843)</td><td align="left" valign="bottom">AF ablation failure (n=6678)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Age (y), mean (SD)</td><td align="left" valign="top">71.5 (5.31)</td><td align="left" valign="top">71.5 (5.27)</td><td align="left" valign="top">71.6 (5.34)</td><td align="left" valign="top">.62</td></tr><tr><td align="left" valign="top">Female, n (%)</td><td align="left" valign="top">5800 (39.94)</td><td align="left" valign="top">3118 (39.76)</td><td align="left" valign="top">2682 (40.17)</td><td align="left" valign="top">.63</td></tr><tr><td align="left" valign="top" colspan="4">Region, n (%)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Northeast</td><td align="left" valign="top">2790 (19.21)</td><td align="left" valign="top">1544 (19.69)</td><td align="left" valign="top">1246 (18.66)</td><td align="left" valign="top">.12</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>North Central</td><td align="left" valign="top">4467 (30.76)</td><td align="left" valign="top">2263 (28.85)</td><td align="left" valign="top">2204 (33.00)</td><td align="left" 
valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>South</td><td align="left" valign="top">4733 (32.59)</td><td align="left" valign="top">2599 (33.14)</td><td align="left" valign="top">2134 (31.96)</td><td align="left" valign="top">.13</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>West</td><td align="left" valign="top">2393 (16.48)</td><td align="left" valign="top">1360 (17.34)</td><td align="left" valign="top">1033 (15.47)</td><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unknown</td><td align="left" valign="top">138 (0.95)</td><td align="left" valign="top">77 (0.98)</td><td align="left" valign="top">61 (0.91)</td><td align="left" valign="top">.74</td></tr><tr><td align="left" valign="top" colspan="4">Industry, n (%)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Oil and gas extraction, mining</td><td align="left" valign="top">6 (0.04)</td><td align="left" valign="top">5 (0.06)</td><td align="left" valign="top">1 (0.01)</td><td align="left" valign="top">.30</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Manufacturing, nondurable goods</td><td align="left" valign="top">3013 (20.75)</td><td align="left" valign="top">1486 (18.94)</td><td align="left" valign="top">1527 (22.87)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Manufacturing, durable goods</td><td align="left" valign="top">467 (3.21)</td><td align="left" valign="top">254 
(3.24)</td><td align="left" valign="top">213 (3.19)</td><td align="left" valign="top">.91</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Transportation, communication, utilities</td><td align="left" valign="top">1768 (12.18)</td><td align="left" valign="top">1007 (12.84)</td><td align="left" valign="top">761 (11.40)</td><td align="left" valign="top">.009</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Retail trade</td><td align="left" valign="top">42 (0.29)</td><td align="left" valign="top">22 (0.28)</td><td align="left" valign="top">20 (0.30)</td><td align="left" valign="top">.95</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Finance, insurance, real estate</td><td align="left" valign="top">661 (4.55)</td><td align="left" valign="top">371 (4.73)</td><td align="left" valign="top">290 (4.34)</td><td align="left" valign="top">.28</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Services</td><td align="left" valign="top">2866 (19.74)</td><td align="left" valign="top">1479 (18.86)</td><td align="left" valign="top">1387 (20.77)</td><td align="left" valign="top">.004</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Agriculture, forestry, fishing</td><td align="left" valign="top">4 (0.03)</td><td align="left" valign="top">2 (0.03)</td><td align="left" valign="top">2 (0.03)</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Construction</td><td align="left" valign="top">33 (0.23)</td><td align="left" valign="top">20 (0.26)</td><td align="left" valign="top">13 
(0.19)</td><td align="left" valign="top">.56</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Wholesale</td><td align="left" valign="top">54 (0.37)</td><td align="left" valign="top">37 (0.47)</td><td align="left" valign="top">17 (0.25)</td><td align="left" valign="top">.05</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unknown</td><td align="left" valign="top">5607 (38.61)</td><td align="left" valign="top">3160 (40.29)</td><td align="left" valign="top">2447 (36.64)</td><td align="left" valign="top">&#x003C;.001</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>AF: atrial fibrillation.</p></fn><fn id="table1fn2"><p><sup>b</sup>Industry is categorized based on the employer responsible for the claim payment, and regions follow the Census Bureau&#x2019;s regional definitions.  </p></fn></table-wrap-foot></table-wrap><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Baseline clinical characteristics of patients in sample undergoing AF<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> ablation.<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Clinical variable</td><td align="left" valign="bottom">Overall (N=14,521), n (%)</td><td align="left" valign="bottom">AF ablation success (n=7843), n (%)</td><td align="left" valign="bottom">AF ablation failure (n=6678), n (%)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4">Charlson comorbidity index</td><td align="left" valign="top">.29</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">4371 (30.10)</td><td 
align="left" valign="top">2375 (30.28)</td><td align="left" valign="top">1996 (29.89)</td><td align="left" valign="top">.61</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">4295 (29.58)</td><td align="left" valign="top">2277 (29.03)</td><td align="left" valign="top">2018 (30.22)</td><td align="left" valign="top">.87</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2265;2</td><td align="left" valign="top">5855 (40.32)</td><td align="left" valign="top">3191 (40.68)</td><td align="left" valign="top">2664 (39.89)</td><td align="left" valign="top">.61</td></tr><tr><td align="left" valign="top" colspan="4">Elixhauser comorbidity index</td><td align="left" valign="top">.45</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">44 (0.30)</td><td align="left" valign="top">24 (0.31)</td><td align="left" valign="top">20 (0.30)</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">989 (6.81)</td><td align="left" valign="top">515 (6.57)</td><td align="left" valign="top">474 (7.10)</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2265;2</td><td align="left" valign="top">13,488 (92.89)</td><td align="left" valign="top">7304 (93.13)</td><td align="left" valign="top">6184 (92.60)</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top">Both atrial flutter and AF (<italic>ICD-9</italic><sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup> and 
<italic>ICD-10</italic><sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup>)</td><td align="left" valign="top">3591 (24.73)</td><td align="left" valign="top">1963 (25.03)</td><td align="left" valign="top">1628 (24.38)</td><td align="left" valign="top">.38</td></tr><tr><td align="left" valign="top">Patients with <italic>ICD-10</italic></td><td align="left" valign="top">7646 (52.65)</td><td align="left" valign="top">4074 (51.94)</td><td align="left" valign="top">3572 (53.49)</td><td align="left" valign="top">.51</td></tr><tr><td align="left" valign="top">Paroxysmal AF (<italic>ICD-10</italic> only)</td><td align="left" valign="top">2877 (37.63)</td><td align="left" valign="top">1512 (37.11)</td><td align="left" valign="top">1365 (38.21)</td><td align="left" valign="top">.33</td></tr><tr><td align="left" valign="top">Persistent AF (<italic>ICD-10</italic> only)</td><td align="left" valign="top">4106 (53.70)</td><td align="left" valign="top">2213 (54.32)</td><td align="left" valign="top">1893 (53.00)</td><td align="left" valign="top">.26</td></tr><tr><td align="left" valign="top">Unspecified AF</td><td align="left" valign="top">663 (8.67)</td><td align="left" valign="top">349 (8.57)</td><td align="left" valign="top">314 (8.79)</td><td align="left" valign="top">.76</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>AF: atrial fibrillation.</p></fn><fn id="table2fn2"><p><sup>b</sup>Paroxysmal and persistent AF classifications exist only in the <italic>ICD-10</italic> space; percentages for these rows are therefore based on the <italic>ICD-10</italic> population, of which the overall population is 7646, the success population is 4074, and the failure population is 3572.</p></fn><fn id="table2fn3"><p><sup>c</sup><italic>ICD-9</italic>: <italic>International Classification of Diseases, Ninth Revision</italic>.</p></fn><fn id="table2fn4"><p><sup>d</sup><italic>ICD-10</italic>: <italic>International Statistical Classification of Diseases, Tenth Revision</italic>.</p></fn></table-wrap-foot></table-wrap><p><xref 
ref-type="table" rid="table3">Table 3</xref> shows the comparative performance of XGBoost, CHADS<sub>2</sub>, and CHA<sub>2</sub>DS<sub>2</sub>-VASc for our entire study cohort. XGBoost consistently outperformed logistic regression in all analyses; therefore, only XGBoost results are presented for brevity. The full comparison between XGBoost and logistic regression is available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The XGBoost model exhibited modest predictive capability with an AUC of 0.528 for the overall population. It performed slightly better in male (AUC=0.529) than in female patients (AUC=0.521). The model achieved balanced performance with an <italic>F</italic><sub>1</sub>-score of 0.581 and recall of 0.608, indicating that it captures most positive cases while maintaining reasonable precision at 0.556. Male patients showed slightly higher recall (0.614) than female patients (0.600).</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Performance comparison between XGBoost<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> and CHADS<sub>2</sub><sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> and CHA<sub>2</sub>DS<sub>2</sub>-VASc<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup> risk scores stratified by sex.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Metric</td><td align="left" valign="bottom">XGBoost<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="left" valign="bottom">CHADS<sub>2</sub></td><td align="left" valign="bottom">CHA<sub>2</sub>DS<sub>2</sub>-VASc</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4">Population (n=14,521)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="left" 
valign="top">0.528<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (0.519&#x2010;0.533)</td><td align="left" valign="top">0.498</td><td align="left" valign="top">0.498</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUPRC<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup></td><td align="left" valign="top">0.562<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (0.545&#x2010;0.578)</td><td align="left" valign="top">0.536</td><td align="left" valign="top">0.539</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.581 (0.569&#x2010;0.594)</td><td align="left" valign="top">0.436</td><td align="left" valign="top">0.644</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.556<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (0.542&#x2010;0.570)</td><td align="left" valign="top">0.533</td><td align="left" valign="top">0.540</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recall</td><td align="left" valign="top">0.608 (0.585&#x2010;0.632)</td><td align="left" valign="top">0.368</td><td align="left" valign="top">0.799</td></tr><tr><td align="left" valign="top" colspan="4">Female (n=5800)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC</td><td align="left" valign="top">0.521<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (0.510&#x2010;0.532)</td><td align="left" valign="top">0.498</td><td align="left" valign="top">0.500</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUPRC</td><td align="left" valign="top">0.558<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (0.533&#x2010;0.582)</td><td align="left" valign="top">0.536</td><td align="left" valign="top">0.538</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.575 (0.556&#x2010;0.593)</td><td align="left" valign="top">0.436</td><td align="left" valign="top">0.698</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.552<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (0.530&#x2010;0.574)</td><td align="left" valign="top">0.533</td><td align="left" valign="top">0.538</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recall</td><td align="left" valign="top">0.600 (0.568&#x2010;0.632)</td><td align="left" valign="top">0.368</td><td align="left" valign="top">0.995</td></tr><tr><td align="left" valign="top" colspan="4">Male (n=8721)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC</td><td align="left" valign="top">0.529<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (0.520&#x2010;0.539)</td><td align="left" valign="top">0.498</td><td align="left" valign="top">0.498</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUPRC</td><td align="left" valign="top">0.566<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (0.546&#x2010;0.588)</td><td align="left" valign="top">0.541</td><td align="left" valign="top">0.541</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.585 (0.568&#x2010;0.601)</td><td align="left" valign="top">0.410</td><td align="left" valign="top">0.599</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.559<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup> (0.540&#x2010;0.578)</td><td align="left" valign="top">0.538</td><td align="left" valign="top">0.542</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recall</td><td align="left" valign="top">0.614 (0.582&#x2010;0.644)</td><td align="left" valign="top">0.331</td><td align="left" valign="top">0.669</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>XGBoost: extreme gradient boosting.</p></fn><fn id="table3fn2"><p><sup>b</sup>CHADS<sub>2</sub>: congestive heart failure, hypertension, age &#x2265;75 years, diabetes mellitus, and stroke.</p></fn><fn id="table3fn3"><p><sup>c</sup>CHA<sub>2</sub>DS<sub>2</sub>-VASc: congestive heart failure, hypertension, age &#x2265;75 years, diabetes mellitus, stroke, vascular disease, age, and sex category.</p></fn><fn id="table3fn4"><p><sup>d</sup>Cell values for XGBoost report average and the 95% CI in parentheses.</p></fn><fn id="table3fn5"><p><sup>e</sup>AUC: area under the receiver operating characteristic curve.</p></fn><fn id="table3fn6"><p><sup>f</sup><italic>P</italic>&#x003C;.001 (XGBoost vs both clinical scores).</p></fn><fn id="table3fn7"><p><sup>g</sup>AUPRC: area under the precision recall curve.</p></fn></table-wrap-foot></table-wrap><p>Despite its moderate predictive power, the XGBoost model consistently outperformed both CHADS<sub>2</sub> and CHA<sub>2</sub>DS<sub>2</sub>-VASc scores across all patient cohorts in terms of AUC and 
AUPRC. Both risk scores (CHADS<sub>2</sub> and CHA<sub>2</sub>DS<sub>2</sub>-VASc) performed poorly with AUC values worse than random chance (&#x003C;0.5) except for CHA<sub>2</sub>DS<sub>2</sub>-VASc in the female subgroup (AUC=0.5). CHADS<sub>2</sub> had poor recall (0.368) and low <italic>F</italic><sub>1</sub>-scores (0.436), missing most positive cases. While CHA<sub>2</sub>DS<sub>2</sub>-VASc demonstrated high recall (0.799), particularly in female patients (0.995), the lower precision of 0.540 and AUC below 0.5 suggest that the score&#x2019;s high sensitivity produces a higher false positive rate.</p><p><xref ref-type="table" rid="table4">Table 4</xref> presents a comparative analysis of the XGBoost and the modified CAAP-AF risk scores for the <italic>ICD-10</italic> cohort. XGBoost outperformed the modified CAAP-AF risk score with an overall AUC of 0.544 and AUPRC of 0.567 and consistent subgroup performance (female patients: AUC 0.543, AUPRC 0.569; male patients: AUC 0.545, AUPRC 0.567). In contrast, the modified CAAP-AF risk score achieved an overall AUC of 0.505, rising slightly to 0.511 in male patients but performing no better than random chance in female patients. While the modified CAAP-AF risk score exhibited high recall (0.999), capturing nearly all positive cases, it came at the cost of lower precision (0.533). XGBoost achieved better precision (0.552), albeit at a lower recall (0.793) and <italic>F</italic><sub>1</sub>-score. 
All differences between the models were statistically significant.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Performance comparison between XGBoost<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> (ML<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> model) and modified CAAP-AF<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup> risk score stratified by sex.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Metric</td><td align="left" valign="bottom">XGBoost<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup></td><td align="left" valign="bottom">Modified CAAP-AF</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="3"><italic>ICD-10</italic><sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup> population (n=7646)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup></td><td align="left" valign="top">0.544<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup> (0.535&#x2010;0.553)</td><td align="left" valign="top">0.505</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUPRC<sup><xref ref-type="table-fn" rid="table4fn8">h</xref></sup></td><td align="left" valign="top">0.567<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup> (0.545&#x2010;0.590)</td><td align="left" valign="top">0.537</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.651 (0.627&#x2010;0.672)</td><td align="left" valign="top">0.695<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.552<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup> (0.535&#x2010;0.572)</td><td align="left" valign="top">0.533</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recall</td><td align="left" valign="top">0.793 (0.709&#x2010;0.867)</td><td align="left" valign="top">0.999<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td></tr><tr><td align="left" valign="top" colspan="3">Female (n=3161)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC</td><td align="left" valign="top">0.543<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup> (0.516&#x2010;0.573)</td><td align="left" valign="top">0.500</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUPRC</td><td align="left" valign="top">0.569<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup> (0.533&#x2010;0.605)</td><td align="left" valign="top">0.533</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.645 (0.615&#x2010;0.672)</td><td align="left" valign="top">0.694<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.550<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup> (0.519&#x2010;0.578)</td><td align="left" valign="top">0.531</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recall</td><td align="left" 
valign="top">0.783 (0.701&#x2010;0.864)</td><td align="left" valign="top">1.000<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td></tr><tr><td align="left" valign="top" colspan="3">Male (n=4485)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC</td><td align="left" valign="top">0.545<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup> (0.522&#x2010;0.569)</td><td align="left" valign="top">0.511</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUPRC</td><td align="left" valign="top">0.567<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup> (0.540&#x2010;0.596)</td><td align="left" valign="top">0.542</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.655 (0.625&#x2010;0.678)</td><td align="left" valign="top">0.696<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.554<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup> (0.533&#x2010;0.579)</td><td align="left" valign="top">0.535</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recall</td><td align="left" valign="top">0.801 (0.717&#x2010;0.875)</td><td align="left" valign="top">0.999<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>XGBoost: extreme gradient boosting.</p></fn><fn id="table4fn2"><p><sup>b</sup>ML: machine learning.</p></fn><fn id="table4fn3"><p><sup>c</sup>CAAP-AF: coronary artery disease, left atrial diameter, 
age, AF, antiarrhythmic drugs, and female sex category.</p></fn><fn id="table4fn4"><p><sup>d</sup>Cell values for XGBoost report average and the 95% CI in parentheses.</p></fn><fn id="table4fn5"><p><sup>e</sup><italic>ICD-10</italic>: <italic>International Statistical Classification of Diseases, Tenth Revision</italic>.</p></fn><fn id="table4fn6"><p><sup>f</sup>AUC: area under the receiver operating characteristic curve.</p></fn><fn id="table4fn7"><p><sup>g</sup><italic>P</italic>&#x003C;.001 for comparison between XGBoost and modified CAAP-AF.</p></fn><fn id="table4fn8"><p><sup>h</sup>AUPRC: area under the precision recall curve.</p></fn></table-wrap-foot></table-wrap><p><xref ref-type="table" rid="table5">Table 5</xref> presents the predictive model performance across atrial arrhythmia subgroups: paroxysmal AF, persistent AF, and AF with atrial flutter. A total of 3 feature sets were compared: <italic>ICD</italic> codes with demographics and comorbidity indices, demographics and comorbidity indices, and demographics only. 
On the entire <italic>ICD-10</italic> population, incorporating all the features (<italic>ICD</italic> codes with demographics and comorbidity indices) achieved the best performance across all 5 metrics when compared to the other 2 feature sets, with AUC of 0.544, AUPRC of 0.567, <italic>F</italic><sub>1</sub>-score of 0.652, precision of 0.551, and recall of 0.798.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Predictive performance by clinical and demographic predictors across atrial arrhythmia subgroups.<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup></p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Metric</td><td align="left" valign="bottom"><italic>ICD</italic><sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup>+demographic+comorbidity indices, average (95% CI)</td><td align="left" valign="bottom">Demographic+comorbidity indices, average (95% CI)</td><td align="left" valign="bottom">Demographic only, average (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4">Paroxysmal AF<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup> (n=2877)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup></td><td align="left" valign="top">0.538 (0.523&#x2010;0.553)</td><td align="left" valign="top">0.520 (0.530&#x2010;0.558)</td><td align="left" valign="top">0.532 (0.517&#x2010;0.547)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUPRC<sup><xref ref-type="table-fn" rid="table5fn5">e</xref></sup></td><td align="left" valign="top">0.557 (0.520&#x2010;0.596)</td><td align="left" valign="top">0.564 (0.529&#x2010;0.595)</td><td align="left" valign="top">0.547 (0.515&#x2010;0.582)</td></tr><tr><td align="left" 
valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.563 (0.531&#x2010;0.593)</td><td align="left" valign="top">0.596 (0.540&#x2010;0.639)</td><td align="left" valign="top">0.645 (0.581&#x2010;0.680)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.551 (0.514&#x2010;0.585)</td><td align="left" valign="top">0.548 (0.513&#x2010;0.582)</td><td align="left" valign="top">0.541 (0.509&#x2010;0.570)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recall</td><td align="left" valign="top">0.576 (0.520&#x2010;0.629)</td><td align="left" valign="top">0.660 (0.525&#x2010;0.789)</td><td align="left" valign="top">0.808 (0.620&#x2010;0.948)</td></tr><tr><td align="left" valign="top" colspan="4">Persistent AF (n=4106)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC</td><td align="left" valign="top">0.525 (0.512&#x2010;0.537)</td><td align="left" valign="top">0.518 (0.504&#x2010;0.531)</td><td align="left" valign="top">0.524 (0.510&#x2010;0.537)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUPRC</td><td align="left" valign="top">0.561 (0.532&#x2010;0.592)</td><td align="left" valign="top">0.552 (0.522&#x2010;0.582)</td><td align="left" valign="top">0.557 (0.529&#x2010;0.586)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.575 (0.550&#x2010;0.596)</td><td align="left" valign="top">0.626 (0.586&#x2010;0.659)</td><td align="left" valign="top">0.658 
(0.612&#x2010;0.689)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.554 (0.525&#x2010;0.582)</td><td align="left" valign="top">0.549 (0.522&#x2010;0.574)</td><td align="left" valign="top">0.545 (0.520&#x2010;0.573)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recall</td><td align="left" valign="top">0.598 (0.553&#x2010;0.641)</td><td align="left" valign="top">0.731 (0.622&#x2010;0.821)</td><td align="left" valign="top">0.834 (0.677&#x2010;0.947)</td></tr><tr><td align="left" valign="top" colspan="4"><italic>ICD-10</italic><sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup>, with AF (n=1503)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC</td><td align="left" valign="top">0.528 (0.506&#x2010;0.549)</td><td align="left" valign="top">0.514 (0.493&#x2010;0.535)</td><td align="left" valign="top">0.517 (0.497&#x2010;0.537)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUPRC</td><td align="left" valign="top">0.564 (0.516&#x2010;0.609)</td><td align="left" valign="top">0.555 (0.512&#x2010;0.602)</td><td align="left" valign="top">0.558 (0.513&#x2010;0.605)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.600 (0.551&#x2010;0.644)</td><td align="left" valign="top">0.607 (0.552&#x2010;0.655)</td><td align="left" valign="top">0.611 (0.556&#x2010;0.655)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.556 
(0.508&#x2010;0.601)</td><td align="left" valign="top">0.547 (0.507&#x2010;0.589)</td><td align="left" valign="top">0.693 (0.548&#x2010;0.823)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recall</td><td align="left" valign="top">0.657 (0.551&#x2010;0.770)</td><td align="left" valign="top">0.688 (0.552&#x2010;0.815)</td><td align="left" valign="top">0.550 (0.509&#x2010;0.597)</td></tr><tr><td align="left" valign="top" colspan="4"><italic>ICD-10</italic> population (n=7646)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUC</td><td align="left" valign="top">0.544 (0.535&#x2010;0.553)</td><td align="left" valign="top">0.533 (0.523&#x2010;0.542)</td><td align="left" valign="top">0.536 (0.528&#x2010;0.545)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>AUPRC</td><td align="left" valign="top">0.567 (0.545&#x2010;0.589)</td><td align="left" valign="top">0.556 (0.532&#x2010;0.579)</td><td align="left" valign="top">0.559 (0.536&#x2010;0.581)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.652 (0.625&#x2010;0.672)</td><td align="left" valign="top">0.621 (0.595&#x2010;0.645)</td><td align="left" valign="top">0.645 (0.610&#x2010;0.672)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Precision</td><td align="left" valign="top">0.551 (0.531&#x2010;0.573)</td><td align="left" valign="top">0.550 (0.530&#x2010;0.570)</td><td align="left" valign="top">0.548 (0.528&#x2010;0.570)</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recall</td><td align="left" valign="top">0.798 (0.713&#x2010;0.871)</td><td align="left" valign="top">0.714 (0.644&#x2010;0.796)</td><td align="left" valign="top">0.787 (0.681&#x2010;0.878)</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>This population only includes patients who had their first atrial fibrillation ablation in or after October 2015. Predictors include <italic>ICD</italic> codes of patients&#x2019; past medical history and demographic variables (region, sex, age, and industry). </p></fn><fn id="table5fn2"><p><sup>b</sup><italic>ICD</italic>: <italic>International Classification of Diseases</italic>.</p></fn><fn id="table5fn3"><p><sup>c</sup>AF: atrial fibrillation.</p></fn><fn id="table5fn4"><p><sup>d</sup>AUC: area under the receiver operating characteristic curve.</p></fn><fn id="table5fn5"><p><sup>e</sup>AUPRC: area under the precision recall curve.</p></fn><fn id="table5fn6"><p><sup>f</sup><italic>ICD-10</italic>: <italic>International Statistical Classification of Diseases, Tenth Revision</italic>.</p></fn></table-wrap-foot></table-wrap><p>Within the atrial arrhythmia subgroups, models incorporating all features consistently achieved the highest AUC and AUPRC across all 3 subgroups. However, performance patterns for <italic>F</italic><sub>1</sub>-score and recall varied by subgroup. For paroxysmal AF and persistent AF, the full model also achieved the highest precision (0.551 and 0.554, respectively), but the models with demographics only had better recall (0.808 and 0.834, respectively) and <italic>F</italic><sub>1</sub>-scores (0.645 and 0.658, respectively). 
For AF with atrial flutter, the model with demographics only achieved the highest <italic>F</italic><sub>1</sub>-score (0.611) and precision (0.693), whereas the model with demographics and comorbidity indices achieved the highest recall (0.688).</p></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this study, we developed ML models that predict the outcomes of de novo AF ablation procedures. Our XGBoost model demonstrated statistically significant improved performance compared to 3 different claim-based implementations of clinical risk scores (CHADS<sub>2</sub>, CHA<sub>2</sub>DS<sub>2</sub>-VASc, and a limited, modified CAAP-AF without left atrial diameter and the number of failed antiarrhythmic drugs) in all patient and sex subgroups in terms of AUC and AUPRC. While the 2 risk scores achieved higher recall than XGBoost, they demonstrated lower precision and weaker discrimination (near random chance). However, XGBoost&#x2019;s predictive ability for outcomes after AF ablation was found to be lower in female patients than it was in male patients or in the entire population. There was no difference in AUC when comparing CHADS<sub>2</sub> to CHA<sub>2</sub>DS<sub>2</sub>-VASc risk scores for outcomes after AF ablation except for female patients, where CHA<sub>2</sub>DS<sub>2</sub>-VASc performs better than CHADS<sub>2</sub>.</p><p>When comparing outcomes across different AF subtypes (paroxysmal, persistent, or AF with atrial flutter), we observed heterogeneous patterns in the value of adding <italic>ICD</italic> code features. For persistent AF and AF with atrial flutter, the models incorporating <italic>ICD</italic> code features demonstrated superior discriminative power (AUC and AUPRC) compared to models using either demographic or clinical variables alone or those combined with comorbidity indices (Charlson comorbidity index and the Elixhauser comorbidity index). 
However, in the paroxysmal AF subgroup, the model using only demographics and comorbidity indices slightly outperformed the full model with <italic>ICD</italic> codes in terms of AUPRC but not AUC. Additionally, models using demographics only consistently achieved higher recall across all subgroups at the expense of lower precision and overall discriminative performance (AUC and AUPRC), revealing a trade-off between recall and precision in feature selection. These ML models may be useful in clinical practice for patient selection for AF ablation in the future.</p></sec><sec id="s4-2"><title>Comparison to Prior Work</title><p>Claims data present challenges for outcome prediction, despite being readily available. Previous clinical models for predicting AF ablation success have reported an AUC ranging from 0.55 to 0.65, with only 3 models achieving an AUC of 0.75 [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. In other studies, CHADS<sub>2</sub> and CHA<sub>2</sub>DS<sub>2</sub>-VASc achieved an AUC of 0.785 and 0.830, respectively, in predicting complications after AF ablation [<xref ref-type="bibr" rid="ref6">6</xref>]. However, in our study, CHADS<sub>2</sub> and CHA<sub>2</sub>DS<sub>2</sub>-VASc only achieved an AUC of 0.498&#x2010;0.500, performing no better than random guessing. 
It is important to note that while CHADS<sub>2</sub> and CHA<sub>2</sub>DS<sub>2</sub>-VASc have been used for predicting procedural outcomes [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref6">6</xref>], they were originally designed to estimate stroke risk rather than ablation recurrence, and thus their lower performance in this study potentially reflects use outside of the intended purpose rather than a failure of the scores themselves.</p><p>The CAAP-AF score reached an AUC greater than 0.650 [<xref ref-type="bibr" rid="ref12">12</xref>] with the data from its original study, yet our modified implementation achieved no better than 0.511. However, the CAAP-AF score used in our study was a modified, claims-based approximation that excluded left atrial diameter and the number of failed antiarrhythmic drugs, as these are not available in claims data. Therefore, our comparison does not represent a true head-to-head evaluation of the original CAAP-AF model, and the ML model&#x2019;s advantage should be interpreted with this limitation in mind.</p><p>These findings highlight the significant difficulty in predicting AF ablation success and failure using claims data, reflecting broader challenges in health care outcome prediction where administrative databases consistently underperform compared to clinical models due to the absence of key physiological and procedural variables, a pattern observed across multiple medical specialties and intervention types [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. In contrast, our ML models achieved AUCs of 0.521&#x2010;0.529, showing marginal improvement.</p><p>Despite the modest predictive performance of the ML models, our claims-based approach has significant potential for standardization across health care systems, as it relies on widely used <italic>ICD</italic> and <italic>CPT</italic> coding systems rather than institution-specific EHR implementations. 
However, adoption barriers remain, including variations in coding practices across institutions, the challenge of integrating predictive tools into clinical workflows, and potential resistance from clinicians who may prioritize clinical judgment over algorithmic recommendations. Given the relatively low AUC values observed, these models should be viewed as a foundational step toward using claims data to predict the outcomes of AF ablation procedures, rather than as tools ready for clinical deployment.</p><p>Beyond demonstrating that ML models outperform traditional risk scores, we conducted an analysis to understand what types of features should be included in the ML models across clinically relevant AF subgroups. We evaluated 3 feature sets: (1) demographic information alone; (2) demographics plus comorbidity indices; and (3) the full features incorporating <italic>ICD</italic> codes, demographics, and comorbidity indices. These were tested across 3 clinically distinct subgroups (paroxysmal AF, persistent AF, and AF with atrial flutter) identifiable only through <italic>ICD-10</italic> coding, yielding 9 unique ML models. Across persistent AF and AF with atrial flutter subgroups, ML models performed best when including <italic>ICD</italic> codes as features, highlighting the importance of diagnostic coding data. Among the 3 subgroups (paroxysmal AF, persistent AF, and AF with atrial flutter), the ML models performed best for patients with paroxysmal AF and worst for patients with persistent AF. The entire <italic>ICD-10</italic> population achieved the highest overall AUC compared to other subgroups, which was likely due to the larger sample size.</p></sec><sec id="s4-3"><title>Future Directions</title><p>Our findings demonstrate that ML models using <italic>ICD</italic> codes to estimate AF ablation procedural outcomes are robust and valid across populations. 
However, the model&#x2019;s current predictive power in this study remains insufficient for clinical decision-making. Improvement of outcome predictions for AF ablation using ML has the potential for widespread use in research and clinical practice to determine optimal patient selection for AF ablation and the management of patients with AF. Advances in artificial intelligence and ML technology have the ability to rapidly analyze and synthesize innumerable variables to predict outcomes of AF ablation and discover new patterns of clinical variables that greatly surpass prior conventional methods of gauging success. These findings will be important to consider, as health care policymakers struggle to allocate limited resources to as many patients as possible and search for ways to improve patient outcomes. ML technologies will play increasingly important roles in medicine with future advances as we better learn how to incorporate ML for better health care resource allocation as well as improvements in clinical practice and patient outcomes.</p><p>Several specific clinical implementation scenarios could leverage these predictive tools to enhance AF ablation care delivery. An important deployment consideration is the metric to optimize, as our findings revealed a trade-off between precision and recall. For population health monitoring, quality improvement initiatives, or patient counseling, high-recall models may be preferred. Conversely, for resource allocation decisions such as prioritizing ablation slots during periods of limited procedure capacity, high-precision models would be more appropriate to minimize false positives. Clinicians could use model predictions to provide patients with more personalized success probability estimates during shared decision-making discussions, helping patients make more informed treatment choices. 
Alternatively, these models could guide the development of alternative treatment pathways or enhanced monitoring protocols for patients with consistently lower predicted success rates. Future research should focus on developing implementation frameworks that appropriately balance algorithmic predictions with clinical judgment and metric selection based on clinical context while ensuring equitable access to AF ablation across diverse patient populations.</p></sec><sec id="s4-4"><title>Limitations</title><p>First, our study relied exclusively on Medicare Advantage and Medicare Supplemental claims, which skews the cohort toward older patients. Because first ablations often occur between ages 55 and 62 years, our findings may not be generalizable to younger populations with different comorbidity profiles and procedural outcomes. The etiology and pathophysiology of AF may differ between younger and older patients, which could affect both the predictive variables and outcomes in ways that our models may not capture. Future work should validate and potentially recalibrate these models in younger and more diverse populations to ensure broader clinical utility.</p><p>Second, as with all administrative data, coding errors and inconsistencies are possible. We mitigated this by truncating <italic>ICD</italic> codes into broader categories, incorporating 2 established comorbidity indices (Charlson comorbidity index and the Elixhauser comorbidity index), and requiring that all patients had a documented AF diagnosis before ablation. Despite these steps, misclassification could still reduce model performance. Moreover, truncating <italic>ICD-9</italic> codes to the first 3 digits may also have reduced diagnostic specificity. This limitation may explain our unexpected finding that the model using only demographics and comorbidity indices slightly outperformed the full model with <italic>ICD</italic> codes in the paroxysmal AF subgroup. 
The truncated <italic>ICD</italic> codes may have introduced noise rather than signal for this subgroup, particularly if patients with paroxysmal AF have less diverse billing code profiles making the additional <italic>ICD</italic> code features less informative. Future analysis may mitigate the issue by integrating claims with richer data sources to cross-validate the information.</p><p>Third, while we aimed to study de novo AF ablation procedures, administrative claims data have inherent limitations in both identifying first-time ablations and measuring their outcomes. Although we identified the initial occurrence of AF ablation within our dataset, we cannot definitively exclude patients who may have undergone prior ablations before their enrollment in the database or at facilities not captured in MarketScan. Furthermore, our outcome definition may be subject to misclassification as we are using billing codes as a proxy for clinical recurrence. Asymptomatic or unrecorded recurrences could be missed (falsely classified as success), while unrelated visits coded with previous AF could be incorrectly classified as failures. Additionally, patients with undetected prior ablations may have different recurrence trajectories than true first-time procedures, further complicating outcome assessment. AF recurrence is best confirmed with secondary data sources such as Holter monitoring or electrocardiogram data.</p><p>Fourth, claims data lack important clinical variables known to influence AF ablation outcomes, such as left atrial size, ejection fraction, specific antiarrhythmic medications, and procedural details (catheter type, ablation strategy). This limitation likely contributed to our models&#x2019; modest predictive performance compared to clinical prediction models that incorporate these variables. 
Additionally, the limited variance in the Elixhauser comorbidity index, where 92.89% (n=13,488) of patients fell into a single category (&#x2265;2), reduced its discriminative value and may explain why adding comorbidity indices to demographic variables resulted in minimal or slightly negative effects on model performance in some subgroups. While we cannot address this limitation within our study design, future research could explore hybrid approaches that combine claims data with targeted clinical data collection for key predictive variables. However, we note this may limit the scalability and standardization advantages that motivated our claims-based approach.</p><p>Finally, given the proprietary nature of MarketScan data, direct replication is constrained. To enhance transparency and reproducibility, we documented our data source, inclusion and exclusion criteria, billing codes, and potential confounders and released the analytic code in a public GitHub repository to facilitate replication [<xref ref-type="bibr" rid="ref36">36</xref>]. This enables researchers with access to similar claims databases to replicate our methodology, though exact replication would require the same data source.</p></sec><sec id="s4-5"><title>Conclusions</title><p>In this study, we developed and evaluated ML models using MarketScan claims data to predict 1-year AF ablation outcomes. Across the overall cohort and sex-stratified groups, ML models modestly but consistently outperformed claim-based implementations of established clinical risk scores. In the <italic>ICD-10</italic> subset, incorporating <italic>ICD</italic> diagnostic codes improved performance relative to the models using only demographic and comorbidity indices over most subgroups. Our findings demonstrate the limitations of ML approaches when applied to claims data that lack key clinical variables, such as left atrial size, ejection fraction, and medication details. 
The modest predictive performance indicates that current claims-based models are insufficient for individual clinical decision-making. Despite these constraints, our work establishes that standardized, population-level outcome prediction using nationally available administrative data is technically feasible, providing capability that could complement existing clinical tools for health system quality monitoring and research applications. These results contribute important insights into the potential and limitations of claims-based prediction models for population-level analyses and comparative effectiveness research.</p></sec></sec></body><back><ack><p>No generative artificial intelligence (GenAI) models (including large language models such as ChatGPT) were used in the conduct of this research, data analysis, or original writing of this manuscript. Code auto-completion tools were used during programming, with all generated code manually reviewed. Limited GenAI assistance was used to refine language during manuscript revision. We used the Python scikit-learn module to perform logistic regression and extreme gradient boosting, which formed the body of this research [<xref ref-type="bibr" rid="ref37">37</xref>].</p></ack><notes><sec><title>Funding</title><p>This work was supported by the National Institutes of Health (grant NHLBI #R21HL156184; principal investigator: VSH).</p></sec><sec><title>Data Availability</title><p>The Merative MarketScan Research Medicare database is proprietary and not publicly accessible. 
Interested researchers may obtain access directly from Merative under a licensing agreement.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: JCH, MSL, VSH, YL</p><p>Data curation: MOO, VSH, YL</p><p>Formal analysis: JCH, KAW, MOO, MSL, VSH, YL</p><p>Funding acquisition: JCH, KAW, VSH</p><p>Investigation: YL</p><p>Methodology: JCH, MOO, VSH, YL</p><p>Project administration: VSH</p><p>Supervision: JCH, KAW, VSH</p><p>Writing &#x2013; original draft: YL</p><p>Writing &#x2013; review &#x0026; editing: JCH, KAW, MOO, MSL, VSH</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AF</term><def><p>atrial fibrillation</p></def></def-item><def-item><term id="abb2">AUC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb3">AUPRC</term><def><p>area under the precision recall curve</p></def></def-item><def-item><term id="abb4">CAAP-AF</term><def><p>coronary artery disease, left atrial diameter, age, AF, antiarrhythmic drugs, and female sex category</p></def></def-item><def-item><term id="abb5">CHA<sub>2</sub>DS<sub>2</sub>-VASc</term><def><p>congestive heart failure, hypertension, age &#x2265;75 years, diabetes mellitus, stroke, vascular disease, age 65&#x2010;74 years, and sex category</p></def></def-item><def-item><term id="abb6">CHADS<sub>2</sub></term><def><p>congestive heart failure, hypertension, age &#x2265;75 years, diabetes mellitus, and stroke</p></def></def-item><def-item><term id="abb7"><italic>CPT</italic></term><def><p><italic>Current Procedural Terminology</italic></p></def></def-item><def-item><term id="abb8">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb9"><italic>ICD</italic></term><def><p><italic>International Classification of Diseases</italic></p></def></def-item><def-item><term id="abb10"><italic>ICD-10</italic></term><def><p><italic>International Statistical 
Classification of Diseases, Tenth Revision</italic></p></def></def-item><def-item><term id="abb11"><italic>ICD-9</italic></term><def><p><italic>International Classification of Diseases, Ninth Revision</italic></p></def></def-item><def-item><term id="abb12">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb13">XGBoost</term><def><p>extreme gradient boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tzeis</surname><given-names>S</given-names> </name><name name-style="western"><surname>Gerstenfeld</surname><given-names>EP</given-names> </name><name name-style="western"><surname>Kalman</surname><given-names>J</given-names> </name><etal/></person-group><article-title>2024 European Heart Rhythm Association/Heart Rhythm Society/Asia Pacific Heart Rhythm Society/Latin American Heart Rhythm Society expert consensus statement on catheter and surgical ablation of atrial fibrillation</article-title><source>Europace</source><year>2024</year><month>03</month><day>30</day><volume>26</volume><issue>4</issue><fpage>euae043</fpage><pub-id pub-id-type="doi">10.1093/europace/euae043</pub-id><pub-id pub-id-type="medline">38587017</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Martin</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Aday</surname><given-names>AW</given-names> </name><name name-style="western"><surname>Almarzooq</surname><given-names>ZI</given-names> </name><etal/></person-group><article-title>2024 heart disease and stroke statistics: a report of US and global data from the American Heart 
Association</article-title><source>Circulation</source><year>2024</year><month>02</month><day>20</day><volume>149</volume><issue>8</issue><fpage>e347</fpage><lpage>e913</lpage><pub-id pub-id-type="doi">10.1161/CIR.0000000000001209</pub-id><pub-id pub-id-type="medline">38264914</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Andrade</surname><given-names>JG</given-names> </name><name name-style="western"><surname>Champagne</surname><given-names>J</given-names> </name><name name-style="western"><surname>Dubuc</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Cryoballoon or radiofrequency ablation for atrial fibrillation assessed by continuous monitoring: a randomized clinical trial</article-title><source>Circulation</source><year>2019</year><month>11</month><day>26</day><volume>140</volume><issue>22</issue><fpage>1779</fpage><lpage>1788</lpage><pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.119.042622</pub-id><pub-id pub-id-type="medline">31630538</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Li</surname><given-names>DT</given-names> </name><name name-style="western"><surname>Qiu</surname><given-names>YG</given-names> </name><etal/></person-group><article-title>CHA2DS2-VASc score as a prognostic indicator in patients with atrial fibrillation undergoing coronary stenting</article-title><source>Turk J Med Sci</source><year>2022</year><month>08</month><volume>52</volume><issue>4</issue><fpage>1103</fpage><lpage>1110</lpage><pub-id pub-id-type="doi">10.55730/1300-0144.5413</pub-id><pub-id pub-id-type="medline">36326398</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation 
citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mulder</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Kemme</surname><given-names>MJB</given-names> </name><name name-style="western"><surname>Hopman</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Comparison of the predictive value of ten risk scores for outcomes of atrial fibrillation patients undergoing radiofrequency pulmonary vein isolation</article-title><source>Int J Cardiol</source><year>2021</year><month>12</month><day>1</day><volume>344</volume><fpage>103</fpage><lpage>110</lpage><pub-id pub-id-type="doi">10.1016/j.ijcard.2021.09.029</pub-id><pub-id pub-id-type="medline">34555444</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jacobs</surname><given-names>V</given-names> </name><name name-style="western"><surname>May</surname><given-names>HT</given-names> </name><name name-style="western"><surname>Bair</surname><given-names>TL</given-names> </name><etal/></person-group><article-title>The impact of risk score (CHADS2 versus CHA2DS2-VASc) on long-term outcomes after atrial fibrillation ablation</article-title><source>Heart Rhythm</source><year>2015</year><month>04</month><volume>12</volume><issue>4</issue><fpage>681</fpage><lpage>686</lpage><pub-id pub-id-type="doi">10.1016/j.hrthm.2014.12.034</pub-id><pub-id pub-id-type="medline">25546809</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kornej</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hindricks</surname><given-names>G</given-names> </name><name name-style="western"><surname>Arya</surname><given-names>A</given-names> </name><name 
name-style="western"><surname>Sommer</surname><given-names>P</given-names> </name><name name-style="western"><surname>Husser</surname><given-names>D</given-names> </name><name name-style="western"><surname>Bollmann</surname><given-names>A</given-names> </name></person-group><article-title>The APPLE score&#x2014;a novel score for the prediction of rhythm outcomes after repeat catheter ablation of atrial fibrillation</article-title><source>PLoS One</source><year>2017</year><volume>12</volume><issue>1</issue><fpage>e0169933</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0169933</pub-id><pub-id pub-id-type="medline">28085921</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kosich</surname><given-names>F</given-names> </name><name name-style="western"><surname>Schumacher</surname><given-names>K</given-names> </name><name name-style="western"><surname>Potpara</surname><given-names>T</given-names> </name><name name-style="western"><surname>Lip</surname><given-names>GY</given-names> </name><name name-style="western"><surname>Hindricks</surname><given-names>G</given-names> </name><name name-style="western"><surname>Kornej</surname><given-names>J</given-names> </name></person-group><article-title>Clinical scores used for the prediction of negative events in patients undergoing catheter ablation for atrial fibrillation</article-title><source>Clin Cardiol</source><year>2019</year><month>02</month><volume>42</volume><issue>2</issue><fpage>320</fpage><lpage>329</lpage><pub-id pub-id-type="doi">10.1002/clc.23139</pub-id><pub-id pub-id-type="medline">30578568</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shuvy</surname><given-names>M</given-names> </name><name 
name-style="western"><surname>Zwas</surname><given-names>DR</given-names> </name><name name-style="western"><surname>Keren</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gotsman</surname><given-names>I</given-names> </name></person-group><article-title>Value of the CHA<sub>2</sub>DS<sub>2</sub>-VASc score for predicting outcome in patients with heart failure</article-title><source>ESC Heart Fail</source><year>2020</year><volume>7</volume><issue>5</issue><fpage>2553</fpage><lpage>2560</lpage><pub-id pub-id-type="doi">10.1002/ehf2.12831</pub-id><pub-id pub-id-type="medline">32614479</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lip</surname><given-names>GYH</given-names> </name><name name-style="western"><surname>Nieuwlaat</surname><given-names>R</given-names> </name><name name-style="western"><surname>Pisters</surname><given-names>R</given-names> </name><name name-style="western"><surname>Lane</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Crijns</surname><given-names>HJGM</given-names> </name></person-group><article-title>Refining clinical risk stratification for predicting stroke and thromboembolism in atrial fibrillation using a novel risk factor-based approach: the Euro Heart Survey on atrial fibrillation</article-title><source>Chest</source><year>2010</year><month>02</month><volume>137</volume><issue>2</issue><fpage>263</fpage><lpage>272</lpage><pub-id pub-id-type="doi">10.1378/chest.09-1584</pub-id><pub-id pub-id-type="medline">19762550</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>AD</given-names> </name><name 
name-style="western"><surname>Lu</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>FF</given-names> </name><name name-style="western"><surname>Li</surname><given-names>ZC</given-names> </name></person-group><article-title>CHADS2 versus CHA2DS2-VASc score in assessing the stroke and thromboembolism risk stratification in patients with atrial fibrillation: a systematic review and meta-analysis</article-title><source>J Geriatr Cardiol</source><year>2013</year><month>09</month><volume>10</volume><issue>3</issue><fpage>258</fpage><lpage>266</lpage><pub-id pub-id-type="doi">10.3969/j.issn.1671-5411.2013.03.004</pub-id><pub-id pub-id-type="medline">24133514</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Winkle</surname><given-names>RA</given-names> </name><name name-style="western"><surname>Jarman</surname><given-names>JWE</given-names> </name><name name-style="western"><surname>Mead</surname><given-names>RH</given-names> </name><etal/></person-group><article-title>Predicting atrial fibrillation ablation outcome: the CAAP-AF score</article-title><source>Heart Rhythm</source><year>2016</year><month>11</month><volume>13</volume><issue>11</issue><fpage>2119</fpage><lpage>2125</lpage><pub-id pub-id-type="doi">10.1016/j.hrthm.2016.07.018</pub-id><pub-id pub-id-type="medline">27435586</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Van Gelder</surname><given-names>IC</given-names> </name><name name-style="western"><surname>Rienstra</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bunting</surname><given-names>KV</given-names> 
</name><etal/></person-group><article-title>2024 ESC Guidelines for the management of atrial fibrillation developed in collaboration with the European Association for Cardio-Thoracic Surgery (EACTS)</article-title><source>Eur Heart J</source><year>2024</year><month>09</month><day>29</day><volume>45</volume><issue>36</issue><fpage>3314</fpage><lpage>3414</lpage><pub-id pub-id-type="doi">10.1093/eurheartj/ehae176</pub-id><pub-id pub-id-type="medline">39210723</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Clarnette</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Brooks</surname><given-names>AG</given-names> </name><name name-style="western"><surname>Mahajan</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Outcomes of persistent and long-standing persistent atrial fibrillation ablation: a systematic review and meta-analysis</article-title><source>Europace</source><year>2018</year><month>11</month><day>1</day><volume>20</volume><issue>FI_3</issue><fpage>f366</fpage><lpage>f376</lpage><pub-id pub-id-type="doi">10.1093/europace/eux297</pub-id><pub-id pub-id-type="medline">29267853</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ngo</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ali</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ganesan</surname><given-names>A</given-names> </name><name name-style="western"><surname>Woodman</surname><given-names>R</given-names> </name><name name-style="western"><surname>Adams</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ranasinghe</surname><given-names>I</given-names> </name></person-group><article-title>Ten-year 
trends in mortality and complications following catheter ablation of atrial fibrillation</article-title><source>Eur Heart J Qual Care Clin Outcomes</source><year>2022</year><month>06</month><day>6</day><volume>8</volume><issue>4</issue><fpage>398</fpage><lpage>408</lpage><pub-id pub-id-type="doi">10.1093/ehjqcco/qcab102</pub-id><pub-id pub-id-type="medline">34982824</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ngo</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ali</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ganesan</surname><given-names>A</given-names> </name><name name-style="western"><surname>Woodman</surname><given-names>R</given-names> </name><name name-style="western"><surname>Adams</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ranasinghe</surname><given-names>I</given-names> </name></person-group><article-title>Gender differences in complications following catheter ablation of atrial fibrillation</article-title><source>Eur Heart J Qual Care Clin Outcomes</source><year>2021</year><month>09</month><day>16</day><volume>7</volume><issue>5</issue><fpage>458</fpage><lpage>467</lpage><pub-id pub-id-type="doi">10.1093/ehjqcco/qcab035</pub-id><pub-id pub-id-type="medline">33963402</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abdur Rehman</surname><given-names>K</given-names> </name><name name-style="western"><surname>Wazni</surname><given-names>OM</given-names> </name><name name-style="western"><surname>Barakat</surname><given-names>AF</given-names> </name><etal/></person-group><article-title>Life-threatening complications of atrial fibrillation ablation: 16-year experience in a large prospective tertiary 
care cohort</article-title><source>JACC Clin Electrophysiol</source><year>2019</year><month>03</month><volume>5</volume><issue>3</issue><fpage>284</fpage><lpage>291</lpage><pub-id pub-id-type="doi">10.1016/j.jacep.2018.11.013</pub-id><pub-id pub-id-type="medline">30898229</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Feeny</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Chung</surname><given-names>MK</given-names> </name><name name-style="western"><surname>Madabhushi</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Artificial intelligence and machine learning in arrhythmias and cardiac electrophysiology</article-title><source>Circ Arrhythm Electrophysiol</source><year>2020</year><month>08</month><volume>13</volume><issue>8</issue><fpage>e007952</fpage><pub-id pub-id-type="doi">10.1161/CIRCEP.119.007952</pub-id><pub-id pub-id-type="medline">32628863</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nyg&#x00E5;rds</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Hulting</surname><given-names>J</given-names> </name></person-group><article-title>An automated system for ECG monitoring</article-title><source>Comput Biomed Res</source><year>1979</year><month>04</month><volume>12</volume><issue>2</issue><fpage>181</fpage><lpage>202</lpage><pub-id pub-id-type="doi">10.1016/0010-4809(79)90015-6</pub-id><pub-id pub-id-type="medline">371910</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dey</surname><given-names>D</given-names> </name><name 
name-style="western"><surname>Slomka</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Leeson</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Artificial intelligence in cardiovascular imaging</article-title><source>J Am Coll Cardiol</source><year>2019</year><month>03</month><volume>73</volume><issue>11</issue><fpage>1317</fpage><lpage>1335</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2018.12.054</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huecker</surname><given-names>M</given-names> </name><name name-style="western"><surname>Schutzman</surname><given-names>C</given-names> </name><name name-style="western"><surname>French</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Accurate modeling of ejection fraction and stroke volume with mobile phone auscultation: prospective case-control study</article-title><source>JMIR Cardio</source><year>2024</year><month>06</month><day>26</day><volume>8</volume><fpage>e57111</fpage><pub-id pub-id-type="doi">10.2196/57111</pub-id><pub-id pub-id-type="medline">38924781</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>M&#x00FC;ller</surname><given-names>S</given-names> </name><name name-style="western"><surname>Diekmann</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wenzel</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Combining machine learning with real-world data to identify gaps in clinical practice guidelines: feasibility study using the prospective German Stroke Registry and the national acute ischemic stroke guidelines</article-title><source>JMIR Med 
Inform</source><year>2025</year><month>07</month><day>11</day><volume>13</volume><fpage>e69282</fpage><pub-id pub-id-type="doi">10.2196/69282</pub-id><pub-id pub-id-type="medline">40653745</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alhumaidi</surname><given-names>NH</given-names> </name><name name-style="western"><surname>Dermawan</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kamaruzaman</surname><given-names>HF</given-names> </name><name name-style="western"><surname>Alotaiq</surname><given-names>N</given-names> </name></person-group><article-title>The use of machine learning for analyzing real-world data in disease prediction and management: systematic review</article-title><source>JMIR Med Inform</source><year>2025</year><month>06</month><day>19</day><volume>13</volume><fpage>e68898</fpage><pub-id pub-id-type="doi">10.2196/68898</pub-id><pub-id pub-id-type="medline">40537090</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>MacKay</surname><given-names>EJ</given-names> </name><name name-style="western"><surname>Stubna</surname><given-names>MD</given-names> </name><name name-style="western"><surname>Chivers</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Application of machine learning approaches to administrative claims data to predict clinical outcomes in medical and surgical patient populations</article-title><source>PLoS One</source><year>2021</year><volume>16</volume><issue>6</issue><fpage>e0252585</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0252585</pub-id><pub-id pub-id-type="medline">34081720</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Deng</surname><given-names>H</given-names> </name><name name-style="western"><surname>Shantsila</surname><given-names>A</given-names> </name><name name-style="western"><surname>Xue</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Using the MB-LATER score for predicting arrhythmia outcome after catheter ablation for atrial fibrillation: the Guangzhou atrial fibrillation project</article-title><source>Int J Clin Pract</source><year>2018</year><month>11</month><volume>72</volume><issue>11</issue><fpage>e13247</fpage><pub-id pub-id-type="doi">10.1111/ijcp.13247</pub-id><pub-id pub-id-type="medline">30144238</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yuan</surname><given-names>N</given-names> </name><name name-style="western"><surname>Duffy</surname><given-names>G</given-names> </name><name name-style="western"><surname>Dhruva</surname><given-names>SS</given-names> </name><etal/></person-group><article-title>Deep learning of electrocardiograms in sinus rhythm from US veterans to predict atrial fibrillation</article-title><source>JAMA Cardiol</source><year>2023</year><month>12</month><day>1</day><volume>8</volume><issue>12</issue><fpage>1131</fpage><lpage>1139</lpage><pub-id pub-id-type="doi">10.1001/jamacardio.2023.3701</pub-id><pub-id pub-id-type="medline">37851434</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tseng</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Noseworthy</surname><given-names>PA</given-names> </name></person-group><article-title>Prediction of atrial fibrillation using machine learning: a review</article-title><source>Front 
Physiol</source><year>2021</year><volume>12</volume><fpage>752317</fpage><pub-id pub-id-type="doi">10.3389/fphys.2021.752317</pub-id><pub-id pub-id-type="medline">34777014</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chao</surname><given-names>TF</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>YJ</given-names> </name><name name-style="western"><surname>Tsao</surname><given-names>HM</given-names> </name><etal/></person-group><article-title>CHADS(2) and CHA(2)DS(2)-VASc scores in the prediction of clinical outcomes in patients with atrial fibrillation after catheter ablation</article-title><source>J Am Coll Cardiol</source><year>2011</year><month>11</month><day>29</day><volume>58</volume><issue>23</issue><fpage>2380</fpage><lpage>2385</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2011.08.045</pub-id><pub-id pub-id-type="medline">22115643</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Levinson</surname><given-names>RT</given-names> </name><name name-style="western"><surname>Paul</surname><given-names>C</given-names> </name><name name-style="western"><surname>Meid</surname><given-names>AD</given-names> </name><name name-style="western"><surname>Schultz</surname><given-names>JH</given-names> </name><name name-style="western"><surname>Wild</surname><given-names>B</given-names> </name></person-group><article-title>Identifying predictors of heart failure readmission in patients from a statutory health insurance database: retrospective machine learning study</article-title><source>JMIR Cardio</source><year>2024</year><month>07</month><day>23</day><volume>8</volume><fpage>e54994</fpage><pub-id pub-id-type="doi">10.2196/54994</pub-id><pub-id 
pub-id-type="medline">39042456</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="web"><article-title>ICD code lookup website</article-title><source>ICD Code Lookup</source><year>2024</year><access-date>2025-12-16</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://icdcodelookup.com">https://icdcodelookup.com</ext-link></comment></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Charlson</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Pompei</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ales</surname><given-names>KL</given-names> </name><name name-style="western"><surname>MacKenzie</surname><given-names>CR</given-names> </name></person-group><article-title>A new method of classifying prognostic comorbidity in longitudinal studies: development and validation</article-title><source>J Chronic Dis</source><year>1987</year><volume>40</volume><issue>5</issue><fpage>373</fpage><lpage>383</lpage><pub-id pub-id-type="doi">10.1016/0021-9681(87)90171-8</pub-id><pub-id pub-id-type="medline">3558716</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Elixhauser</surname><given-names>A</given-names> </name><name name-style="western"><surname>Steiner</surname><given-names>C</given-names> </name><name name-style="western"><surname>Harris</surname><given-names>DR</given-names> </name><name name-style="western"><surname>Coffey</surname><given-names>RM</given-names> </name></person-group><article-title>Comorbidity measures for use with administrative data</article-title><source>Med Care</source><year>1998</year><month>01</month><volume>36</volume><issue>1</issue><fpage>8</fpage><lpage>27</lpage><pub-id 
pub-id-type="doi">10.1097/00005650-199801000-00004</pub-id><pub-id pub-id-type="medline">9431328</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Guestrin</surname><given-names>C</given-names> </name></person-group><article-title>XGBoost: a scalable tree boosting system</article-title><conf-name>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name><conf-date>Aug 13-17, 2016</conf-date><conf-loc>San Francisco, CA, USA</conf-loc><fpage>785</fpage><lpage>794</lpage><pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Desai</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>SV</given-names> </name><name name-style="western"><surname>Vaduganathan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Evers</surname><given-names>T</given-names> </name><name name-style="western"><surname>Schneeweiss</surname><given-names>S</given-names> </name></person-group><article-title>Comparison of machine learning methods with traditional models for use of administrative claims with electronic medical records to predict heart failure outcomes</article-title><source>JAMA Netw Open</source><year>2020</year><month>01</month><day>3</day><volume>3</volume><issue>1</issue><fpage>e1918962</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2019.18962</pub-id><pub-id pub-id-type="medline">31922560</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Zeltzer</surname><given-names>D</given-names> </name><name name-style="western"><surname>Balicer</surname><given-names>RD</given-names> </name><name name-style="western"><surname>Shir</surname><given-names>T</given-names> </name><name name-style="western"><surname>Flaks-Manov</surname><given-names>N</given-names> </name><name name-style="western"><surname>Einav</surname><given-names>L</given-names> </name><name name-style="western"><surname>Shadmi</surname><given-names>E</given-names> </name></person-group><article-title>Prediction accuracy with electronic medical records versus administrative claims</article-title><source>Med Care</source><year>2019</year><month>07</month><volume>57</volume><issue>7</issue><fpage>551</fpage><lpage>559</lpage><pub-id pub-id-type="doi">10.1097/MLR.0000000000001135</pub-id><pub-id pub-id-type="medline">31135691</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="web"><article-title>yijunliu23/AFA-Claims-CodeRelease</article-title><source>GitHub</source><access-date>2025-12-23</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/yijunliu23/AFA-Claims-CodeRelease">https://github.com/yijunliu23/AFA-Claims-CodeRelease</ext-link></comment></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pedregosa</surname><given-names>F</given-names> </name><name name-style="western"><surname>Varoquaux</surname><given-names>G</given-names> </name><name name-style="western"><surname>Gramfort</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Scikit-learn: machine learning in Python</article-title><source>J Mach Learn Res</source><year>2011</year><volume>12</volume><fpage>2825</fpage><lpage>2830</lpage><pub-id 
pub-id-type="doi">10.5555/1953048.2078195</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Logistic regression results.</p><media xlink:href="cardio_v9i1e77380_app1.docx" xlink:title="DOCX File, 3252 KB"/></supplementary-material></app-group></back></article>