<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Cardio</journal-id><journal-id journal-id-type="publisher-id">cardio</journal-id><journal-id journal-id-type="index">26</journal-id><journal-title>JMIR Cardio</journal-title><abbrev-journal-title>JMIR Cardio</abbrev-journal-title><issn pub-type="epub">2561-1011</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e60238</article-id><article-id pub-id-type="doi">10.2196/60238</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Causal Inference for Hypertension Prediction With Wearable Electrocardiogram and Photoplethysmogram Signals: Feasibility Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Gong</surname><given-names>Ke</given-names></name><degrees>MEng</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chen</surname><given-names>Yifan</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Song</surname><given-names>Xinyue</given-names></name><degrees>MEng</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Fu</surname><given-names>Zhizhong</given-names></name><degrees>MEng</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Ding</surname><given-names>Xiaorong</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1"/></contrib></contrib-group><aff id="aff1"><institution>School of Life Science and Technology, University of Electronic Science and Technology of China</institution><addr-line>Research Building C348A, 3rd Fl</addr-line><addr-line>Chengdu</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Jain</surname><given-names>Ashish</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Vlad</surname><given-names>Letitia</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Tian</surname><given-names>Xin</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Xiao</surname><given-names>Xinqing</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Xiaorong Ding, PhD, School of Life Science and Technology, University of Electronic Science and Technology of China, Research Building C348A, 3rd Fl, Chengdu, 611731, China, 86 18030493605; <email>xiaorong.ding@uestc.edu.cn</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>23</day><month>1</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e60238</elocation-id><history><date date-type="received"><day>06</day><month>05</month><year>2024</year></date><date date-type="rev-recd"><day>21</day><month>10</month><year>2024</year></date><date date-type="accepted"><day>21</day><month>10</month><year>2024</year></date></history><copyright-statement>&#x00A9; Ke Gong, Yifan Chen, Xinyue Song, Zhizhong Fu, Xiaorong Ding. Originally published in JMIR Cardio (<ext-link ext-link-type="uri" xlink:href="https://cardio.jmir.org">https://cardio.jmir.org</ext-link>), 23.1.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Cardio, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://cardio.jmir.org">https://cardio.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://cardio.jmir.org/2025/1/e60238"/><abstract><sec><title>Background</title><p>Hypertension is a leading cause of cardiovascular disease and premature death worldwide, and it puts a heavy burden on the health care system. Therefore, it is very important to detect and evaluate hypertension and related cardiovascular events to enable early prevention, detection, and management. Hypertension can be detected in a timely manner with cardiac signals, such as through an electrocardiogram (ECG) and photoplethysmogram (PPG), which can be observed via wearable sensors. Most previous studies predicted hypertension from ECG and PPG signals with extracted features that are correlated with hypertension. However, correlation is sometimes unreliable and may be affected by confounding factors.</p></sec><sec><title>Objective</title><p>The aim of this study was to investigate the feasibility of predicting the risk of hypertension by exploring features that are causally related to hypertension via causal inference methods. Additionally, we paid special attention to and verified the reliability and effectiveness of causality compared to correlation.</p></sec><sec sec-type="methods"><title>Methods</title><p>We used a large public dataset from the Aurora Project, which was conducted by Microsoft Research. The dataset included diverse individuals who were balanced in terms of gender, age, and the condition of hypertension, with their ECG and PPG signals simultaneously acquired with wrist-worn wearable devices. We first extracted 205 features from the ECG and PPG signals, calculated 6 statistical metrics for these 205 features, and selected some valuable features out of the 205 features under each statistical metric. Then, 6 causal graphs of the selected features for each kind of statistical metric and hypertension were constructed with the equivalent greedy search algorithm. We further fused the 6 causal graphs into 1 causal graph and identified features that were causally related to hypertension from the causal graph. Finally, we used these features to detect hypertension via machine learning algorithms.</p></sec><sec sec-type="results"><title>Results</title><p>We validated the proposed method on 405 subjects. We identified 24 causal features that were associated with hypertension. The causal features could detect hypertension with an accuracy of 89%, precision of 92%, and recall of 82%, which outperformed detection with correlation features (accuracy of 85%, precision of 88%, and recall of 77%).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The results indicated that the causal inference&#x2013;based approach can potentially clarify the mechanism of hypertension detection with noninvasive signals and effectively detect hypertension. It also revealed that causality can be more reliable and effective than correlation for hypertension detection and other application scenarios.</p></sec></abstract><kwd-group><kwd>hypertension</kwd><kwd>causal inference</kwd><kwd>wearable physiological signals</kwd><kwd>electrocardiogram</kwd><kwd>photoplethysmogram</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Hypertension, also known as high blood pressure (BP), is a condition in which the pressure of the blood increases in the arteries. The diagnosis of hypertension relies on BP measurement, and it is defined as systolic BP (SBP) &#x2265;140 mm Hg or diastolic BP (DBP) &#x2265;90 mm Hg [<xref ref-type="bibr" rid="ref1">1</xref>]. Hypertension can be further classified into 3 stages. Stage 1 hypertension is associated with SBP and DBP ranges of 140&#x2010;159 mm Hg and 90&#x2010;99 mm Hg, respectively. Stage 2 hypertension is characterized by SBP and DBP ranges of 160&#x2010;179 mm Hg and 100&#x2010;109 mm Hg, respectively. For stage 3 hypertension, the SBP and DBP are more than 180 mm Hg and 110 mm Hg [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>].</p><p>Furthermore, it is noteworthy that even when SBP &#x2265;115 mm Hg and DBP &#x2265;75 mm Hg, a continuous relationship exists between the increase in BP level and the occurrence of cardiovascular or renal pathological conditions and even fatal events. The definition of high blood pressure as SBP &#x2265;140 mm Hg or DBP &#x2265;90 mm Hg primarily serves the purpose of simplifying hypertension diagnosis and decision-making regarding hypertension treatment. This threshold was chosen because the benefits of intervention outweigh the risks associated with nonintervention in this context.</p><p>According to a review of the global epidemiology of hypertension [<xref ref-type="bibr" rid="ref3">3</xref>], hypertension is a leading preventable risk factor for cardiovascular disease and all-cause mortality worldwide. In 2010, a total of 1.38 billion people (31.1% of the global adult population) had hypertension. The prevalence of hypertension is rising globally owing to the aging of the population and increases in exposure to lifestyle risk factors, including unhealthy diets and lack of physical activity.</p><p>In addition, hypertension can be divided into primary and secondary forms. Secondary hypertension originates from specific causes and only encompasses a small fraction of the population. Primary hypertension covers the remaining large fraction of the hypertension population, and it arises from intricate interactions among genetic factors, environmental influences, and the aging process. These factors collectively contribute to an increase in systemic vascular resistance, a hallmark hemodynamic abnormality that leads to elevated BP in almost all hypertensive individuals [<xref ref-type="bibr" rid="ref4">4</xref>]. Furthermore, considering that hypertension may not show any symptoms in its early stages and that there is a continuous relationship between an increase in BP and the risk of stroke, coronary heart disease, heart failure, and chronic kidney disease, it is very important to detect and treat hypertension in the early stages.</p><p>Moreover, physicians often diagnose hypertension by office BP, but masked hypertension and white coat hypertension cannot be effectively detected by office BP. Instead, they usually detect masked hypertension and white coat hypertension through a 24-hour ambulatory recording of the BP signal [<xref ref-type="bibr" rid="ref5">5</xref>], but this process is cumbersome. Hence, there are data-driven approaches based on noninvasive signals for the detection of hypertension, such as electrocardiogram (ECG) or photoplethysmogram (PPG), that are easily accessible from wearable sensors [<xref ref-type="bibr" rid="ref2">2</xref>]. Subsequently, wearable monitoring can continuously monitor patients&#x2019; physiological conditions 24 hours a day. Compared with outpatient blood pressure monitoring, wearable monitoring can obtain patients&#x2019; rhythm information and real physiological conditions (to avoid white coat hypertension and other conditions), as well as the impact of patients&#x2019; behaviors on physiological indicators and other personalized information. Rich reference information is conducive to more accurate assessment and stratification of individual risks.</p><p>There are various studies on detecting hypertension with data-driven methods based on noninvasive signals. These methods include classic machine learning models with hand-extracted features and feature representation learning with deep learning methods. For example, Paragliola et al [<xref ref-type="bibr" rid="ref6">6</xref>] proposed a novel approach for analyzing and classifying the ECG signal with a hybrid deep learning network method called hybrid deep network, which combines long short-term memory, convolutional neural networks, and deep neural networks. The hybrid method can reach an average accuracy of 0.98 and an average sensitivity and specificity of 0.97. Elgendi et al [<xref ref-type="bibr" rid="ref7">7</xref>] reviewed the effect of different types of artifacts added to the PPG signal, characteristic features of the PPG waveform, and existing indexes on hypertension diagnosis. In another study, Alkhodari et al [<xref ref-type="bibr" rid="ref8">8</xref>] used features related to heart rate variability to predict hypertension based on decision trees and random undersampling boosting. The accuracy of the method was 0.81, with the <italic>F</italic><sub>1</sub>-score and area under the receiver operating characteristic curve (AUC) being 0.86 and 0.89, respectively. In a study about the automated detection of hypertension severity, Rajput et al [<xref ref-type="bibr" rid="ref9">9</xref>] developed a 2-band optimal orthogonal wavelet filter bank method, which generates 6 subbands from each ECG signal through a 5-level wavelet decomposition. Further, the sample mean and wavelet entropy features of all subbands were computed to predict the risk of hypertension with classic machine learning methods, such as k-nearest neighbors and support vector machine, and the proposed method can achieve an average classification accuracy of 0.99.</p><p>However, most of the previously mentioned studies relied on extracting features correlated with hypertension but ignored the causality of hypertension and characteristic variables. Due to the presence of confounding factors, correlations can lead to wrong conclusions, just like Simpson&#x2019;s paradox [<xref ref-type="bibr" rid="ref10">10</xref>]. In different populations, the distribution of confounding factors will change, which means the correlations can be unstable and unreliable. Instead, causal inference can not only identify more reliable feature variables with the elimination of confounding factors but also provide more trustworthy guidance for further exploring the physiological mechanisms of hypertension [<xref ref-type="bibr" rid="ref11">11</xref>].</p><p>In this work, we propose to predict hypertension based on causal inference with wearable noninvasive signals. The overview of the proposed method is delineated in <xref ref-type="fig" rid="figure1">Figures 1</xref> and <xref ref-type="fig" rid="figure2">2</xref>. We will select effective features based on causality between hypertension and features extracted from PPG and ECG signals. Then, combined with the detected causal features, we will predict hypertension and evaluate its prediction performance by various evaluation metrics. Ultimately, we aim to identify some features that may be of great value in predicting hypertension.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Research route flow chart.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig01.png"/></fig><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Flowchart of the causal inference for hypertension prediction. (A) Signal preprocessing: 205-dimension beat-by-beat features were extracted from the ECG and PPG as well as the first and second derivatives of the PPG signal (dPPG, sdPPG), and the statistical metrics of these features were calculated as the feature matrix M. (B) Based on the feature matrix M, the causal graphs of the extracted features and hypertension status were identified with the causal inference algorithm (the equivalent greedy search algorithm). (C) The causal feature matrix F was identified from the causal graph obtained from step (B), and we used machine learning classification algorithms to achieve hypertension prediction. ECG: electrocardiogram; PPG: photoplethysmogram.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig02.png"/></fig></sec><sec id="s2" sec-type="methods"><title>Methods</title><p>The methods of this paper can be divided into 7 steps; the details of each step are shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><sec id="s2-1"><title>Ethical Considerations</title><p>In this study, we used data from the Microsoft Waveform Database, and we obtained data access permission from the Microsoft Data Access Committee [<xref ref-type="bibr" rid="ref12">12</xref>]. Microsoft obtained institutional review board approval from WCG IRB (Puyallup, WA, United States). Individuals unable to consent in English, pregnant women, prisoners, institutionalized individuals, and individuals younger than 18 years were excluded from participation due to their vulnerable status. All the subjects voluntarily participated in the experiment and signed informed consent. The original informed consent and the institutional review board both allow for secondary analysis without additional consent. The dataset used in this study was de-identified to protect the privacy of the subjects.</p></sec><sec id="s2-2"><title>Data</title><p>The database that we obtained data from was developed for validating new methods for blood pressure measurement with noninvasive sensors. Noninvasive epidermal pressure signals, ECG signals, and PPG signals were acquired with tension, electrical, and optical sensors, respectively. Meanwhile, the reference blood pressure was measured with either the oscillometric method or the auscultatory method. In this study, we used noninvasive signals for hypertension detection. To validate our proposed method, we used data collected based on the oscillometric method. A total of 614 subjects participated in the oscillometric protocol scheme, with ages ranging from 18-85 years. After excluding data anomalies during the collection process, including miswear, malfunction, data file failure, participant opt-out, alignment failure, and quality failure, relevant measurement information from 483 subjects was retained [<xref ref-type="bibr" rid="ref12">12</xref>]. In a further waveform preprocessing step, poor waveform segments and subjects with less than 4 qualified waveform segments were removed, which led to the final retention of measurement data from 405 participants, comprising 183 hypertensive patients and 222 healthy individuals. The ages of the 405 participants ranged from 18-60 years, with an average age of 45 years. In addition, the 405 participants comprised 199 females and 206 males.</p><p>Moreover, measurements in this protocol were obtained during controlled laboratory visits spaced at least 24 hours apart. Additionally, dynamic measurements were collected during the 24-hour interval between laboratory visits. Automatic measurements were taken every 30 minutes in the morning and every 60 minutes in the evening. Each patient typically had 24-36 waveform segments, with each acquired for 15-30 seconds. Our feature extraction primarily relied on data from dynamic measurements.</p></sec><sec id="s2-3"><title>Feature Extraction</title><p>We extracted 205 features from the filtered ECG and PPG signals with the extraction method defined in our previous study [<xref ref-type="bibr" rid="ref13">13</xref>]. The features mainly include pulse transit time (PTT), time duration (TD), amplitude (AM), intensity of PPG, the first derivative of PPG (dPPG), the second derivative of PPG (sdPPG), area under the PPG curve (AR), and physiological meaningful relative index (RI). The mathematical expression and definition of these features are as follows and are also described in <xref ref-type="table" rid="table1">Table 1</xref>. The fiducial points of ECG, PPG, dPPG, and sdPPG signals of each cardiac cycle were identified to calculate the features. The identified fiducial points are illustrated in <xref ref-type="fig" rid="figure3">Figure 3</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Features extracted from electrocardiogram and photoplethysmogram signals.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Index</td><td align="left" valign="bottom">Classification</td><td align="left" valign="bottom">Definition of features</td></tr></thead><tbody><tr><td align="left" valign="top">1&#x2010;10</td><td align="left" valign="top">Pulse transit time</td><td align="left" valign="top">Time deviation between R peak of electrocardiogram and fiducial points of photoplethysmogram</td></tr><tr><td align="left" valign="top">11&#x2010;66</td><td align="left" valign="top">Time duration</td><td align="left" valign="top">Time duration between 2 fiducial points of photoplethysmogram</td></tr><tr><td align="left" valign="top">67&#x2010;111</td><td align="left" valign="top">Amplitude</td><td align="left" valign="top">Amplitude between fiducial points of photoplethysmogram</td></tr><tr><td align="left" valign="top">112&#x2010;130</td><td align="left" valign="top">Pulse intensity</td><td align="left" valign="top">Intensity of photoplethysmogram, dPPG<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>, and sdPPG<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> at fiducial points</td></tr><tr><td align="left" valign="top">131&#x2010;185</td><td align="left" valign="top">Area</td><td align="left" valign="top">Area under the photoplethysmogram curve between fiducial points</td></tr><tr><td align="left" valign="top">186&#x2010;205</td><td align="left" valign="top">Relative index</td><td align="left" valign="top">Physiological meaningful ratio index</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>dPPG: the first derivative of photoplethysmogram.</p></fn><fn id="table1fn2"><p><sup>b</sup>sdPPG: the second derivative of photoplethysmogram.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Diagram of fiducial points of the ECG and PPG signals as well as major types of features [<xref ref-type="bibr" rid="ref13">13</xref>]. AI: absolute intensity; AR: area under the PPG curve; AM: amplitude; dPPG: the first derivative of PPG; ECG: electrocardiogram; PPG: photoplethysmogram; PTT: pulse transit time; PW: pulse width; RRI: R-R interval; sdPPG: the second derivative of PPG.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig03.png"/></fig><p><italic>Feature Point (FP, 1</italic>&#x223C;<italic>10</italic>) = [PPG valley, sdPPG a, dPPG peak, sdPPG a, PPG peak, sdPPG c, sdPPG d, dPPG valley, sdPPG e, sdPPG f, PPG valley next]</p><p><italic>PTT</italic> = FP(i) - R peak, i=1&#x223C;10</p><p><italic>TD</italic> = [RRI, (FP(j) - FP(i)), i,j=1&#x223C;10, and <italic>j&#x003E;i</italic>]</p><p><italic>AM</italic> = PPG(FP(j)) - PPG(FP(i)), i=1&#x223C;10, and <italic>j&#x003E;i</italic></p><p><italic>AIPPG</italic> = PPG(FP(i)), i=1&#x223C;10</p><p><italic>AIdPPG</italic> = dPPG(FP(i)), i=1&#x223C;10</p><p><italic>AIsdPPG</italic> = sdPPG(FP(i)), i=2,4,7&#x223C;10</p><p><italic>AR</italic> = Area between (FP(j) &#x2013; FP(i)), i,j=1&#x223C;10</p><p><italic>RI</italic>: relative rising time, dicrotic diastolic ratio, augmentation index, inflection point area point, slope transit time, ratio of sdPPG (b/a, c/a, (c+d&#x2013;b)/a, etc), PPG intensity ratio, perfusion index [<xref ref-type="bibr" rid="ref13">13</xref>].</p><p>After obtaining the above features, we can perform feature selection and build a causal graph based on the causal inference algorithm.</p></sec><sec id="s2-4"><title>Algorithm of Causal Inference</title><p>We used the greedy equivalence search (GES) algorithm to learn the causal graph. The GES algorithm is based on the theoretical basis of Meek&#x2019;s conjecture [<xref ref-type="bibr" rid="ref14">14</xref>]. The Meek&#x2019;s conjecture is: if direct acyclic graph (DAG) M is an independent map of another DAG F, then there exists a finite set of edges in DAG F that can be added or reversed, after each modifiable edge is added or reversed direction, DAG M is still an independent graph of DAG F. After all modifications are done, M = F. Underlying the Meek&#x2019;s conjecture, we can use generalized score functions [<xref ref-type="bibr" rid="ref15">15</xref>] and the GES algorithm to get the final causal graph. <xref ref-type="fig" rid="figure4">Figure 4</xref> shows the implementation steps of the GES algorithm. In addition, we also provide the pseudo code to illustrate the detailed steps of the GES algorithm as shown in <xref ref-type="other" rid="box1">Textbox 1</xref>.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Flowchart of the greedy equivalence search algorithm.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig04.png"/></fig><boxed-text id="box1"><title> Algorithm 1: Apply-edge-operation(<inline-formula><mml:math id="ieqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula>,<inline-formula><mml:math id="ieqn2"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">H</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula>).</title><p>Input: <inline-formula><mml:math id="ieqn3"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>D</mml:mi><mml:mi>A</mml:mi><mml:msub><mml:mi>G</mml:mi><mml:mrow><mml:mi>s</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mstyle></mml:math></inline-formula><inline-formula><mml:math id="ieqn4"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn5"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">H</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> where <inline-formula><mml:math id="ieqn6"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mo>&#x2264;</mml:mo><mml:mrow><mml:mi mathvariant="fraktur">H</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn7"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mo>&#x2260;</mml:mo><mml:mrow><mml:mi mathvariant="fraktur">H</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>1: Set <inline-formula><mml:math id="ieqn8"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>&#x2032;</mml:mo></mml:mrow></mml:mrow></mml:msup><mml:mo stretchy="false">&#x2190;</mml:mo><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>2: While <inline-formula><mml:math id="ieqn9"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn10"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">H</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> contain a node Y that is a sink node in both <inline-formula><mml:math id="ieqn11"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>D</mml:mi><mml:mi>A</mml:mi><mml:msub><mml:mi>G</mml:mi><mml:mrow><mml:mi>s</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mstyle></mml:math></inline-formula> and for which <inline-formula><mml:math id="ieqn12"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>P</mml:mi><mml:msubsup><mml:mi>a</mml:mi><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mi>G</mml:mi></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mi>P</mml:mi><mml:msubsup><mml:mi>a</mml:mi><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:mstyle></mml:math></inline-formula>, remove Y and all incident edges from both <inline-formula><mml:math id="ieqn13"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>D</mml:mi><mml:mi>A</mml:mi><mml:msub><mml:mi>G</mml:mi><mml:mrow><mml:mi>s</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>3: end while</p><p>4: Let Y be any sink node in <inline-formula><mml:math id="ieqn14"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">H</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>5: if Y has no children in <inline-formula><mml:math id="ieqn15"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> then</p><p><named-content content-type="indent">&#x2003;</named-content>6: Let X be any parent of Y in <inline-formula><mml:math id="ieqn16"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">H</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> that is not a parent of</p><p><named-content content-type="indent">&#x2003;</named-content>7: Y in <inline-formula><mml:math id="ieqn17"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula>, add the edge <inline-formula><mml:math id="ieqn18"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="normal">X</mml:mi></mml:mrow><mml:mo stretchy="false">&#x2192;</mml:mo><mml:mrow><mml:mi mathvariant="normal">Y</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p><named-content content-type="indent">&#x2003;</named-content>8: return <inline-formula><mml:math id="ieqn19"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>&#x2032;</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>9: end if</p><p>10: Let <inline-formula><mml:math id="ieqn20"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="normal">D</mml:mi></mml:mrow><mml:msubsup><mml:mrow><mml:mi mathvariant="normal">e</mml:mi></mml:mrow><mml:mrow><mml:mi>Y</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:msubsup></mml:mrow></mml:mstyle></mml:math></inline-formula> denote the descendants of Y in<inline-formula><mml:math id="ieqn21"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>11: And let D &#x2208; DeY G denote the (unique) maximal element from this set within &#x210B;2</p><p>12: Let Z be any maximal child of Y in <inline-formula><mml:math id="ieqn22"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> such that <inline-formula><mml:math id="ieqn23"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> is a descendant of Y in <inline-formula><mml:math id="ieqn24"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>13: if <inline-formula><mml:math id="ieqn25"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="normal">Y</mml:mi></mml:mrow><mml:mo stretchy="false">&#x2192;</mml:mo><mml:mrow><mml:mi mathvariant="normal">Z</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> is covered in <inline-formula><mml:math id="ieqn26"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p><named-content content-type="indent">&#x2003;</named-content>14: reverse <inline-formula><mml:math id="ieqn27"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="normal">Y</mml:mi></mml:mrow><mml:mo stretchy="false">&#x2192;</mml:mo><mml:mrow><mml:mi mathvariant="normal">Z</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> in <inline-formula><mml:math id="ieqn28"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>&#x2032;</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p><named-content content-type="indent">&#x2003;</named-content>15: Return <inline-formula><mml:math id="ieqn29"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>&#x2032;</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>16: end if</p><p>17: if There exists a node X that is a parent of Y but not a parent of Z in <inline-formula><mml:math id="ieqn30"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>&#x2032;</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math></inline-formula> then</p><p><named-content content-type="indent">&#x2003;</named-content>18: add <inline-formula><mml:math id="ieqn31"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="normal">X</mml:mi></mml:mrow><mml:mo stretchy="false">&#x2192;</mml:mo><mml:mrow><mml:mi mathvariant="normal">Z</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> to <inline-formula><mml:math id="ieqn32"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>&#x2032;</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p><named-content content-type="indent">&#x2003;</named-content>19: return <inline-formula><mml:math id="ieqn33"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>&#x2032;</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>20: end if</p><p>21: Let X be any parent of Z that is not a parent of Y</p><p>22: Add <inline-formula><mml:math id="ieqn34"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="normal">Y</mml:mi></mml:mrow><mml:mo stretchy="false">&#x2192;</mml:mo><mml:mrow><mml:mi mathvariant="normal">Y</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula> to <inline-formula><mml:math id="ieqn35"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>&#x2032;</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>23: return <inline-formula><mml:math id="ieqn36"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>&#x2032;</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>Output: DAG <inline-formula><mml:math id="ieqn37"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mo>&#x2032;</mml:mo></mml:mrow></mml:mrow></mml:msup></mml:mrow></mml:mstyle></mml:math></inline-formula> that results from adding or reversing an edge in <inline-formula><mml:math id="ieqn38"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mrow><mml:mi mathvariant="fraktur">G</mml:mi></mml:mrow></mml:mrow></mml:mstyle></mml:math></inline-formula>.</p></boxed-text><p>Then, the GES algorithm has 2 stages. In the first stage, it starts from an equivalence class (empty graph) with no dependencies and keeps adding possible edges to search for the largest equivalence class of generalized scoring functions until the scoring functions&#x2019; local maximum is reached. Then, in the second stage, the greedy principle is used to gradually delete the directed edges until the generalized scoring function reaches the local maximum again, and the final causal graph is obtained.</p><p>Considering that hypertension is a discrete variable while the feature variables are continuous, we are essentially dealing with mixed data. Traditional scoring functions such as Bayesian information criterion and Bayesian Dirichlet equivalent uniform do not take into account the issue of mixed data; for example, it discretizes continuous data and process it uniformly, resulting in a loss of valuable information. Therefore, we introduce a generalized scoring function to replace traditional scoring functions. The generalized function is primarily based on kernels and handles linear causal relationships, nonlinear causal relationships, continuous variables, discrete variables, and mixed data in a uniform manner, maximizing information retention. Finally, this scoring function addresses the issue of Markov equivalence classes, to some extent, overcoming the limitation of equivalence greedy search algorithms in distinguishing Markov equivalence classes.</p><p>Finally, we needed to organize a feature matrix in which each row represents a sample and each column represents a kind of feature, then input this matrix into the equivalent greedy search algorithm to obtain the causal graph. Prior to this, feature selection is a necessary step to construct the feature matrix.</p></sec><sec id="s2-5"><title>Feature Selection</title><p>This section mainly explains the specific process of feature selection in this study, which is mainly divided into the following 3 parts. After completing feature selection, we will perform causal strategy and causal graph construction.</p><list list-type="order"><list-item><p>Six statistical metrics: Since ECG and PPG signals are time series data, we extracted the beat-by-beat features and calculated the statistical metrics of these 205 features to represent the temporal variability information. The statistical metrics include: standard deviation, range, mean, quartile deviation, coefficient of variation, and median, which result in 205&#x00D7;6=1230 dimensional features. This allows us to capture and analyze the temporal characteristics of ECG and PPG signals while summarizing them using key statistical measures. Based on the extracted features, we then detected the 6 different causal graphs of these features with hypertension, which provide insights into the relationships and causal effects among the extracted feature variables and hypertension.</p></list-item><list-item><p>Significant difference analysis: Now, we need to use the corresponding 205 features to construct a causal graph under each metric. Due to the limitations of the equivalent greedy search algorithm calculation efficiency, hardware device computing power resources, and the number of subject samples, the time cost of constructing a causal graph based on 205 features is unacceptable. Therefore, we will use significant difference analysis to exclude features that do not show significant differences between hypertensive patients and healthy people. Then, considering the time cost and sample size, we will sort the retained features according to the degree of significant difference. We ultimately selected less than 50 features for causal graph construction.</p></list-item><list-item><p>Causal feature selection: In the following, we select the features that have a direct causal relationship with the hypertension node from the causal graph constructed under each metric. A total of 24 causal features were selected under the 6 metrics. It should be noted here that different metrics mean observing the changes of the same feature over a period of time from different perspectives. The features with the same number under different statistical metrics are essentially derivatives of the original features. Taking feature 52 as an example, we can get 4 feature variables under these metrics; they are shown in <xref ref-type="fig" rid="figure5">Figure 5</xref>. These 4 feature variables are essentially derivatives of feature 52. Therefore, in the final causal graph, we use feature 52 nodes to represent the above 4 features. From this, we can see that there are some features with the same number among the 24 causal features. We can use a feature node in the final causal graph to represent these feature variables with the same number, and finally obtain a final causal graph containing 10 feature nodes.</p></list-item></list><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Box plot of the various statistical indicators of the feature 52.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig05.png"/></fig></sec><sec id="s2-6"><title>Strategy of Causal Inference</title><p>In order to mitigate the potential issues of bidirectional causality and cyclic graphs, we conducted the analysis of the causal relationships between respective feature variables and hypertension under each indicator, culminating in the derivation of corresponding causal subgraphs, so as to obtain the causal graph.</p><list list-type="order"><list-item><p>Strategy for obtaining causal graph: We randomly partitioned the dataset to identify the causal graph, with the allocation of an additional validation set for subsequent hypertension risk prediction. Recognizing that a single random partitioning could introduce undesired stochasticity (thereby rendering the resulting causal graphs potentially unrepresentative), we draw inspiration from the concept of 10-fold cross-validation. This method involves conducting 10 iterations to compute causal subgraphs, followed by a rigorous pruning process to retain only those segments demonstrating direct causal associations with hypertension within each causal subgraph. Subsequently, guided by the principle of majority rule, we amalgamate the results of these iterations to derive the ultimate causal subgraph.</p></list-item><list-item><p>Strategy for merging causal graph: After obtaining the final causal subgraph with each graph identified with the 6 categories of features mentioned in feature selection section, we assume that the weights of the causal relationships between the feature variables and hypertension are equal under each category of feature; based on the principle of majority rule, we integrate multiple causal subgraphs into the ultimate causal graph. This method can screen out more reliable direct causal feature variables, further simplify the causal graph, and preserve important information.</p></list-item></list></sec><sec id="s2-7"><title>Classifier and Performance Evaluation</title><p>In conjunction with a 10-fold cross-validation approach to partition the dataset into training and testing sets, our predictive modeling of hypertension risk primarily leverages 4 classification algorithms: random forest, logistic regression, decision trees, and naive Bayes. These algorithms are selected for their effectiveness in capturing diverse patterns in the data. Moreover, the evaluation of our models is based on a comprehensive set of performance metrics, encompassing accuracy, precision, recall, <italic>F</italic><sub>1</sub>-score, and the AUC, which are defined later on. Following the derivation of the final causal diagram, we proceeded to select an equal number of feature variables with the strongest correlation to hypertension, based on the point-biserial correlation coefficient. These selected features were then used in the prediction of hypertension risk. Subsequently, we compared the predictive performance of this model with the one based on causal feature variables.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Signal and Feature Analysis</title><p>We found that there are 24 feature variables directly causally related to hypertension under 6 indicators. These can be abstracted into 10 representative feature variables in the causal graph. Then, we used the point-biserial correlation coefficient to select the 24 feature variables with the strongest correlation to hypertension. After conducting data analysis, we discovered that there are 5 feature variables that overlap between the causal feature variables and the correlated feature variables. These variables are as follows and 4 of them are shown in <xref ref-type="fig" rid="figure5">Figure 5</xref>.</p><disp-formula id="equWL1"><mml:math id="eqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>S</mml:mi><mml:mi>D</mml:mi><mml:mi>F</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>u</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mn>52</mml:mn><mml:mtext>&#x00A0;</mml:mtext><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>S</mml:mi><mml:mi>D</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mi>o</mml:mi><mml:mi>f</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mi>T</mml:mi><mml:mi>D</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mrow><mml:mi mathvariant="normal">s</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">d</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">G</mml:mi></mml:mrow><mml:mrow><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mrow><mml:mi mathvariant="normal">d</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">G</mml:mi></mml:mrow><mml:mrow><mml:mtext>valley</mml:mtext></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math></disp-formula><disp-formula id="equWL2"><mml:math id="eqn2"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>Q</mml:mi><mml:mi>D</mml:mi><mml:mi>F</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>u</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mn>52</mml:mn><mml:mtext>&#x00A0;</mml:mtext><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>Q</mml:mi><mml:mi>D</mml:mi><mml:mrow><mml:mtext>&#x00A0;</mml:mtext></mml:mrow><mml:mi>o</mml:mi><mml:mi>f</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mi>T</mml:mi><mml:mi>D</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mrow><mml:mi mathvariant="normal">s</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">d</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">c</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mrow><mml:mi mathvariant="normal">d</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">G</mml:mi></mml:mrow><mml:mrow><mml:mtext>valley</mml:mtext></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math></disp-formula><disp-formula id="equWL3"><mml:math id="eqn3"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>R</mml:mi><mml:mi>F</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>u</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mn>52</mml:mn><mml:mtext>&#x00A0;</mml:mtext><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>R</mml:mi><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mi>g</mml:mi><mml:mi>e</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mi>o</mml:mi><mml:mi>f</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mi>T</mml:mi><mml:mi>D</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mrow><mml:mi mathvariant="normal">s</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">d</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">G</mml:mi></mml:mrow><mml:mrow><mml:mi>c</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mrow><mml:mi mathvariant="normal">d</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">G</mml:mi></mml:mrow><mml:mrow><mml:mtext>valley</mml:mtext></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math></disp-formula><disp-formula id="equWL4"><mml:math id="eqn4"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>M</mml:mi><mml:mi>E</mml:mi><mml:mi>F</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>u</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mn>52</mml:mn><mml:mtext>&#x00A0;</mml:mtext><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>M</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mi>o</mml:mi><mml:mi>f</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mi>T</mml:mi><mml:mi>D</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mrow><mml:mi mathvariant="normal">s</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">d</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">c</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mrow><mml:mi mathvariant="normal">d</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">G</mml:mi></mml:mrow><mml:mrow><mml:mtext>valley</mml:mtext></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math></disp-formula><disp-formula id="equWL5"><mml:math id="eqn5"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi>M</mml:mi><mml:mi>E</mml:mi><mml:mi>F</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>u</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mn>47</mml:mn><mml:mtext>&#x00A0;</mml:mtext><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>M</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mi>o</mml:mi><mml:mi>f</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mi>T</mml:mi><mml:mi>D</mml:mi><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mrow><mml:mi mathvariant="normal">s</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">d</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">G</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">c</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">G</mml:mi></mml:mrow><mml:mrow><mml:mtext>peak</mml:mtext></mml:mrow></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mstyle></mml:math></disp-formula><p>Furthermore, we selected the representative samples from the groups of hypertensive patients and healthy people for comparative analysis. The PPG waveform analysis diagrams of hypertensive patients and healthy people are shown in <xref ref-type="fig" rid="figure6">Figure 6</xref>, and the scatter plots of feature 52 are shown in <xref ref-type="fig" rid="figure7">Figure 7</xref>. Then, based on the analysis of feature 52&#x2019;s position in PPG signals, we observed that in hypertensive patients, the peak of the c-point on sdPPG may occur earlier compared to healthy individuals. This could be a possible reason as to why feature 52 is strongly correlated with hypertension and is considered to have a strong causal relationship with hypertension.</p><p>Finally, it is important to note that further research and validation are necessary to confirm the relationship between feature 52, the c-point on sdPPG, and hypertension. These findings may provide valuable insights into potential markers for hypertension and contribute to the understanding of its pathophysiology.</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Comparison of PPG waveforms between healthy people and hypertensive patients. PPG: photoplethysmogram.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig06.png"/></fig><fig position="float" id="figure7"><label>Figure 7.</label><caption><p>Scatter distribution of feature 52 for normotensive subjects (green) and hypertensive subjects (red).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig07.png"/></fig></sec><sec id="s3-2"><title>Causal Graph</title><p>In this study, considering the potential disturbance to the causal graph caused by randomly partitioning the data into training and testing sets, we used the idea of 10-fold cross-validation and causal strategy I to mitigate such interference. After applying the aforementioned procedures, we obtained a total of 6 causal subgraphs under different metrics. In addition, due to space constraints, this paper only presents the causal subgraphs under the standard deviation and range indicators, as shown in <xref ref-type="fig" rid="figure8">Figures 8</xref> and <xref ref-type="fig" rid="figure9">9</xref>, respectively. It is observed that the feature variables directly causally associated with the risk of hypertension vary across different indicators. Based on the principle of majority rule, we applied causal strategy II to obtain the final causal graph, as depicted in <xref ref-type="fig" rid="figure10">Figure 10</xref>.</p><fig position="float" id="figure8"><label>Figure 8.</label><caption><p>Causal subgraph of hypertension and the features calculated with their standard deviation. AI: absolute intensity; AR: area under the PPG curve; dPPG: the first derivative of PPG; P-R: precision-recall; PPG: photoplethysmogram; RI: physiological meaningful relative index; sdPPG: the second derivative of PPG; TD: time duration.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig08.png"/></fig><fig position="float" id="figure9"><label>Figure 9.</label><caption><p>Causal subgraph of hypertension and the features calculated with their range. AM: amplitude; AR: area under the PPG curve; dPPG: the first derivative of PPG; P-R: precision-recall; PPG: photoplethysmogram; RI: physiological meaningful relative index; sdPPG: the second derivative of PPG; TD: time duration.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig09.png"/></fig><fig position="float" id="figure10"><label>Figure 10.</label><caption><p>Final causal graph. AR: area under the PPG curve; dPPG: the first derivative of PPG; P-R: precision-recall; PPG: photoplethysmogram; RI: physiological meaningful relative index; sdPPG: the second derivative of PPG; TD: time duration.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig10.png"/></fig></sec><sec id="s3-3"><title>Hypertension Classification Results</title><p>In this subsection, we used multiple classifier algorithms for hypertension classification prediction. First, we primarily utilized logistic regression and other classification algorithms based on causal feature variables for hypertension classification. The classification performance is presented in <xref ref-type="table" rid="table2">Table 2</xref>. We found that the logistic regression algorithm exhibited the best predictive performance with an accuracy of 0.89, precision of 0.92, recall of 0.82, and <italic>F</italic><sub>1</sub>-score of 0.87. Both the accuracy and accuracy rate are relatively high, which means that our classification prediction model can accurately predict hypertensive patients and healthy people, and the probability of making errors in the judgment of hypertensive patients is low; the <italic>F</italic><sub>1</sub>-score further proves the above conclusion. In addition, a higher recall rate indicates that most patients with high blood pressure can be correctly predicted.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Causality-based classification performance.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Algorithm</td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom">Precision</td><td align="left" valign="bottom">Recall</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td></tr></thead><tbody><tr><td align="left" valign="top">Random forest</td><td align="left" valign="top">0.86</td><td align="left" valign="top">0.90</td><td align="left" valign="top">0.77</td><td align="left" valign="top">0.83</td></tr><tr><td align="left" valign="top">Decision tree</td><td align="left" valign="top">0.78</td><td align="left" valign="top">0.76</td><td align="left" valign="top">0.78</td><td align="left" valign="top">0.76</td></tr><tr><td align="left" valign="top">Naive Bayes</td><td align="left" valign="top">0.80</td><td align="left" valign="top">0.95</td><td align="left" valign="top">0.58</td><td align="left" valign="top">0.72</td></tr><tr><td align="left" valign="top">Logistic regression</td><td align="left" valign="top">0.89</td><td align="left" valign="top">0.92</td><td align="left" valign="top">0.82</td><td align="left" valign="top">0.87</td></tr></tbody></table></table-wrap><p>Subsequently, <xref ref-type="fig" rid="figure11">Figure 11</xref> illustrates the receiver operating characteristic curve and precision-recall curve of the classifier algorithms. The purple line represents the logistic regression classification algorithm. It can be observed that the area under the curve of this logistic regression classification algorithm is higher than that of other classification algorithms in both receiver operating characteristic and precision-recall curves.</p><fig position="float" id="figure11"><label>Figure 11.</label><caption><p>The ROC curve (top panel) and P-R curve (bottom panel) of hypertension detection based on causal features with different machine learning algorithms: the blue curve represents random forest (R), the green curve represents decision tree (D), the red curve represents naive Bayes (G), and the purple curve represents logistic regression (L). AUC: area under the receiver operating characteristic curve; FPR: false positive rate; P-R: precision-recall; ROC: receiver operating characteristic; TPR: true positive rate.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig11.png"/></fig><p>Finally, we compared the classification performance based on causal feature variables with that based on correlated feature variables, as shown in <xref ref-type="table" rid="table3">Table 3</xref>. We found that the best performance in terms of the 4 evaluation metrics was consistently achieved by the classification algorithm based on causal feature variables. This finding is also consistent with the results presented in <xref ref-type="fig" rid="figure12">Figures 12</xref> and <xref ref-type="fig" rid="figure13">13</xref>. These findings imply that the causal characteristics we screened have certain mining value in the field of hypertension prediction.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Classifier performance comparison.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Algorithm</td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom">Precision</td><td align="left" valign="bottom">Recall</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="6"><bold>Causality</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Random forest</td><td align="left" valign="top">0.86</td><td align="left" valign="top">0.90</td><td align="left" valign="top">0.77</td><td align="left" valign="top">0.82</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Decision tree</td><td align="left" valign="top">0.78</td><td align="left" valign="top">0.76</td><td align="left" valign="top">0.78</td><td align="left" valign="top">0.79</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Naive Bayes</td><td align="left" valign="top">0.80</td><td align="left" valign="top">0.95</td><td align="left" valign="top">0.58</td><td align="left" valign="top">0.72</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Logistic regression</td><td align="left" valign="top">0.89</td><td align="left" valign="top">0.92</td><td align="left" valign="top">0.82</td><td align="left" valign="top">0.87</td></tr><tr><td align="left" valign="top" colspan="6"><bold>Correlation</bold></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Random forest</td><td align="left" valign="top">0.79</td><td align="left" valign="top">0.81</td><td align="left" valign="top">0.72</td><td align="left" valign="top">0.75</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Decision tree</td><td align="left" valign="top">0.72</td><td align="left" valign="top">0.68</td><td align="left" valign="top">0.72</td><td align="left" valign="top">0.69</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Naive Bayes</td><td align="left" valign="top">0.80</td><td align="left" valign="top">0.82</td><td align="left" valign="top">0.74</td><td align="left" valign="top">0.77</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Logistic regression</td><td align="left" valign="top">0.85</td><td align="left" valign="top">0.88</td><td align="left" valign="top">0.77</td><td align="left" valign="top">0.82</td></tr></tbody></table></table-wrap><fig position="float" id="figure12"><label>Figure 12.</label><caption><p>The ROC curve (top panel) and P-R curve (bottom panel) for the best classifier of causality and correlation: the blue curve represents the logistic regression classifier based on causality, while the red curve represents the logistic regression classifier based on correlation. AUC: area under the receiver operating characteristic curve; FPR: false positive rate; P-R: precision-recall; ROC: receiver operating characteristic; TPR: true positive rate.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig12.png"/></fig><fig position="float" id="figure13"><label>Figure 13.</label><caption><p>Histogram of evaluation metrics for the best classifier of causality and correlation.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="cardio_v9i1e60238_fig13.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings and Advantages</title><p>This study primarily explored the relationship between feature variables extracted from ECG and PPG signals and hypertension from a causal perspective, using causal inference methods to construct causal graphs. Simultaneously, to preserve the temporal information of time series signals to the maximum extent, causal graphs were constructed separately for 6 metrics, including standard deviation, mean, range, coefficient of variation, median, and quartiles. These causal graphs were derived based on specific causal strategies, ensuring a certain degree of reliability and accuracy in the resulting causal graphs. By assessing the performance of feature variables based on causality in hypertension risk classification prediction against those based on correlation, we validated the reliability of causality-based feature variables compared to correlation-based ones.</p><p>Specifically, when selecting feature variables strongly associated with hypertension, both causal inference and correlation coefficient&#x2013;based methods performed similarly. However, when the association between feature variables and hypertension was weak, causal inference methods tended to select more reliable feature variables compared to correlation-based methods. This is the reason why feature variables based on causality outperformed those based on correlation in hypertension risk prediction. Additionally, we found that feature 52&#x2019;s derived variables exhibited significant differences in distribution between the hypertensive and healthy subject groups under multiple metrics. This may provide potential value and insights for subsequent pathological mechanism analysis.</p></sec><sec id="s4-2"><title>Comparison to Prior Work</title><p>This study conducted exploratory analysis, initially focusing on the correlation analysis between hypertension and blood pressure based on the medical information mart for intensive care (MIMIC) database. Typically, the gold standard for diagnosing hypertension is SBP and DBP, where subjects are considered hypertensive when SBP exceeds 140 mm Hg or DBP exceeds 90 mm Hg. Nevertheless, when clustering analysis was performed on 24-hour dynamic blood pressure data collected from patients, we observed that the blood pressure distribution of hypertensive and nonhypertensive subjects did not exhibit significant differentiation or stratification; instead, they appeared mixed. After analysis, we attributed this phenomenon to factors such as patients taking antihypertensive medications, being in specific states, or incorrect device wear, which indirectly reflects the limitations of blood pressure measurement. Second, we previously conducted causal analysis [<xref ref-type="bibr" rid="ref16">16</xref>] using data collected from a self-generated database of 30 individuals. Causal analysis was primarily carried out under the mean metric, resulting in limited preservation of temporal information. However, it still revealed significant differences in the distribution of feature 52 between the hypertensive and healthy subject groups, consistent with the findings of this paper.</p></sec><sec id="s4-3"><title>Limitations and Future Work</title><p>There were some limitations to this study. First, our work primarily focused on binary classification to distinguish hypertensive patients from healthy individuals. However, hypertension can be categorized into different stages, such as stage 1, stage 2, and stage 3, based on blood pressure level and disease condition. Second, the population used could have been more diverse in terms of race and ethnicity. In our future work, we will consider conducting clustering of the features to distinguish different stages of hypertension, and we will validate the work on larger and more diverse subject populations to be able to draw more general conclusions.</p></sec><sec id="s4-4"><title>Conclusion</title><p>In this study, we explored the feasibility of predicting the risk of hypertension using causal inference methods. First, we constructed causal graphs using the GES algorithm and 10-fold cross-validation approach under each indicator. We then applied corresponding causal strategies to obtain the optimal causal graphs for each indicator. Finally, we merged the causal graphs from different indicators into a final causal graph based on the majority rule. After selecting the feature variables, we used classifiers including random forests, decision trees, naive Bayes, and logistic regression to predict hypertension. Overall, combining various indicators, we found that most classifiers based on causal features have better classification performance than classifiers based on correlation features. To the best of our knowledge, this study represents the first attempt to introduce causal inference methods in hypertension prediction, providing a new perspective for understanding the physiological mechanisms of hypertension.</p></sec></sec></body><back><ack><p>This work was supported in part by the National Natural Science Foundation of China (82102178) and Huzhou ST Special Program of Huzhou (2023GZ01).</p></ack><notes><sec><title>Data Availability</title><p>The data we used for this study came from a public dataset, which other researchers can apply to access [<xref ref-type="bibr" rid="ref17">17</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>KG's contributions include data curation, formal analysis, investigation, methodology, software, validation, visualization, and writing the original draft. YC's contributions include conceptualization, resources, and reviewing and editing the manuscript. XS and ZF contributed to visualization. XD's contributions include conceptualization, funding acquisition, methodology, project administration, resources, supervision, and reviewing and editing the manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>absolute intensity</p></def></def-item><def-item><term id="abb2">AM</term><def><p>amplitude</p></def></def-item><def-item><term id="abb3">AR</term><def><p>area under the PPG curve</p></def></def-item><def-item><term id="abb4">AUC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb5">BP</term><def><p>blood pressure</p></def></def-item><def-item><term id="abb6">DAG</term><def><p>direct acyclic graph</p></def></def-item><def-item><term id="abb7">DBP</term><def><p>diastolic blood pressure</p></def></def-item><def-item><term id="abb8">dPPG</term><def><p>the first derivative of PPG</p></def></def-item><def-item><term id="abb9">ECG</term><def><p>electrocardiogram</p></def></def-item><def-item><term id="abb10">GES</term><def><p>greedy equivalence search</p></def></def-item><def-item><term id="abb11">P-R</term><def><p>precision-recall</p></def></def-item><def-item><term id="abb12">PPG</term><def><p>photoplethysmogram</p></def></def-item><def-item><term id="abb13">PTT</term><def><p>pulse transit time</p></def></def-item><def-item><term id="abb14">RI</term><def><p>physiological meaningful relative index</p></def></def-item><def-item><term id="abb15">RRI</term><def><p>R-R interval</p></def></def-item><def-item><term id="abb16">SBP</term><def><p>systolic blood pressure</p></def></def-item><def-item><term id="abb17">sdPPG</term><def><p>the second derivative of PPG</p></def></def-item><def-item><term id="abb18">TD</term><def><p>time duration</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Williams</surname><given-names>B</given-names> </name><name name-style="western"><surname>Mancia</surname><given-names>G</given-names> </name><name name-style="western"><surname>Spiering</surname><given-names>W</given-names> </name><etal/></person-group><article-title>ESC/ESH Guidelines for the management of arterial hypertension: The Task Force for the management of arterial hypertension of the European Society of Cardiology (ESC) and the European Society of Hypertension (ESH)</article-title><source>Eur Heart J</source><year>2018</year><volume>39</volume><issue>33</issue><fpage>3021</fpage><lpage>3104</lpage><pub-id pub-id-type="doi">10.1093/eurheartj/ehy339</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jain</surname><given-names>P</given-names> </name><name name-style="western"><surname>Gajbhiye</surname><given-names>P</given-names> </name><name name-style="western"><surname>Tripathy</surname><given-names>RK</given-names> </name><name name-style="western"><surname>Acharya</surname><given-names>UR</given-names> </name></person-group><article-title>A two-stage deep CNN architecture for the classification of low-risk and high-risk hypertension classes using multi-lead ECG signals</article-title><source>Inform Med Unlocked</source><year>2020</year><volume>21</volume><fpage>100479</fpage><pub-id pub-id-type="doi">10.1016/j.imu.2020.100479</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mills</surname><given-names>KT</given-names> </name><name name-style="western"><surname>Stefanescu</surname><given-names>A</given-names> </name><name name-style="western"><surname>He</surname><given-names>J</given-names> </name></person-group><article-title>The global epidemiology of hypertension</article-title><source>Nat Rev Nephrol</source><year>2020</year><month>04</month><volume>16</volume><issue>4</issue><fpage>223</fpage><lpage>237</lpage><pub-id pub-id-type="doi">10.1038/s41581-019-0244-2</pub-id><pub-id pub-id-type="medline">32024986</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mancia</surname><given-names>G</given-names> </name><name name-style="western"><surname>Kreutz</surname><given-names>R</given-names> </name><name name-style="western"><surname>Brunstr&#x00F6;m</surname><given-names>M</given-names> </name><etal/></person-group><article-title>ESH Guidelines for the management of arterial hypertension. The Task Force for the management of arterial hypertension of the European Society of Hypertension: endorsed by the International Society of Hypertension (ISH) and the European Renal Association (ERA)</article-title><source>J Hypertens</source><year>2023</year><month>12</month><day>1</day><volume>41</volume><issue>12</issue><fpage>1874</fpage><lpage>2071</lpage><pub-id pub-id-type="doi">10.1097/HJH.0000000000003480</pub-id><pub-id pub-id-type="medline">37345492</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>QF</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>WY</given-names> </name><name name-style="western"><surname>Asayama</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Ambulatory blood pressure monitoring to diagnose and manage hypertension</article-title><source>Hypertension</source><year>2021</year><month>02</month><volume>77</volume><issue>2</issue><fpage>254</fpage><lpage>264</lpage><pub-id pub-id-type="doi">10.1161/HYPERTENSIONAHA.120.14591</pub-id><pub-id pub-id-type="medline">33390042</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Paragliola</surname><given-names>G</given-names> </name><name name-style="western"><surname>Coronato</surname><given-names>A</given-names> </name></person-group><article-title>An hybrid ECG-based deep network for the early identification of high-risk to major cardiovascular events for hypertension patients</article-title><source>J Biomed Inform</source><year>2021</year><month>01</month><volume>113</volume><fpage>103648</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2020.103648</pub-id><pub-id pub-id-type="medline">33276113</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Elgendi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Fletcher</surname><given-names>R</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>The use of photoplethysmography for assessing hypertension</article-title><source>NPJ Digit Med</source><year>2019</year><volume>2</volume><fpage>60</fpage><pub-id pub-id-type="doi">10.1038/s41746-019-0136-7</pub-id><pub-id pub-id-type="medline">31388564</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alkhodari</surname><given-names>M</given-names> </name><name name-style="western"><surname>Islayem</surname><given-names>DK</given-names> </name><name name-style="western"><surname>Alskafi</surname><given-names>FA</given-names> </name><name name-style="western"><surname>Khandoker</surname><given-names>AH</given-names> </name></person-group><article-title>Predicting hypertensive patients with higher risk of developing vascular events using heart rate variability and machine learning</article-title><source>IEEE Access</source><year>2020</year><volume>8</volume><fpage>192727</fpage><lpage>192739</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2020.3033004</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rajput</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Sharma</surname><given-names>M</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>RS</given-names> </name><name name-style="western"><surname>Acharya</surname><given-names>UR</given-names> </name></person-group><article-title>Automated detection of severity of hypertension ECG signals using an optimal bi-orthogonal wavelet filter bank</article-title><source>Comput Biol Med</source><year>2020</year><month>08</month><volume>123</volume><fpage>103924</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2020.103924</pub-id><pub-id pub-id-type="medline">32768053</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Pearl</surname><given-names>J</given-names> </name></person-group><article-title>Comment: Understanding Simpson&#x2019;s Paradox</article-title><source>Probabilistic and Causal Inference: The Works of Judea Pearl</source><year>2022</year><fpage>399</fpage><lpage>412</lpage><pub-id pub-id-type="doi">10.1145/3501714.3501738</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yao</surname><given-names>L</given-names> </name><name name-style="western"><surname>Chu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Li</surname><given-names>S</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Gao</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>A</given-names> </name></person-group><article-title>A survey on causal inference</article-title><source>ACM Trans Knowl Discov Data</source><year>2021</year><month>10</month><day>31</day><volume>15</volume><issue>5</issue><fpage>1</fpage><lpage>46</lpage><pub-id pub-id-type="doi">10.1145/3444944</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mieloszyk</surname><given-names>R</given-names> </name><name name-style="western"><surname>Twede</surname><given-names>H</given-names> </name><name name-style="western"><surname>Lester</surname><given-names>J</given-names> </name><etal/></person-group><article-title>A comparison of wearable tonometry, photoplethysmography, and electrocardiography for cuffless measurement of blood pressure in an ambulatory setting</article-title><source>IEEE J Biomed Health Inform</source><year>2022</year><month>07</month><volume>26</volume><issue>7</issue><fpage>2864</fpage><lpage>2875</lpage><pub-id pub-id-type="doi">10.1109/JBHI.2022.3153259</pub-id><pub-id pub-id-type="medline">35201992</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>Ding</surname><given-names>X</given-names> </name><name name-style="western"><surname>Yan</surname><given-names>BP</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>YT</given-names> </name><etal/></person-group><article-title>Feature exploration for knowledge-guided and data-driven approach based cuffless blood pressure measurement</article-title><source>arXiv</source><access-date>2024-12-03</access-date><comment>Preprint posted online on  Aug 27, 2019</comment><comment><ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1908.10245">https://arxiv.org/abs/1908.10245</ext-link></comment></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chickering</surname><given-names>DM</given-names> </name></person-group><article-title>Optimal structure identification with greedy search</article-title><source>J Mach Learn Res</source><year>2002</year><volume>3</volume><issue>Nov</issue><fpage>507554</fpage><pub-id pub-id-type="doi">10.1162/153244303321897717</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>K</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Sch&#x00F6;lkopf</surname><given-names>B</given-names> </name><name name-style="western"><surname>Glymour</surname><given-names>C</given-names> </name></person-group><article-title>Generalized score functions for causal discovery</article-title><source>KDD</source><year>2018</year><month>08</month><volume>2018</volume><fpage>1551</fpage><lpage>1560</lpage><pub-id pub-id-type="doi">10.1145/3219819.3220104</pub-id><pub-id pub-id-type="medline">30191079</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Gong</surname><given-names>K</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ding</surname><given-names>X</given-names> </name></person-group><article-title>Causal inference for hypertension prediction</article-title><year>2023</year><conf-name>2023 45th Annual International Conference of the IEEE Engineering in Medicine &#x0026; Biology Society (EMBC)</conf-name><conf-date>Jul 24-27, 2023</conf-date><conf-loc>Sydney, Australia</conf-loc><pub-id pub-id-type="doi">10.1109/EMBC40787.2023.10341021</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="web"><article-title>Aurora</article-title><source>Microsoft</source><access-date>2025-01-07</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.microsoft.com/en-us/research/project/aurora/">https://www.microsoft.com/en-us/research/project/aurora/</ext-link></comment></nlm-citation></ref></ref-list></back></article>