Full text
47,554 characters
· extracted from
preprint-html
· click to expand
Artificial Intelligence-Enabled Electrocardiogram for Elevated Left Ventricular Filling Pressure | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Artificial Intelligence-Enabled Electrocardiogram for Elevated Left Ventricular Filling Pressure View ORCID Profile Jaehyun Lim , View ORCID Profile Min Sung Lee , Jung Ho Suh , Sora Kang , View ORCID Profile Hak Seung Lee , Jong-Hwan Jang , Jeong Min Son , Joon-Myoung Kwon , Yong-Jin Kim , View ORCID Profile Kyung-Hee Kim , View ORCID Profile Seung-Pyo Lee doi: https://doi.org/10.1101/2025.10.03.25337299 Jaehyun Lim 1 Department of Internal Medicine, Seoul National University College of Medicine and Seoul National University Hospital , Seoul, Republic of Korea MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jaehyun Lim Min Sung Lee 2 Digital Healthcare Institute, Sejong Hospital , Bucheon, Republic of Korea 3 Medical AI Co., Ltd. Seoul , Republic of Korea MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Min Sung Lee Jung Ho Suh 4 Biomedical Research Institute, Seoul National University , Seoul, Republic of Korea MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Sora Kang 2 Digital Healthcare Institute, Sejong Hospital , Bucheon, Republic of Korea 3 Medical AI Co., Ltd. Seoul , Republic of Korea MS Find this author on Google Scholar Find this author on PubMed Search for this author on this site Hak Seung Lee 2 Digital Healthcare Institute, Sejong Hospital , Bucheon, Republic of Korea 3 Medical AI Co., Ltd. Seoul , Republic of Korea MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Hak Seung Lee Jong-Hwan Jang 2 Digital Healthcare Institute, Sejong Hospital , Bucheon, Republic of Korea 3 Medical AI Co., Ltd. Seoul , Republic of Korea MD, PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jeong Min Son 2 Digital Healthcare Institute, Sejong Hospital , Bucheon, Republic of Korea 3 Medical AI Co., Ltd. Seoul , Republic of Korea MD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Joon-Myoung Kwon 2 Digital Healthcare Institute, Sejong Hospital , Bucheon, Republic of Korea 3 Medical AI Co., Ltd. Seoul , Republic of Korea MD, MS Find this author on Google Scholar Find this author on PubMed Search for this author on this site Yong-Jin Kim 1 Department of Internal Medicine, Seoul National University College of Medicine and Seoul National University Hospital , Seoul, Republic of Korea 4 Biomedical Research Institute, Seoul National University , Seoul, Republic of Korea 5 Healthcare AI Research Institute, Seoul National University Hospital , Seoul, Republic of Korea MD, PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site Kyung-Hee Kim 6 Division of Cardiology, Department of Internal Medicine, Incheon Sejong Hospital, Cardiovascular Center , Incheon, Republic of Korea MD, PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Kyung-Hee Kim For correspondence: sproll1{at}snu.ac.kr learnbyliving9{at}gmail.com Seung-Pyo Lee 1 Department of Internal Medicine, Seoul National University College of Medicine and Seoul National University Hospital , Seoul, Republic of Korea 4 Biomedical Research Institute, Seoul National University , Seoul, Republic of Korea 5 Healthcare AI Research Institute, Seoul National University Hospital , Seoul, Republic of Korea MD, PhD Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Seung-Pyo Lee For correspondence: sproll1{at}snu.ac.kr learnbyliving9{at}gmail.com Abstract Full Text Info/History Metrics Data/Code Preview PDF ABSTRACT Background Left ventricular filling pressure (LVFP) is associated with heart failure symptoms, a key prognostic marker, and a therapeutic target, but is difficult to measure non-invasively. We aimed to develop and validate a deep learning-based artificial intelligence (AI) model using a standard 12-lead electrocardiogram (ECG) to detect elevated LVFP and assess its prognostic value. Methods We trained an AI model to detect increased LVFP. Septal E/e’ >15 on Doppler echocardiography was used to define increased LVFP and guide AI-ECG model training. The model was built upon a foundation model trained with >1 million multi-ethnic ECGs and fine-tuned through a development cohort of 225737 ECGs and 115982 echocardiogram data from 92775 unique patients from two tertiary hospitals. The model performance was assessed in a separate internal population from the development cohort (n=9278) and an independent external cohort from another tertiary hospital (n=17926). The prognostic significance of the AI-ECG output value was evaluated via survival analyses using the internal and external hospital cohorts, as well as the UK Biobank (n=43347). Results The AI-ECG model detected increased LVFP with an area under the curve of 0·868 (95% confidence interval [CI] 0·859–0·877) and 0·850 (95% CI 0·841–0·858) in the internal and external test cohorts, respectively. The model output was an independent predictor of mortality in all three cohorts (adjusted hazard ratio per 10-point increment: internal 1.31 [95% CI 1·23–1·38]; external 1·32 [95% CI 1·28–1·35]; UK Biobank 1.16 [95% CI 1·07–1·26]; all p<0·001). Its prognostic capability was comparable or superior to traditional echocardiographic parameters, particularly in patients with comorbidities. Conclusions The AI-ECG may enable identification of patients with increased LVFP and provide powerful prognostic information. Further prospective studies are warranted to evaluate its clinical utility. What Is New? By using a specific, broadly applicable echocardiographic marker, E/e’ > 15 as the training target, our model circumvents the well-documented problems of indeterminate classifications and the exclusion of patients with atrial fibrillation, that have constrained previous models. The most significant added value is the extensive external validation. We built our model upon a state-of-the-art, multi-ethnic foundation model pre-trained on >1 million ECGs, and demonstrated the model’s consistent high performance not only in an internal cohort but also in two independent, racially and geographically distinct external cohorts. This robust external validation directly confronts the critical challenge of generalizability. What Are the Clinical Implications? The AI-ECG output value provides independent and meaningful prognostic information, with performance comparable or numerically superior to established traditional echocardiographic parameters. This was particularly evident in patients with comorbidities, where the role of traditional echocardiographic markers is often limited. The AI-ECG may enable both population-level screening and enhance longitudinal management, offering an opportunity to identify at-risk individuals earlier and implement preventive strategies. INTRODUCTION Elevated left ventricular filling pressure (LVFP), a consequence of left ventricular diastolic dysfunction (LVDD), is associated with heart failure symptoms, and a key prognostic marker and therapeutic target. 1 – 6 However, direct measurement of LVFP via invasive methods, the current gold standard, is impractical for routine screening or therapeutic guidance. Accordingly, there has been ongoing research to detect increased LVFP noninvaisvely. 1 , 5 , 7 Several echocardiographic parameters—such as peak early (E) and late (A) mitral inflow velocities, early diastolic mitral annulus velocity (e’), the E/e’ ratio, peak velocity of tricuspid regurgitation by continuous-wave Doppler, and left atrial volume index—have been suggested, 7 , 8 with the latest guidelines integrating these parameters into a diagnostic algorithm. 1 Nonetheless, the performance of this algorithm and its individual components has been modest. 7 , 9 Furthermore, each parameter has inherent limitations, particularly notable with the latest guideline, which leaves many patients in an indeterminate category and is inapplicable to patients with atrial fibrillation/flutter (AF/AFL). 1 , 7 , 10 Artificial intelligence (AI) has provided novel solutions in medicine, particularly by leveraging conventional yet widely-used techniques, such as the electrocardiogram (ECG). 11 – 15 As the ECG encodes the vector summation of electrical signals including myocardial contraction and relaxation, deep neural network-based processing of the ECG has demonstrated potential in unraveling meaningful patterns, suggesting AI-enhanced ECG as a valuable screening and diagnostic tool in various cardiac diseases. 11 – 15 We hypothesized that AI-driven ECG analysis could identify elevations in LVFP. This study aimed to develop and validate an AI model, trained using septal E/e’ >15 as a reference, that performs reliably across diverse ethnicities and populations as well as cardiac rhythms, including atrial arrhythmias. 8 The model performance and its prognostic significance were validated in an internal cohort and two independent external cohorts from racially and geographically diverse populations. METHODS Study design, datasets, and population This was a retrospective multicenter study involving three tertiary hospitals in South Korea and the UK Biobank. The model was developed using data from adult patients at Bucheon Sejong Hospital (Hospital A) and Incheon Sejong Hospital (Hospital B) who underwent transthoracic echocardiography and a 12-lead ECG within a 14-day window between September 2016 and October 2023. The model was tested both internally and externally, with external testing using data from Seoul National University Hospital (Hospital C). Across all hospital cohorts, patients with a history of mitral valve repair or replacement, a left ventricular assist device, constrictive pericarditis, or missing septal E/e’ were excluded. Raw ECG data were extracted in XML format at a 500Hz sampling rate. Given that increases in LVFP predict survival, 2 , 4 , 5 we conducted survival analyses using both the hospital-based mortality data (from Hospitals A, B, and C, for test datasets only) and the UK Biobank data ( Figure 1 ). Mortality data were obtained from death statistics provided by Statistics Korea. In the UK Biobank data, resting 10-second ECG recorded at 500Hz was matched with clinical information collected between May 2014 and July 2022. Download figure Open in new tab Figure 1. Study workflow The study outlines the AiTiALVDD model development process, comprising upstream and downstream tasks using large-scale ECG and echocardiogram datasets. External validation was conducted at Seoul National University Hospital and UK Biobank to assess primary, secondary, survival, and exploratory outcomes. This study was approved by the Institutional Review Boards at each participating hospital (No.: Hospital A, 2024-09-003; B, 2024-09-001; C, H-2408-112-1562), and informed consent was waived. The UK Biobank application (Ref: 89372) was approved with an appropriate Material Transfer Agreement. AI-ECG model development Our model, AiTiALVDD v0.90.00, was built upon a pre-trained foundation model that serves as a generalizable learning framework trained on a large-scale ECG dataset before being fine-tuned for specific clinical tasks. The foundation model was initially trained using 1291868 ECG samples from 442736 unique patients from five international public repositories. The foundation model was subsequently fine-tuned using labeled ECG data from Hospitals A and B to detect increased LVFP. We chose a mitral septal E/e’ ratio >15 as an estimator of increased LVFP. 8 Our rationale for using this criterion included its mathematical background linking it to LVFP, its diagnostic accuracy comparable to the latest 2016 ASE/EACVI guideline when validated against invasively measured LVFP, and its broad applicability across cardiac rhythms. 7 , 9 The final model generates a continuous output, an AI-ECG score, between 0–100. A 1-lead version using lead I was also derived from the 12-lead model. Further model specifications are detailed in the eText 1 and eFigures 1, 2 . Endpoints The primary endpoint was the ability of the AI-ECG model detecting increased LVFP. The secondary endpoint was the identification of grade II/III LVDD according to the latest guideline. 1 Patients with indeterminate LVDD status were excluded from the secondary analysis. Survival analysis We conducted survival analyses using this value in the internal test cohort (Hospital A and B), the external test cohort (Hospital C), and the prognostic significance validation cohort, the UK Biobank ( Figure 1 ). Cox proportional hazards models were used to evaluate the prognostic value of the AI-ECG scores. The prognostic discrimination of the AI-ECG score, E/e’ ratio, and LVDD grade for all-cause mortality was compared using C-index. Subgroup analyses were conducted according to age, sex, comorbidities, electrocardiographic and echocardiographic features (left ventricular ejection fraction [LVEF], mitral regurgitation). For an exploratory analysis, the AI-ECG score was compared with N-terminal prohormone of brain natriuretic peptide (NT-proBNP) levels. Patients with NT-proBNP levels measured within two days of the echocardiography were included in this analysis. Statistical Analysis Demographic characteristics were compared using Student’s t-test, Mann-Whitney U-test, chi-square test, or Fisher’s exact test, as appropriate. The area under the receiver operating characteristic curve (AUROC), area under the precision-recall curve (AUPRC), sensitivity, specificity, positive predictive value (PPV), and negative predictive value (NPV) with corresponding 95% confidence intervals (CI) were calculated using bootstrap resampling and averaging methods. The optimal threshold for binary classification was selected at the Youden index. The DeLong test was employed to compare AUROCs between models. 16 Correlations between two parameters were assessed using the Pearson correlation coefficient. A multivariable Cox-proportional hazards model was employed to calculate adjusted hazard ratios (aHRs) and 95% CIs, with adjustment for age, sex, hypertension, diabetes mellitus, ischemic heart disease, heart failure, stroke, and CKD. For all Cox regression models, the AI-ECG score was analyzed per 10-point increment. Similarly, age was also analyzed per 10-year increment. We used R software v4.4.1 and Python v3.9.7, and a two-sided p <.05 was considered statistically significant. This study was reported following the STARD (Standards for Reporting of Diagnostic Accuracy Studies) guidelines. RESULTS Baseline characteristics: development cohort The development cohort (Hospitals A, B) included 225737 ECGs and 115982 echocardiograms from 92775 unique patients ( Figure 1 and Table 1 ). Among these, 15130 echocardiogram-ECG pairs (13.0%) had increased LVFP. Patients with increased LVFP were older, more likely to be women, had a higher burden of comorbidities, a larger left atrium, and higher NT-proBNP levels than those with normal LVFP ( Table 1 ). View this table: View inline View popup Table 1. Baseline characteristics: Development cohort (Hospital A, B) Baseline characteristics: external cohort and prognostic significance validation cohort The external test cohort from Hospital C included 17929 echocardiogram-ECG pairs from 17926 patients, of which 2024 pairs (11.3%) were classified as having increased LVFP ( Figure 1 ). The clinical characteristics of these patients were similar to those in the development cohort ( Table 2 ). The prognostic significance validation cohort, the UK Biobank, included 43,347 individuals. Baseline characteristics of this cohort are detailed in eTable 2 . View this table: View inline View popup Download powerpoint Table 2. Primary and secondary endpoints: AI model discrimination performance of the increased LVFP or LVDD grade (II or III) Distributions of AL-ECG model output, the AI-ECG score In the internal test cohort, the increased LVFP group had a median AI-ECG score of 34.1 (interquartile range [IQR] 18.1–54.8), whereas the normal LVFP group had a median score of 5.6 (IQR 1.6–14.7). A similar separation was observed in the external cohort (median scores 28.4 vs. 6.0, Figure 2 ). There was a stepwise increase in the AI-ECG scores with higher septal E/e’ groups of ≤8, >8 to ≤15, and >15 ( eFigure 3 ), as well as LVDD grades based on the 2016 ASE/EACVI recommendations ( eFigure 4 ), in both the internal and external test cohorts. The Pearson correlation coefficients between E/e’ and AI-ECG score were 0.60 and 0.54 in the internal and external test datasets, respectively (both p<.001, eFigure 5 ). Download figure Open in new tab Figure 2. Comparison of the AI-ECG score distribution between increased and normal left ventricular filling pressure groups Distribution of the AI-ECG scores according to left ventricular filling pressure (LVFP) status. The boxplots illustrate the AI-ECG scores for the increased LVFP group (blue) and the normal LVFP group (pink). In the increased LVFP group (internal test) the mean AI-ECG score was 37.2 ± 22.1, with a median of 34.1 (Interquartile range, 18.1–54.8). In contrast, the normal LVFP group had a mean AI-ECG score of 10.6 ± 13.1 and a median of 5.9 (1.6–14.7). In the increased LVFP group (external test) the mean AI-ECG score was 32.2 ± 20.7, with a median of 28.4 (14.8–46.3). In contrast, the normal LVFP group had a mean AI-ECG score of 10.0 ± 11.7 and a median of 6.0 (2.3–13.3). The cutoff score of 13.3 (indicated by the blue dashed line) was predefined during the model development phase using Younden’s J statistic. Panel (A) represents the internal test, while panel (B) represents the external test. Primary and secondary endpoints For the primary endpoint of detecting increased LVFP, the AI-ECG model achieved an AUROC of 0.868 (95% CI 0.859–0.877) and an AUPRC of 0.540 (95% CI 0.511–0.569) in the internal test cohort. A similar AUROC of 0.850 (95% CI 0.841–0.858) and AUPRC of 0.458 (95% CI 0.435–0.479) were demonstrated in the external test cohort ( Figure 3 and Table 2 ). Sensitivity, specificity, PPV, and NPV were 83.4% (95% CI 81.6–85.2), 72.4% (95% CI 71.6–73.3), 31.1% (95% CI 29.7–32.5), and 96.7% (95% CI 96.3–97.1) in the internal test cohort. The performance was also robust in the external cohort ( Table 2 ). Download figure Open in new tab Figure 3. Receiver operating characteristic curve analyses for primary and secondary endpoints. Receiver operating characteristics curves (panel A, internal test; panel B, external test), illustrating the discriminative ability of the AI-ECG model in detecting elevated left ventricular filling pressure, defined by a mitral E/e’ ratio > 15 (primary outcome), and in identifying left ventricular diastolic dysfunction grade II/III (secondary outcome). The primary outcome is depicted in blue, and the secondary outcome is depicted in red. AUROC, area under the receiver operating characteristic curve; AUPRC, area under the precision-recall curve For the secondary endpoint (grade II/III LVDD), the model demonstrated high AUROCs of 0.901 (95% CI 0.892–0.910) and 0.941 (95% CI 0.931–0.951) in the internal and external test cohorts, respectively ( Figure 3 and Table 2 ). Subgroup analysis of primary and secondary endpoints In the subgroup analyses, the AUROCs were consistently lower in patients with unfavorable clinical characteristics, such as advanced age, comorbidities including hypertension, diabetes mellitus, CKD, ischemic heart disease, systolic dysfunction, or non-sinus rhythms, and AF/AFL, in both the internal and external cohorts ( eTables 3 and 4, eFigure 6 ). The performance for discriminating grade II/III LVDD was generally better across subgroups, but the tendency of lower performance in those with unfavorable clinical characteristics was consistently observed ( eTables 5 and 6, eFigure 7 ). Survival analysis of AI-ECG for increased LVFP The internal test cohort (Hospitals A and B), external test cohort (Hospital C), and the UK Biobank consisted of 7568, 17922, and 43347 patients, respectively, with median follow-up periods of 2.7 (IQR 1.4–4.0), 5.8 (IQR 3.9–8.0), and 3.4 (IQR 2.5–4.9) years. During follow-up, 361 deaths occurred in the internal test cohort (4.8%), 2837 in the external test cohort (15.8%), and 536 in the UK Biobank (1.2%). Kaplan–Meier analysis showed progressive increases in mortality by AI-ECG score quartiles ( eFigure 8–10 ). After multivariable adjustment, the AI-ECG score remained independently associated with mortality across all cohorts: adjusted hazard ratio (aHR) 1.31 (95% CI 1.23–1.38, p <.001) in the internal test cohort; aHR 1.32 (95% CI 1.28–1.35, p <.001) in the external test cohort; and aHR 1.16 (95% CI 1.07–1.26, p <.001) in the UK Biobank ( eTables 7 – 9 ). Regarding prognostic performance, as measured by the C-index, it was generally favorable for the AI-ECG score compared to echocardiographic LVDD grading and E/e’ ratio ( eTable 10 ). In the internal test cohort, the AI-ECG score achieved a C-index of 0.877 (95% CI 0.855–0.898) versus 0.868 (95% CI 0.846–0.890) for LVDD grading and 0.867 (95% CI 0.845-0.889) for E/e’ ratio. In the external test cohort, the C-index for AI-ECG was 0.720 (95% CI 0.708–0.733), compared to 0.711 (95% CI 0.699–0.724) for LVDD grading and 0.709 (95% CI 0.697-0.721) for E/e’ ratio, with no statistically significant difference between AI-ECG and LVDD grading (p=0.305). Notably, the AI-ECG score demonstrated numerically superior prognostic discrimination for all-cause mortality particularly in most subgroups of patients with comorbidities ( eTable 10 ). Performance comparison between AI-ECG and NT-proBNP for increased LVFP In our exploratory analysis, the 12-lead AI-ECG outperformed NT-proBNP in both internal and external test cohorts regarding the primary endpoint: AUROCs were 0.840 (95% CI 0.821–0.856) for AI-ECG vs. 0.809 (95% CI 0.788–0.828) for NT-proBNP in the internal test, and 0.835 (95% CI 0.802–0.866) for AI-ECG vs. 0.767 (95% CI 0.730–0.802) for NT-proBNP in the external test cohort ( eTable 11 ). Consistent results were demonstrated for secondary outcomes ( eTable 12 ). Notably, a single lead model achieved performance comparable to NT-proBNP ( eTables 11 and 12 ). DISCUSSION The present study demonstrates that the AI-ECG model can reliably identify increased LVFP, whether defined by an E/e’ >15 or by LVDD grading (grade II/III), and provide robust prognostic information. Importantly, these results were validated in racially and geographically diverse external cohorts, highlighting the model’s generalizability. Deep neural networks, when trained with sufficiently large datasets, can effectively generalize and accurately discern meaningful patterns even in the presence of considerable noise—even up to 50:1 of noise-to-signal ratios in the presence of a sufficiently large number (≥10,000) of valid samples. 17 This has also been demonstrated in medicine. For instance, although diagnostic variability among ophthalmologists in diabetic retinopathy is substantial, AI models trained using these noisy human-labeled datasets have demonstrated performance surpassing that of ophthalmologists. 18 , 19 Our model was pre-trained on over a million ECGs and fine-tuned using over 100,000 ECG–echocardiogram pairs labeled with E/e′. Thus, despite the acknowledged suboptimal nature of E/e’ for defining increased LVFP, this dataset likely provided sufficient volume and variety for the AI model to learn ECG patterns representative of elevated LVFP, resulting in comparable or superior performance in certain contexts to traditional echocardiographic parameters. Selecting a reference standard for AI model development requires balancing precision with data availability and generalizability. While invasive measurements are the gold standard, their relative scarcity limits dataset size and increases risk of overfitting. Indeed, we, for the first time, have reported an AI-ECG model detecting diastolic heart failure with preserved LVEF based on the 2016 ASE/EACVI recommendations, 1 , 13 with a subsequent study demonstrating similar findings across various EF ranges. 12 Despite acceptable AUROCs, it should be noted that our previous study was limited to patients with preserved LVEF, while the latter study lacked rigorous external validation. 12 , 13 Indeed, reproducibility and rigorous external validation of AI models are to be emphasized. 20 In addition, as these studies utilized LVDD grading, they inherently excluded AF/AFL, significantly limiting generalizability and clinical applicability given its high prevalence. 1 The 2016 algorithm also leaves many patients in an indeterminate category. 10 Furthermore, the diagnostic accuracy of this integrated algorithm is only comparable to E/e’ in detecting increased LVFP, particularly in patients with preserved LVEF (see eTable 13 for comparison). 9 Thus, our model trained based on E/e’, given its physiological rationale and broader applicability across cardiac rhythms, offers greater clinical acceptability and generalizability. 7 LVFP holds two clinical objectives: therapeutic guidance and prognostication. Regarding prognostication, our study demonstrated that the AI-ECG model provides robust prognostic prediction, often comparable or superior to echocardiographic parameters, particularly in patients with comorbidities. The lower hazard ratio in the UK Biobank data is likely attributable to its lower heart failure prevalence (0.7%) compared to hospital-based cohorts enriched with patients having increased LVFP in the presence of systolic dysfunction. As for therapeutic guidance, guiding therapy based on the accurate assessment of LVFP has significant clinical implications, as demonstrated by the CHAMPION trial where invasive hemodynamic-guided therapy significantly reduced heart failure hospitalizations. 3 However, such invasive monitoring is impractical for widespread use. While echocardiography has been also demonstrated to guide therapy, its utility for frequent reassessment is limited by high cost, resource demands, and intra- and inter-observer variability. 5 , 21 , 22 Harmonizing AI with ECG addresses these limitations, enabling frequent, noninvasive monitoring. Moreover, its simple and rapid nature makes it particularly well-suited for population-based screening. 23 Its favorable performance compared to established biomarkers such as NT-proBNP further highlights its potential applicability. Prior research on using AI-ECG to detect increased LVFP is limited. One study trained a model directly on invasively measured pulmonary capillary wedge pressure (PCWP), and reported modest performance (AUROC 0.79–0.82) in internal and subsequent external validation. 15 , 24 It should be noted that this approach is inherently susceptible to selection bias and lacks generalizability despite its methodological robustness, because only high-risk patients necessitating invasive pulmonary artery catheterization were used to train the model. Nonetheless, this prior work should be appraised since they demonstrated the proof-of-concept that changes in model outputs generally correlate with changes in the PCWP, demonstrating the possibility that AI-ECG may be used to track patients and guide treatment. 24 Subgroup analyses offer a critical insight into the AI-ECG model. We observed a consistent tendency toward lower AUROC in subgroups with advanced age or comorbidities. However, the reduced performance in these subgroups may not reflect a deficiency in the AI model, but rather the inherent limitations of the echocardiographic reference standard: that is, the E/e’ ratio itself may less accurately represent the true elevation in LVFP in these populations, leading to an artificially lower AUROC. 25 , 26 For instance, the subgroup with LVEF <40% provides compelling insight. Prior invasive catheterization studies reported that 80–95% of patients with systolic dysfunction had increased LVFP. 2 , 6 , 27 Whereas the AI model classified 85.3% of these patients as having increased LVFP, only 39.7% of these patients were classified as such according to the E/e’ or LVDD grading, strongly suggesting that the AI-ECG approach may more accurately reflect true elevations in LVFP. Similarly, previous literature has suggested a lower E/e’ threshold (e.g., E/e’>11) for increased LVFP in patients with AF/AFL. 26 , 28 Accordingly, the observed low specificity in these patients likely indicates that some of those who were classified as having normal LVFP according to E/e’≤15 might actually have increased LVFP. Ultimately, the observation that our model—trained on E/e’ >15 threshold—aligns better with the expected clinical and pathophysiological status in subgroups where that same threshold is known to be unreliable, suggests the model learned underlying physiological signals beyond the label itself. Limitations Our study has several limitations. First, despite its robust learning capability, training the model solely based on echocardiographic parameters may lack clinical robustness. However, using E/e’ for model training is a strategic compromise, obtaining sufficient data volume and minimizing selection bias at the expense of methodological robustness, ultimately ensuring greater model generalizability. Second, more delicate model training, such as using different thresholds of E/e’ according to age or cardiac rhythm, might have improved performance. Third, the optimal clinical thresholds for guiding therapeutic interventions may vary across individuals and remain to be established. Future research is required to define and validate such clinically relevant thresholds. Lastly, a maximum interval of 14 days between ECG and echocardiography might allow for changes in the patient’s clinical status. CONCLUSION The present study demonstrates that an AI-ECG may identify patients with increased LVFP. The AI model showed robust performance in external validation cohorts derived from geographically and racially different populations. Beyond correlation with echocardiographic parameters indicating increased LVFP, our model provided meaningful prognostic information. Further studies are warranted to evaluate the clinical utility of AI-ECG in screening patients with increased LVFP or guiding interventions in these patients. Author Contributions Jaehyun Lim (Study design, Data analysis, Manuscript drafting and critical revision), Min Sung Lee (Data acquisition, Statistical analysis, Manuscript drafting), Jung Ho Suh (Data curation, Data interpretation, Manuscript revision), Sora Kang (Data curation, Statistical analysis, Manuscript revision), Hak Seung Lee (Data curation, Data interpretation, Critical manuscript revision), Jong-Hwan Jang (Data management, Statistical support, Manuscript review), Jeong Min Son (Data acquisition, Data verification, Manuscript review), Joon-Myoung Kwon (Study conception, Model development, Manuscript drafting and critical revision), Yong-Jin Kim (Clinical data interpretation, Manuscript review), Kyung-Hee Kim (Study design, Study supervision, Data analysis, Manuscript drafting, Review and Approval), and Seung-Pyo Lee (Study design, Study supervision, Data analysis, Manuscript drafting, Review and approval). Declaration of Interests M.S.L., S.K., H.S.L., J.-H.J., J.M.S., and J.-M.K. are employees of Medical AI Co., Ltd. and are involved in an equity/royalty relationship with Medical AI Co., Ltd. J.-M.K. is the founder of Medical AI Co., Ltd. S.-P.L. is involved in an equity relationship with Medical AI Co., Ltd. No other conflicts of interest relevant to this article were reported. Data Availability The data used for this study are available upon reasonable request to the corresponding author for research purposes. The AiTiALVDD model used in this study will be made available to external researchers upon request to validate and expand the findings presented in this study. Funding This study did not receive specific funding or grants. ACKNOWLEDGEMENT REFERENCES 1. ↵ Nagueh SF , Smiseth OA , Appleton CP , Byrd BF , Dokainish H , Edvardsen T , Flachskampf FA , Gillebert TC , Klein AL , Lancellotti P . Recommendations for the evaluation of left ventricular diastolic function by echocardiography: an update from the American Society of Echocardiography and the European Association of Cardiovascular Imaging . European Journal of Echocardiography . 2016 ; 17 : 1321 – 1360 . OpenUrl CrossRef 2. ↵ Drazner MH , Hellkamp AS , Leier CV , Shah MR , Miller LW , Russell SD , Young JB , Califf RM , Nohria A . Value of clinician assessment of hemodynamics in advanced heart failure: the ESCAPE trial . Circulation: Heart Failure . 2008 ; 1 : 170 – 177 . OpenUrl Abstract / FREE Full Text 3. ↵ Abraham WT , Adamson PB , Bourge RC , Aaron MF , Costanzo MR , Stevenson LW , Strickland W , Neelagaru S , Raval N , Krueger S . Wireless pulmonary artery haemodynamic monitoring in chronic heart failure: a randomised controlled trial . The Lancet . 2011 ; 377 : 658 – 666 . OpenUrl 4. ↵ Mascherbauer J , Zotter-Tufaro C , Duca F , Binder C , Koschutnik M , Kammerlander AA , Aschauer S , Bonderman D . Wedge pressure rather than left ventricular end-diastolic pressure predicts outcome in heart failure with preserved ejection fraction . JACC: Heart Failure . 2017 ; 5 : 795 – 801 . OpenUrl PubMed 5. ↵ Little WC , Oh JK . Echocardiographic evaluation of diastolic function can be used to guide clinical care . Circulation . 2009 ; 120 : 802 – 809 . OpenUrl FREE Full Text 6. ↵ Shah MR , Hasselblad V , Stinnett SS , Gheorghiade M , Swedberg K , Califf RM , O’Connor CM . Hemodynamic profiles of advanced heart failure: association with clinical characteristics and long-term outcomes . Journal of cardiac failure . 2001 ; 7 : 105 – 113 . OpenUrl CrossRef PubMed Web of Science 7. ↵ Mitter SS , Shah SJ , Thomas JD . A test in context: E/A and E/e′ to assess diastolic dysfunction and LV filling pressure . Journal of the American College of Cardiology . 2017 ; 69 : 1451 – 1464 . OpenUrl FREE Full Text 8. ↵ Ommen SR , Nishimura RA , Appleton CP , Miller F , Oh JK , Redfield MM , Tajik A . Clinical utility of Doppler echocardiography and tissue Doppler imaging in the estimation of left ventricular filling pressures: a comparative simultaneous Doppler-catheterization study . Circulation . 2000 ; 102 : 1788 – 1794 . OpenUrl Abstract / FREE Full Text 9. ↵ van de Bovenkamp AA , Enait V , de Man FS , Oosterveer FT , Bogaard HJ , Vonk Noordegraaf A , van Rossum AC , Handoko ML . Validation of the 2016 ASE/EACVI guideline for diastolic dysfunction in patients with unexplained dyspnea and a preserved left ventricular ejection fraction . Journal of the American Heart Association . 2021 ; 10 : e021165 . OpenUrl PubMed 10. ↵ Almeida JG , Fontes-Carvalho R , Sampaio F , Ribeiro J , Bettencourt P , Flachskampf FA , Leite-Moreira A , Azevedo A . Impact of the 2016 ASE/EACVI recommendations on the prevalence of diastolic dysfunction in the general population . European Heart Journal-Cardiovascular Imaging . 2018 ; 19 : 380 – 386 . OpenUrl 11. ↵ Kwon J-m , Cho Y , Jeon K-H , Cho S , Kim K-H , Baek SD , Jeung S , Park J , Oh B-H . A deep learning algorithm to detect anaemia with ECGs: a retrospective, multicentre study . The Lancet Digital Health . 2020 ; 2 : e358 – e367 . OpenUrl 12. ↵ Lee E , Ito S , Miranda WR , Lopez-Jimenez F , Kane GC , Asirvatham SJ , Noseworthy PA , Friedman PA , Carter RE , Borlaug BA . Artificial intelligence-enabled ECG for left ventricular diastolic function and filling pressure. npj Digital Medicine . 2024 ; 7 : 4 . OpenUrl PubMed 13. ↵ Kwon J-m , Kim K-H , Eisen HJ , Cho Y , Jeon K-H , Lee SY , Park J , Oh B-H . Artificial intelligence assessment for early detection of heart failure with preserved ejection fraction based on electrocardiographic features . European Heart Journal-Digital Health . 2021 ; 2 : 106 – 116 . OpenUrl 14. Ko W-Y , Siontis KC , Attia ZI , Carter RE , Kapa S , Ommen SR , Demuth SJ , Ackerman MJ , Gersh BJ , Arruda-Olson AM . Detection of hypertrophic cardiomyopathy using a convolutional neural network-enabled electrocardiogram . Journal of the American College of Cardiology . 2020 ; 75 : 722 – 733 . OpenUrl FREE Full Text 15. ↵ Schlesinger DE , Diamant N , Raghu A , Reinertsen E , Young K , Batra P , Pomerantsev E , Stultz CM . A deep learning model for inferring elevated pulmonary capillary wedge pressures from the 12-lead electrocardiogram . JACC: Advances . 2022 ; 1 : 100003 . OpenUrl PubMed 16. ↵ Davis J , Goadrich M . The relationship between Precision-Recall and ROC curves . Paper/Poster presented at: Proceedings of the 23rd international conference on Machine learning ; 2006 ; 17. ↵ Rolnick D , Veit A , Belongie S , Shavit N . Deep learning is robust to massive label noise . arXiv preprint arXiv:170510694. 2017 . 18. ↵ Krause J , Gulshan V , Rahimy E , Karth P , Widner K , Corrado GS , Peng L , Webster DR . Grader variability and the importance of reference standards for evaluating machine learning models for diabetic retinopathy . Ophthalmology . 2018 ; 125 : 1264 – 1272 . OpenUrl CrossRef PubMed 19. ↵ Gulshan V , Peng L , Coram M , Stumpe MC , Wu D , Narayanaswamy A , Venugopalan S , Widner K , Madams T , Cuadros J. Development and validation of a deep learning algorithm for detection of diabetic retinopathy in retinal fundus photographs . jama . 2016 ; 316 : 2402 – 2410 . OpenUrl CrossRef PubMed 20. ↵ Abazeed M . Walking the tightrope of artificial intelligence guidelines in clinical practice . The Lancet Digital Health . 2019 : PE100 . 21. ↵ Shah AM , Claggett B , Sweitzer NK , Shah SJ , Deswal A , Anand IS , Fleg JL , Pitt B , Pfeffer MA , Solomon SD . Prognostic importance of changes in cardiac structure and function in heart failure with preserved ejection fraction and the impact of spironolactone . Circulation: Heart Failure . 2015 ; 8 : 1052 – 1058 . OpenUrl Abstract / FREE Full Text 22. ↵ Unzek S , Popovic Z , Marwick T . Diastolic Guidelines Concordance I . Effect of recommendations on interobserver consistency of diastolic function evaluation JACC Cardiovasc Imaging . 2011 ; 4 : 460 – 467 . OpenUrl PubMed 23. ↵ Lim J , Lee HS , Han GI , Kang S , Jang J-H , Jo Y-Y , Son JM , Lee MS , Kwon J-M , Lee S-P . Artificial intelligence-enhanced six-lead portable electrocardiogram device for detecting left ventricular systolic dysfunction: a prospective single-centre cohort study . European Heart Journal-Digital Health . 2025 ; 6 : 476 – 485 . OpenUrl 24. ↵ Raghu A , Schlesinger D , Pomerantsev E , Devireddy S , Shah P , Garasic J , Guttag J , Stultz CM . ECG-guided non-invasive estimation of pulmonary congestion in patients with heart failure . Scientific Reports . 2023 ; 13 : 3923 . OpenUrl PubMed 25. ↵ Mullens W , Borowski AG , Curtin RJ , Thomas JD , Tang W . Tissue Doppler imaging in the estimation of intracardiac filling pressure in decompensated patients with advanced systolic heart failure . Circulation . 2009 ; 119 : 62 – 70 . OpenUrl Abstract / FREE Full Text 26. ↵ Al-Omari MA , Finstuen J , Appleton CP , Barnes ME , Tsang TS . Echocardiographic assessment of left ventricular diastolic function and filling pressure in atrial fibrillation . The American journal of cardiology . 2008 ; 101 : 1759 – 1765 . OpenUrl CrossRef PubMed Web of Science 27. ↵ Nohria A , Tsang SW , Fang JC , Lewis EF , Jarcho JA , Mudge GH , Stevenson LW . Clinical assessment identifies hemodynamic profiles that predict outcomes in patients admitted with heart failure . Journal of the American College of Cardiology . 2003 ; 41 : 1797 – 1804 . OpenUrl FREE Full Text 28. ↵ Oh JK , Miranda WR , Bird JG , Kane GC , Nagueh SF . The 2016 diastolic function guideline: is it already time to revisit or revise them? JACC: Cardiovascular Imaging . 2020 ; 13 : 327 – 335 . OpenUrl View the discussion thread. Back to top Previous Next Posted October 07, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Artificial Intelligence-Enabled Electrocardiogram for Elevated Left Ventricular Filling Pressure Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Artificial Intelligence-Enabled Electrocardiogram for Elevated Left Ventricular Filling Pressure Jaehyun Lim , Min Sung Lee , Jung Ho Suh , Sora Kang , Hak Seung Lee , Jong-Hwan Jang , Jeong Min Son , Joon-Myoung Kwon , Yong-Jin Kim , Kyung-Hee Kim , Seung-Pyo Lee medRxiv 2025.10.03.25337299; doi: https://doi.org/10.1101/2025.10.03.25337299 Share This Article: Copy Citation Tools Artificial Intelligence-Enabled Electrocardiogram for Elevated Left Ventricular Filling Pressure Jaehyun Lim , Min Sung Lee , Jung Ho Suh , Sora Kang , Hak Seung Lee , Jong-Hwan Jang , Jeong Min Son , Joon-Myoung Kwon , Yong-Jin Kim , Kyung-Hee Kim , Seung-Pyo Lee medRxiv 2025.10.03.25337299; doi: https://doi.org/10.1101/2025.10.03.25337299 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Cardiovascular Medicine Subject Areas All Articles Addiction Medicine (569) Allergy and Immunology (863) Anesthesia (300) Cardiovascular Medicine (4442) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1510) Epidemiology (15230) Forensic Medicine (30) Gastroenterology (1126) Genetic and Genomic Medicine (6609) Geriatric Medicine (668) Health Economics (998) Health Informatics (4542) Health Policy (1370) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1266) Infectious Diseases (except HIV/AIDS) (15923) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (147) Nephrology (668) Neurology (6607) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1146) Occupational and Environmental Health (957) Oncology (3337) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (664) Pediatrics (1693) Pharmacology and Therapeutics (692) Primary Care Research (712) Psychiatry and Clinical Psychology (5448) Public and Global Health (9237) Radiology and Imaging (2202) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (596) Sexual and Reproductive Health (714) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a01976592cca58f4',t:'MTc3OTc2MzcyMQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.