Full text
64,153 characters
· extracted from
preprint-html
· click to expand
Multimodal Electronic Health Record Foundation Models with Electrocardiogram for Cardiovascular Disease Prediction | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Multimodal Electronic Health Record Foundation Models with Electrocardiogram for Cardiovascular Disease Prediction View ORCID Profile Junmo Kim , Young-Kwan Kim , Kwangsoo Kim doi: https://doi.org/10.1101/2025.11.10.25339886 Junmo Kim 1 Interdisciplinary Program in Bioengineering, Seoul National University , Seoul, Republic of Korea Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Junmo Kim Young-Kwan Kim 2 Cardiovascular Center, Seoul National University Hospital , Seoul, Republic of Korea Find this author on Google Scholar Find this author on PubMed Search for this author on this site Kwangsoo Kim 3 Department of Transdisciplinary Medicine, Institute of Convergence Medicine with Innovative Technology, Seoul National University Hospital 4 Department of Clinical Medical Sciences, College of Medicine, Seoul National University , Seoul, Republic of Korea 5 Center for Data Science, Healthcare AI Research Institute, Seoul National University Hospital Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: kwangsookim{at}snu.ac.kr Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Electronic health record (EHR) foundation models (FMs) have improved clinical task performance by learning comprehensive clinical context from sequential medical records called patient trajectories. However, existing multimodal approaches generate representations separately for each modality and integrate them only at the final prediction stage, without capturing temporal relationships across data types. Here, we propose TRIM, text-based representations for integrated multimodal trajectories, which converts unstructured data into text-based representations via their diagnostic reports and integrates them directly into patient trajectories. This enables EHR FMs to simultaneously analyze structured and unstructured longitudinal data while preserving temporal context. To develop and evaluate TRIM, we trained EHR FMs with electrocardiogram data to predict cardiovascular diseases (CVDs). TRIM-integrated EHR FMs improved overall CVD prediction performance. Model interpretation revealed that models prioritized ECG diagnostic information, focusing on clinically established risk factors. Survival analysis validated model decisions, with TRIM integration consistently increasing hazard ratios. TRIM provides a generalizable framework for integrating multimodal medical data into EHR FMs. Introduction With the availability of large structured electronic health record (EHR) datasets 1 , 2 , EHR foundation models (FMs) have emerged to enhance the performance of diverse clinical tasks 3 – 6 . EHR FMs are trained on patient trajectories, which are patient-level sequential medical codes extracted from EHR databases. As each patient trajectory corresponds to a natural language sentence, EHR FMs have followed the paradigms of natural language processing. By utilizing entire patient medical histories rather than specific curated variables, EHR FMs learn comprehensive medical contexts to fulfill given clinical tasks, such as predicting patient outcomes 3 , 7 , simulating patient status 6 , and synthesizing EHR data 8 . Despite current advances in EHR FMs, only a few studies have utilized multiple data modalities with EHR FMs. Mataraso et al. proposed Clinical and Omics Multimodal analysis Enhanced with Transfer learning (COMET) 9 . COMET complemented the data scarcity of omics data by integrating EHR FM representations that contain information from many more patients. Soenksen et al. proposed the Holistic Artificial Intelligence in Medicine (HAIM) framework to leverage multimodal inputs 10 . HAIM concatenated multimodal representations generated from respective pretrained models to construct final integrated inputs for clinical tasks. While many other studies have utilized structured EHR data with unstructured data, EHR FMs have been rarely used. Although COMET and HAIM achieved improved performance on diverse clinical tasks, they generated representations from EHR and non-EHR data separately and integrated them at the final stage. This approach does not capture the temporal relationships between medical codes and other modalities throughout the patient timeline. In this study, we propose text-based representations for integrated multimodal trajectories (TRIM), to integrate unstructured data into patient trajectories for EHR FMs. The motivation behind TRIM is that most unstructured medical data, such as electrocardiogram (ECG), chest X-ray (CXR), and computed tomography (CT), are accompanied by textual reports written by machines or clinicians. Inspired by MedRep 11 , which provides a representation for each medical concept (code) using free-text descriptions, we integrated text-based representations of unstructured data into original patient trajectories by generating MedRep-style representations from the textual reports of the unstructured data. In this way, EHR FMs can simultaneously analyze the comprehensive context of structured and unstructured longitudinal data while considering time intervals between records. To develop and evaluate TRIM, we trained EHR FMs with ECG data to predict the first occurrence of cardiovascular diseases (CVDs), including heart failure (HF), ischemic heart disease (IHD), coronary artery disease (CAD), and stroke, to contribute to the prevention and early-management of CVDs. Outcomes that can be directly diagnosed from ECGs (e.g., arrhythmia and atrial fibrillation) were excluded to effectively evaluate the impact of integrated unstructured data, thereby preventing the models from excessively relying on raw ECG signals. We used EHR and ECG data from one publicly available dataset, MIMIC-IV 12 , and one private dataset from Seoul National University Hospital, a tertiary hospital in the Republic of Korea. The results demonstrate that leveraging TRIM-style ECG records enhances CVD prediction performance and that EHR FMs focus more on integrated ECG data rather than original EHR records when making decisions. Results In this study, we proposed a multimodal EHR FM framework to predict four CVDs (HF, IHD, CAD, and stroke) within one year after ECG measurement through a multilabel classification approach ( Fig. 1a ). We defined the prediction timepoint (index date) as the last ECG measurement before the first CVD occurrence for the CVD group, with a one-month washout period to exclude imminent events. For the non-CVD group, the prediction timepoint (index date) was the last ECG measurement, and patients were included only if they had at least one visit record more than one year later (follow-up period). TRIM representations were generated by LLM-enriched ECG diagnosis descriptions and the text-based representation generator of MedRep ( Figs. 1b - 1c ). In the CVD prediction process ( Fig. 1d ), each ECG record was converted into a TRIM representation and integrated into the patient trajectory alongside EHR records. An EHR FM generated “trajectory representations” from these integrated trajectories, while an ECG encoder generated “ECG representations” from raw ECG signals of the last ECG measurement. These trajectory and ECG representations were processed through separate linear layers for independent and combined modalities, then concatenated and passed through a final prediction head. Download figure Open in new tab Fig 1. Implementation process for CVD prediction using multimodal EHR FMs with TRIM. a, Prediction timepoint definition for CVD and non-CVD groups. b , Text-based representation generation process of medical concepts in EHR. Each phrase-level concept name is enriched with LLM-generated descriptions. c , Text-based representation generation process of phrase-level ECG diagnoses (TRIM). TRIM representations were generated by LLM-enriched ECG diagnosis descriptions and a small language model trained on medical concept descriptions. d , CVD prediction process with representation-based EHR FMs, TRIM, and raw ECG signals. Representations generated by EHR FM and ECG encoder are integrated to predict CVDs. Baseline characteristics For both MIMIC-IV and SNUH datasets, we used 85% of data for pretraining and 15% for finetuning ( Table 1 ). Of the 257,992 patients in MIMIC-IV and 39,128 patients in SNUH, we allocated 219,293 and 33,258 patients to the pretraining dataset, and 38,699 and 5,870 patients to the finetuning dataset, respectively. Age, sex, and outcome distributions were significantly different between datasets (all p<0.0001). HF (7.37% vs.4.16%) and CAD (10.68% vs. 6.21%) incidence was higher in MIMIC-IV, while IHD (1.55% vs. 4.52%) and stroke (2.06% vs. 3.43%) was higher in SNUH. Although MIMIC-IV contained more patients overall, SNUH showed higher patient data density, with more visits, EHR records, and ECG records per patient, as well as more unique ECG diagnoses. View this table: View inline View popup Download powerpoint Table 1. Baseline characteristics of finetuning datasets. TRIM representation analysis We first examined how well ECG records from ECG and EHR systems were aligned ( Fig. 2a ). For MIMIC-IV, only 3,030 records overlapped, among 117,345 records from the ECG system and 4,071 records from the EHR system. For SNUH, 33,620 records were recorded in both ECG and EHR systems, while 35,544 records from the ECG system and 6,329 records from the EHR system did not overlap. These results indicate that ECG measurements are not routinely recorded in the EHR system, and the ECG system may also miss records. Therefore, integrating records from the ECG system into patient trajectories could enhance the validity of multimodal EHR FM research. Download figure Open in new tab Fig 2. Overview of TRIM-style ECG representations. a , Venn diagram of ECG records in ECG and EHR systems. Larger overlapping area indicates better reflection of ECG records in the EHR system. b , UMAP visualization of CVD and non-CVD EHR concept representations and TRIM-style ECG representations of the MIMIC-IV dataset. To enhance visibility given the low proportion of CVD concepts, their corresponding points were displayed 50 times darker than other representations. c , UMAP visualization of CVD and non-CVD concept representations and TRIM-style ECG representations of the SNUH dataset. To enhance visibility given the low proportion of CVD concepts, their corresponding points were displayed 50 times darker than other representations. d , UMAP visualization of TRIM-style ECG representations of the MIMIC-IV and SNUH datasets. e , Boxplots of cosine similarity to CVD concepts for non-CVD EHR concept representations and TRIM-style ECG representations. Next, we analyzed the characteristics of TRIM representations through UMAP visualization 13 . In MIMIC-IV, CVD concept representations formed a clear cluster, and TRIM representations were closely located within this cluster, as shown in the shaded region in Fig. 2b . However, TRIM representations were not fully covered by CVD concept representations, demonstrating their distinctiveness and diversity. In contrast, non-CVD concept representations were widely scattered without specific patterns. In SNUH, CVD concept representations did not form a distinct cluster, but TRIM representations were closely located with them, as shown in the shaded regions in Fig. 2c . Compared to MIMIC-IV, SNUH TRIM representations formed clearer clusters, demonstrating less diversity. Non-CVD concept representations were also widely scattered without specific patterns, similar to MIMIC-IV. Since TRIM representations were generated from ECG diagnosis descriptions, they inherently contained cardiovascular information, explaining their proximity to CVD concept representations in both datasets. TRIM representations from MIMIC-IV and SNUH formed separate, non-overlapping clusters ( Fig. 2d ), reflecting differences in the reporting practices of ECG systems. MIMIC-IV TRIM representations showed a scattered pattern with only several small clusters, while SNUH TRIM representations formed several large, distinct clusters. Despite thousands of unique ECG diagnoses in each dataset, only a few major clusters were observed, indicating common reporting patterns of cardiovascular conditions. Nevertheless, many irregularly scattered representations existed outside these clusters, reflecting diverse or rare ECG findings. Quantitatively, cosine similarity to CVD concepts was also higher for TRIM representations than for non-CVD concept representations across both datasets, consistent with the UMAP visualization patterns ( Fig. 2e ). CVD prediction performance evaluation We evaluated CVD prediction performance on seven models: (1) raw ECG model 14 , (2) EHR FM 15 , (3) EHR FM with raw ECG signals, (4) MedRep-based EHR FM, (5) MedRep-based EHR FM with raw ECG signals, (6) MedRep-based EHR FM with TRIM, and (7) MedRep-based EHR FM with TRIM and raw ECG signals ( Table 2 ). For evaluation metrics, we used macro area under the receiver operating characteristic curve (AUROC), macro area under the precision-recall curve (AUPRC), and macro F1-score. The MedRep-based EHR FM with TRIM and raw ECG signals achieved the best performance across both datasets and all metrics with AUROC of 0.729, AUPRC of 0.159, and F1-score of 0.190 in MIMIC-IV, and AUROC of 0.764, AUPRC of 0.204, and F1-score of 0.216 in SNUH. The adoption of TRIM improved overall predictive performance for both models with and without raw ECG signals, across both datasets. MedRep representations substantially improved performance compared to the baseline EHR FM, and adding TRIM further enhanced predictive accuracy beyond MedRep alone, demonstrating the complementary value of structured ECG diagnostic information. Disease-specific prediction performance for each CVD is summarized in Supplementary Tables 1 - 4 . The models with TRIM achieved the best performance across all metrics for all CVDs, except for the IHD cohort in MIMIC-IV. View this table: View inline View popup Download powerpoint Table 2. CVD prediction performance. Experiments were performed with five random seeds and all values are shown as mean ± SD. Model interpretation of the MIMIC-IV dataset In this section, we first explore which components of the model mainly affected model decisions. We conducted a cross-modal correlation analysis between trajectory and ECG representations—the output vectors from EHR FM and ECG encoder ( Fig. 1d )—by calculating the Pearson correlation coefficient (PCC) between all pairs of their 768 latent dimensions ( Fig. 3a ) 9 . The EHR FMs with TRIM exhibited more significant correlations than those without TRIM, with 223,328 (15.20%) and 119,856 (8.16%) significant correlations among out of 1,472,640 total dimension pairs (5 seeds × 768(768-1)/2 pairs), respectively, at p<0.01. This increase in cross-modal connections demonstrates that TRIM integration encourages better semantic alignment between trajectory and ECG representations, which may contribute to the improved and stable performance observed consistently across CVDs and datasets 9 . Download figure Open in new tab Fig. 3. Model interpretation of the MIMIC-IV dataset. a , Cross-modal correlation analysis between trajectory and ECG representations. Lines represent statistically significant correlations (p<0.01). b , SHAP value distributions for trajectory and ECG representations. c , Attention score distributions for EHR concepts and TRIM within patient trajectories. d , Top 20 EHR concepts with the highest average attention scores. e , Top 20 TRIM records with the highest average attention scores. To measure the impact of each latent representation on model decisions, we compared the SHAP values 16 of trajectory and ECG representations ( Fig. 3b ). Both models with and without TRIM demonstrated that ECG representations had limited impact on predictions, with SHAP values concentrated near zero. In contrast, trajectory representation showed larger SHAP value distributions, indicating their dominant role in model decisions. Notably, the models with TRIM exhibited a wider SHAP value distribution for trajectory representations compared to those without TRIM, suggesting that TRIM integration amplified the influence of patient trajectory information on model predictions. While the combination of ECG and EHR improved overall performance, model decisions were predominantly driven by trajectory representations, as raw ECG signals alone were insufficient for accurate CVD prediction ( Table 2 ). In addition to latent space analysis, we explored attention scores within patient trajectories, as attention scores can reflect the importance of each record 15 , 17 . For both models with and without raw ECG signals, the attention scores for TRIM records were substantially higher than those for EHR concepts, indicating that ECG diagnosis descriptions integrated into patient trajectories played a more dominant role in the feature selection process of EHR FMs ( Fig. 3c ). To examine which ECG diagnoses were influential in predicting CVDs, we reported the top 20 EHR concepts and TRIM records with the highest attention scores ( Figs. 3d - 3e ). For EHR concepts, obstructive sleep apnea syndrome (OSA), which has close relationship with CVDs 18 , 19 , had the highest average attention score ( Fig. 3d ). Syncope and collapse 20 , 21 , obesity 22 , 23 , chronic obstructive lung disease (COPD) 24 , and acquired hypothyroidism 25 have also been reported as risk factors for CVDs. Hypokalemia 26 and iron deficiency anemia 27 are risk factors of HF, and chest pain is a primary symptom of myocardial infarction (MI). Low back pain, osteoporosis, and benign prostatic hyperplasia without outflow obstruction are associated with older age and share common risk factors with CVDs; however, their direct relation to CVDs remains unclear. Among TRIM records, premature ventricular complex (PVC), which is highly associated with HF and IHD 28 , 29 , had the highest attention score ( Fig. 3e ). Ischemia-related ST-T changes 30 , left atrial abnormality 31 , and ventricular hypertrophy-related changes 32 are closely related to IHD, atrial fibrillation (AF), and HF, respectively. While the most frequent ECG diagnoses in the dataset were simple statements such as “Abnormal ECG”, “Sinus rhythm”, “Borderline ECG”, and “Normal ECG”, these diagnoses were not represented in the top 20 TRIM records. This result indicates that the model focused more on specific ECG conditions with clinical significance rather than generic diagnostic statements. Model interpretation of the SNUH dataset Similar to MIMIC-IV, more significant correlations were observed in the EHR FMs with TRIM than those without TRIM, with 110,006 (7.47%) and 88,664 (6.02%) significant correlations, respectively ( Fig. 4a ). SHAP value distributions of trajectory and ECG representations also showed similar patterns to those of MIMIC-IV, although the distribution of trajectory representations in the models with TRIM was only slightly broader than those without TRIM compared to the MIMIC-IV result ( Fig. 4b ). The attention scores for TRIM records were also higher than those for EHR concepts across both models with and without raw ECG signals ( Fig. 4c ). Download figure Open in new tab Fig. 4. Model interpretation of the SNUH cohort. a , Cross-modal correlation analysis between trajectory and ECG representations. Lines represent statistically significant correlations (p<0.01). b , SHAP value distributions for trajectory and ECG representations. c , Attention score distributions for EHR concepts and TRIM within patient trajectories. d , Top 20 EHR concepts with the highest attention scores. e , Top 20 TRIM records with the highest attention scores. For the top 20 EHR concepts, polyneuropathy due to diabetes mellitus, which is a major risk factor for CVD 33 , received the highest average attention score ( Fig. 4d ). Dyspnea is a cardinal symptom of HF and CAD 34 , while cerebral ischemia and carotid artery stenosis are primary risk factors for stroke. Several medications for CVD prevention and treatment were also included in the top 20. These drugs, including nitroglycerin 35 , metoprolol tartrate 36 , fimasartan potassium 37 , candesartan cilexetil 38 , pravastatin 39 , and telmisartan 40 , are used for CVD management, whereas lafutidine is a gastric acid suppressant. Benign prostatic hyperplasia and chest pain were common to both MIMIC-IV and SNUH. In contrast to MIMIC-IV, SNUH models focused more on stroke-related concepts and medication records regarding CVD management, while MIMIC-IV did not include any drug concept in the top 20. Unlike the MIMIC-IV dataset, the top 20 TRIM records in SNUH included “Normal ECG” and “Normal sinus rhythm” ( Fig. 4e ). This was because 48.64% of MIMIC-IV trajectories contained these records, while only 1.52% of SNUH trajectories included them. Thus, the presence of “Normal ECG” and “Normal sinus rhythm” records represented distinctive features in SNUH, whereas MIMIC-IV models recognized them as common features. Similarly, “Borderline ECG” appeared in 53.18% of MIMIC-IV trajectories, but only in 17.69% of SNUH trajectories. Although “Abnormal ECG” was the most frequent ECG diagnosis in SNUH, it was not included in the top 20, similar to MIMIC-IV. This suggests that SNUH models also focused more on specific ECG conditions than generic diagnostic statements. Besides these generic records, several specific diagnoses, including septal infarct 30 , anterior infarct 41 , left ventricular hypertrophy (LVH) 32 , sinus bradycardia 42 , sinus tachycardia 43 , and left axis deviation 44 , were included, all of which are established indicators of CVD risk. Survival analysis for model decision validation We conducted survival analysis to validate model decisions by fitting Cox proportional hazard (CPH) models, adjusted for age and sex, that regressed each CVD outcome (HF, IHD, CAD, and stroke) on model decisions ( Figs. 5 - 6 ). Patients were classified into positive and negative groups based on thresholds determined by Youden’s index 45 , and Nelson-Aalen cumulative hazard curves were constructed for each CVD. Across all CVDs and models in both datasets, the gap between positive and negative groups increased proportionally over time, supporting the proportional hazards assumption. For models with raw ECG signals, TRIM integration generally widened the gap between risk groups ( Figs. 5a and 6a ). Models without raw ECG signals also exhibited a larger gap with TRIM, except for the IHD cohort in MIMIC-IV and the IHD and stroke cohorts in SNUH ( Figs. 5c and 6c ). In all cases, hazard ratios (HRs) of model decisions were statistically significant ( Figs. 5b , 5d , 6b , and 6d ). Notably, HRs consistently increased with TRIM integration, demonstrating stronger associations between positive predictions and actual CVD occurrence. All adjusted HRs for CVDs are summarized in Supplementary Tables 5 - 6 . Download figure Open in new tab Fig. 5. Survival analysis comparing models with and without TRIM on the MIMIC-IV dataset. a , Nelson-Aalen cumulative hazard curves for four CVDs in the models with raw ECG signals. b , Forest plot for HRs of the model decision with raw ECG signals, adjusted for age and sex. c , Nelson-Aalen cumulative hazard curves for four CVDs in the models without raw ECG signals. d , Forest plot for HRs of the model decision without raw ECG signals, adjusted for age and sex. Download figure Open in new tab Fig. 6. Survival analysis comparing models with and without TRIM on the SNUH dataset. a , Nelson-Aalen cumulative hazard curves for four CVDs in the models with raw ECG signals. b , Forest plot for HRs of the model decision with raw ECG signals, adjusted for age and sex. c , Nelson-Aalen cumulative hazard curves for four CVDs in the models without raw ECG signals. d , Forest plot for HRs of the model decision without raw ECG signals, adjusted for age and sex. Discussion In this study, we proposed TRIM, a novel strategy for integrating unstructured medical data (e.g., ECG, CXR, CT) into EHR-based patient trajectories for multimodal EHR FMs. TRIM was motivated by two key observations: First, EHR FMs adopting text-based representations have achieved superior performance compared to traditional token-based models 11 . Second, unstructured medical data are typically accompanied by free-text diagnostic reports written by clinicians or automated systems. Leveraging this, we generated representations for unstructured data using their corresponding reports and MedRep’s text-based representation generator, thereby creating MedRep-style representations for ECG records that could be seamlessly integrated into patient trajectories. TRIM addresses critical limitations of prior multimodal EHR FM frameworks. Previous studies (e.g., COMET 9 and HAIM 10 ) generated representations for each modality separately and integrated them only at the final prediction stage. This approach could not consider temporal relationships between different data types throughout the patient timeline. On the other hand, representing multiple unstructured data points may have computational challenges—in this study, each EHR record was a 768-dimensional vector, while a single ECG comprised 60,000-dimensional (12 lead × 500 Hz × 10 seconds). The lack of standardized methods for processing longitudinal unstructured data further limits the reliability of such approaches. Even when constructing unstructured data representations is possible, integrating them into EHR-based trajectories remains challenging due to semantic incompatibility across modalities. By converting unstructured data into compatible representations through MedRep’s text-based representation generator, TRIM representations aligned with related EHR concept representations ( Fig. 2b - 2c, 2e ) and enabled EHR FMs to simultaneously analyze longitudinal structured and unstructured data while considering the time intervals between all records. We demonstrated the effectiveness of TRIM through comprehensive quantitative analyses (performance evaluation and survival analysis) and qualitative assessments (representation analysis and model interpretation). While the models with TRIM and raw ECG signals achieved the best overall performance, the models with only TRIM showed the second-best performance with AUROC of 0.711, AUPRC of 0.150, F1-score of 0.186 in MIMIC-IV and AUROC of 0.742, AUPRC of 0.198, and F1-score of 0.209 in SNUH ( Table 2 ). This result demonstrates that directly integrating longitudinal unstructured data into patient trajectories without requiring complex signal processing is more effective than integrating modality-specific representations at the final prediction stage (EHR FM with raw ECG signals and without TRIM). Furthermore, the combination of TRIM with raw ECG signals exhibited synergistic effects, suggesting that TRIM representations and signal features provide complementary information for CVD prediction. The interpretability of TRIM-integrated models offers significant advantages for clinical practice. Our model identified clinically established risk factors for CVDs, demonstrating strong alignment with existing literature and clinical knowledge. This is essential for using artificial intelligence (AI) models in clinical practice because physicians are more inclined to trust and implement AI systems if they perceive the results as being more explainable or comprehensible 46 . Our approach, which integrates ECG records into patient trajectories, can provide clinicians with additional information to trace meaningful cardiovascular findings. The higher attention scores for TRIM records compared to EHR concepts ( Figs. 3c and 4c ) validate that the model properly selected cardiovascular-specific information when making decisions. Moreover, the cross-modal correlation analysis revealed that TRIM integration enhanced semantic alignment between trajectory and ECG representations ( Figs. 3a and 4a ), suggesting that our models made stable and enhanced decisions fully utilizing different data types. The survival analysis validated the clinical utility of model predictions. Since we designed the model to predict CVDs within one year after the index date, the Nelson-Aalen curves exhibited steep slopes until around 365 days across all CVDs and models ( Figs. 5a , 5c , 6a , 6c ), yet the curves continued to show monotonically increasing gaps between CVD and non-CVD groups even after the monitoring period. This implies that long-term CVD risk can be assessed through our model and that patients currently without CVDs but predicted to develop them can be provided with proper lifestyle modifications and medical interventions to prevent the development of CVDs. Moreover, the higher HRs observed in the models with TRIM provide clinicians with greater confidence in implementing preventive interventions for high-risk patients identified by the model. It is notable that TRIM can be applied to other modalities beyond ECG, since most medical images, including CXR, CT, and MRI, are accompanied by free-text radiology reports written by radiologists 47 . Additionally, there are many other unstructured medical data types accompanied by textual descriptions, including nursing notes, endoscopy reports, and echocardiogram reports 48 . In particular, the file size of medical images is usually much larger than ECG signals (e.g., a single chest CT scan can exceed 100 MB), making direct integration computationally challenging. However, the textual reports or metadata associated with these images are readily accessible. Although such metadata could be integrated into an EHR database, unstructured data and EHR records are often not compatible due to different management systems, as demonstrated in Fig. 2a . Therefore, TRIM provides an optimal solution for integrating longitudinal unstructured medical data with structured EHR records, enabling EHR FMs to achieve a more comprehensive understanding of patient trajectories. Despite their cardiovascular relevance, the target CVDs (HF, IHD, CAD, and stroke) are not directly diagnosed by ECGs alone, and the definitive diagnostic process is associated with substantial costs: HF diagnosis requires comprehensive evaluation through echocardiography, the gold standard for assessing left ventricular function and structural abnormalities, with the median prices ranging from $204 to $2,588 49 . For IHD and CAD, diagnosis typically involves coronary angiography or CT angiography, with median costs ranging from $2,868 to $9,203 for coronary angiography 49 . Stroke diagnosis requires emergency brain imaging, predominantly through CT or MRI, with aggregate costs of post-emergency department diagnostic evaluation around $2,000 50 . As these processes entail significant economic burdens, reducing unnecessary testing and promoting the use of diagnostic evaluations in clearly indicated cases is essential. Since ECG testing costs are relatively lower than the above tests and range from $50 to $300 for standard 12-lead recordings in primary care settings, leveraging routinely collected ECG and EHR data for CVD risk stratification offers a cost-effective screening approach. Rather than requiring expensive diagnostic imaging as an initial assessment tool, our approach enables early risk identification using readily available longitudinal data, potentially reserving advanced imaging modalities for high-risk patients. This risk-stratified diagnostic paradigm could reduce healthcare expenditures, addressing the growing economic burden of cardiovascular imaging 50 . This study has several limitations. First, we only used ECG for unstructured medical data. This choice was intentional to effectively evaluate TRIM by incorporating a target-related modality (ECG for CVD prediction). Future work should explore other modalities such as CXR and CT to further investigate more complex multimodal EHR FMs across diverse clinical outcomes. Second, while the original MedRep includes relational information between concepts, we only used a graph-free version containing textual information only, because integrating ECG records into the graph ontology of medical concepts was not feasible. Future research should investigate methods to fully utilize the relational information included in the original MedRep for enhanced representation learning. Third, we used a single ECG raw signal from the last measurement. As raw signals contain more detailed information than the metadata used for TRIM, strategies for merging longitudinal raw signal data and free-text diagnoses need to be explored. Fourth, we constructed TRIM at the diagnosis-level rather than the record-level. Most ECG records consisted of multiple diagnoses like “Normal ECG” and “Normal sinus rhythm”, or “Sinus rhythm” and “Left axis deviation”. This study treated these multiple diagnoses as attached but separate tokens, but record-level TRIM may capture more detailed diagnostic patterns. Methods Data curation This study used data from 257,992 and 39,128 adult patients aged over 18 years from MIMIC-IV and SNUH, respectively. For SNUH, we randomly sampled 39,128 patients with at least one ECG record measured in the inpatient ECG room or emergency room to exclude healthy individuals who routinely undergo ECG testing for biennial health checkups in Korea 51 . The data period spanned from 15 October 2004 to 2 February 2024. The MIMIC-IV data period was between 2008 and 2022 12 . Both MIMIC-IV and SNUH datasets were based on the Observational Medical Outcomes Partnership (OMOP) Common Data Model (CDM) format. Since MedRep is based on OMOP format and MIMIC-IV is not originally formatted in OMOP CDM, we converted the original MIMIC-IV into OMOP format using the official OHDSI GitHub repository ( https://github.com/OHDSI/MIMIC ). We used data from 85% of patients for pretraining (70% for training and 15% for validation) and the remaining 15% was used for finetuning with a 6:2:2 ratio for training, validation, and hold-out test sets. Among patients in the finetuning dataset, those without ECG were excluded from MIMIC-IV (SNUH patients were initially selected based on ECG availability, so none were excluded). We then extracted all available past ECG records of these patients, resulting in 117,345 and 69,164 records from MIMIC-IV and SNUH, respectively. We divided patients with ECG records according to CVD record existence. For patients with CVD records, the index date was defined as the date of the last ECG measurement before the first CVD occurrence. Patients whose first CVD did not occur between one month and one year after the index date were excluded (one-month washout period and one-year monitoring period). For patients without CVD records, the index date was defined as the date of the last ECG measurement. To ensure no CVD occurrence within the monitoring period, patients without any visits at least one year after the index date were excluded. For both CVD and non-CVD groups, patients with fewer than 30 EHR records were excluded. Finally, MIMIC-IV contained 1,005 CVD patients and 4,616 non-CVD patients, and SNUH contained 477 and 3,084 patients, respectively. The population flowcharts are shown in Supplementary Figure 1 . The Institutional Review Board (IRB) of Seoul National University Hospital (IRB approval No. 2409-073-1570) approved the study with a waiver of informed consent, considering that our study used retrospective and observational EHR data. The approval aligns with the principles outlined in the Declaration of Helsinki, the Korean Bioethics and Safety Act (Law No. 16372), and the Human Research Protection Program–Standard Operating Procedure of Seoul National University Hospital. Data preprocessing and outcomes Each patient trajectory consisted of integer sequences of medical concept indices, age indices, visit indices, record indices, and domain indices, all sorted in order of time. The maximum trajectory length was set to 2048. Every trajectory started with a [CLS] token, and [SEP] tokens were not used as visit indices already distinguished different visits. Unique ECG diagnoses were added to the original vocabularies of MIMIC-IV and SNUH, and these ECG diagnoses were treated as medical concepts and merged into patient trajectories as shown in Fig. 1d . The vocabulary size was 33,726 (29,864 EHR concepts and 3,862 ECG diagnoses) for MIMIC-IV and 26,704 (21,192 EHR concepts and 5,512 ECG diagnoses) for SNUH. For raw ECG signals, we followed the preprocessing process described in a previous study that used a one-dimensional ResNet-based model for ECG analysis 14 . Specifically, we first applied a fifth-order Butterworth filter with a frequency range between 0.05 and 150 Hz to remove noise and then scaled the filtered signal to range between -1 and 1 for normalization. Missing values were imputed with 0. The dimension of ECG signals in both MIMIC-IV and SNUH was 12 × 5000. For CVD outcomes, we used the ICD-10 taxonomy and converted the codes into OMOP concepts: I50 for HF; I20, I21, and I24 for IHD; I25 for CAD; and I60, I61, and I63 for stroke. OMOP concepts for each CVD are summarized in Supplementary Table 7 . Generating descriptions for ECG diagnoses TRIM representations were generated using LLM-enriched ECG diagnosis descriptions and the text-based representation generator of MedRep. ECG diagnoses are phrase-level, for example, “RBBB with left anterior fascicular block”. These phrase-level diagnoses were enriched through LLMs as shown in Figs. 1b - 1c . Instead of training a new representation generating model, we used the text-based representation generator of MedRep which was trained on descriptions of more than 7 million medical concepts 11 to align new ECG representations with original concept representations. The prompt for ECG diagnosis description was as follows: “Instruction: Briefly explain the clinical background and regarding treatments of each ECG diagnostic report with less than 5 sentences. Do not include sentences that are too ordinary (such as “further details would depend on the specific situation”) and focus on describing the representative clinical features of the concept. If possible, avoid using negation.” Generating descriptions for 9,374 (3,862 from MIMIC-IV and 5,512 from SNUH) unique diagnoses costed $0.95 with ChatGPT-4o-mini (OpenAI Inc). Examples of ECG diagnosis descriptions are provided in Supplementary Table 8 . Model and training details The architecture of the EHR FMs was based on CDM-BERT 15 , which introduces domain embedding to indicate the domain of masked tokens during pretraining, thereby preventing the model from finding unnecessary medical concepts from other domains. We used a 768-dimensional hidden dimension consistent with MedRep, 12 attention layers, and 12 attention heads. For the ECG encoder, we used a one-dimensional ResNet-based model. The detailed configuration of the ECG encoder is summarized in Supplementary Table 9 . For pretraining, we selected the models with the lowest masked language model (MLM) loss during 50-epoch training. The pretraining configuration was as follows: a batch size of 32, a learning rate of 0.00005, and an AdamW optimizer with a weight decay of 0.01. Patient trajectories exceeding the maximum length were sliced into non-overlapping sub-trajectories to avoid potential dependency among trajectories from a single patient. Pretraining was conducted using 8 NVIDIA RTX A6000 GPUs, requiring approximately 18 hours for MIMIC-IV and 12 hours for SNUH. Although SNUH had substantially fewer patients for pretraining than MIMIC-IV (33,258 vs. 219,293), it contained considerably more EHR records per patient (4,934 vs. 541), resulting in many sliced sub-trajectories. Consequently, the training time for SNUH was approximately 67% that of MIMIC-IV. For finetuning, we trained each model for 50 epochs with an early stopping patience of 10 to prevent overfitting. The loss function was binary cross entropy for each target, and early stopping was applied based on the macro AUROC. We conducted finetuning using five random seeds, randomly splitting the data into training, validation, and hold-out test sets. All performance evaluation processes were performed on the hold-out test sets. Each finetuning task was performed with a single NVIDIA RTX A6000 GPU, requiring 1-4 hours per random seed. Model interpretation To explore which components of the model mainly affected model decisions, we conducted a two-fold analysis: latent space analysis and attention score analysis. For latent space analysis, we conducted a cross-modal correlation analysis between trajectory and ECG representations by calculating the PCC between all pairs of their 768 latent dimensions, to evaluate the alignment between these representations. In addition, we calculated SHAP values 16 of trajectory and ECG representations to compare the impact of each latent representation on model decisions. We used an Integrated Gradients-based SHAP implementation 52 (GradientExplainer in the SHAP package) with a background sample size of 100. For attention score analysis, we used the attention vector of each [CLS] token from the last attention layer output and averaged the attention scores for each concept. For qualitative analysis of concepts with high average attention scores, we only included concepts that appeared in more than 100 patients, to avoid rare concepts coincidentally having extremely high attention scores. All model interpretation processes were performed on the hold-out test sets. As we conducted experiments with five random seeds, we reported the results of both latent space analysis and attention score analysis after merging the five results. Statistical analysis Age between the datasets were compared by calculating p-values using the Student’s t-test and sex and CVD incidence ratio between the datasets were compared by chi-squared test. For performance metrics, we used the AUROC, AUPRC, and F1-score, and the confidence intervals (CIs) of the AUROC and AUPRC were calculated using DeLong’s method, and the CIs for F1-score was calculated using Wilson’s method. For survival analysis, CPH models were fitted by Breslow’s method with a penalizer of 0.01. Statistical significance was set at α = 0.05. All statistical analyses were performed using Python (version 3.9.19), and Lifelines (version 0.30.0) in Python was used for survival analysis. Data Availability MIMIC-IV is publicly available upon application for access at https://physionet.org/content/mimiciv/2.2/ . The SNUH dataset is not publicly available due to patient privacy and is available from the corresponding author on reasonable request and IRB approvals. The MedRep dataset is available in our GitHub repository at https://github.com/kicarussays/MedRep . Code Availability The source code used in this study is publicly available at https://github.com/kicarussays/TRIM . Supplementary Materials View this table: View inline View popup Download powerpoint Supplementary Table 1. HF prediction performance. Experiments were performed with five random seeds and all values are shown as mean ± SD. View this table: View inline View popup Download powerpoint Supplementary Table 2. IHD prediction performance. Experiments were performed with five random seeds and all values are shown as mean ± SD. View this table: View inline View popup Download powerpoint Supplementary Table 3. CAD prediction performance. Experiments were performed with five random seeds and all values are shown as mean ± SD. View this table: View inline View popup Download powerpoint Supplementary Table 4. Stroke prediction performance. Experiments were performed with five random seeds and all values are shown as mean ± SD. View this table: View inline View popup Download powerpoint Supplementary Table 5. Adjusted HRs for CVDs (MIMIC-IV). View this table: View inline View popup Download powerpoint Supplementary Table 6. Adjusted HRs for CVDs (SNUH). Download figure Open in new tab Supplementary Figure 1. Population flowchart. View this table: View inline View popup Download powerpoint Supplementary Table 7. OMOP concepts for target outcomes. View this table: View inline View popup Download powerpoint Supplementary Table 8. Example descriptions of ECG diagnoses. View this table: View inline View popup Download powerpoint Supplementary Table 9. Configuration of the model. N and L indicate the batch size and the number of ECG leads. References ↵ Parasrampuria , S. & Henry , J. Hospitals’ use of electronic health records data, 2015–2017 . ONC Data Brief 46 , 13 ( 2019 ). OpenUrl ↵ Liang , J. et al. Adoption of Electronic Health Records (EHRs) in China During the Past 10 Years: Consecutive Survey Data Analysis and Comparison of Sino-American Challenges and Experiences . J Med Internet Res 23 , e24813 ( 2021 ). doi: 10.2196/24813 OpenUrl CrossRef PubMed ↵ Li , Y. et al. BEHRT: Transformer for Electronic Health Records . Scientific Reports 10 , 7155 ( 2020 ). doi: 10.1038/s41598-020-62922-y OpenUrl CrossRef Rasmy , L. , Xiang , Y. , Xie , Z. , Tao , C. & Zhi , D . Med-BERT: pretrained contextualized embeddings on large-scale structured electronic health records for disease prediction . npj Digital Medicine 4 , 86 ( 2021 ). doi: 10.1038/s41746-021-00455-y OpenUrl CrossRef PubMed Yang , Z. , Mitra , A. , Liu , W. , Berlowitz , D. & Yu , H . TransformEHR: transformer-based encoder-decoder generative model to enhance prediction of disease outcomes using electronic health records . Nature Communications 14 , 7857 ( 2023 ). doi: 10.1038/s41467-023-43715-z OpenUrl CrossRef PubMed ↵ Renc , P. et al. Zero shot health trajectory prediction using transformer . npj Digital Medicine 7 , 256 ( 2024 ). doi: 10.1038/s41746-024-01235-0 OpenUrl CrossRef PubMed ↵ Guo , L. L. et al. A multi-center study on the adaptability of a shared foundation model for electronic health records . npj Digital Medicine 7 , 171 ( 2024 ). doi: 10.1038/s41746-024-01166-w OpenUrl CrossRef PubMed ↵ Pang , C. et al. CEHR-XGPT: A Scalable Multi-Task Foundation Model for Electronic Health Records . arXiv preprint arXiv: 2509.03643 ( 2025 ). doi: 10.48550/arXiv.2509.03643 OpenUrl CrossRef ↵ Mataraso , S. J. et al. A machine learning approach to leveraging electronic health records for enhanced omics analysis . Nature Machine Intelligence 7 , 293 – 306 ( 2025 ). doi: 10.1038/s42256-024-00974-9 OpenUrl CrossRef PubMed ↵ Soenksen , L. R. et al. Integrated multimodal artificial intelligence framework for healthcare applications . npj Digital Medicine 5 , 149 ( 2022 ). doi: 10.1038/s41746-022-00689-4 OpenUrl CrossRef PubMed ↵ Kim , J. , Lee , N. , Kim , J. & Kim , K . MedRep: Medical Concept Representation for General Electronic Health Record Foundation Models . arXiv preprint arXiv: 2504.08329 ( 2025 ). doi: 10.48550/arXiv.2504.08329 OpenUrl CrossRef ↵ Johnson , A. E. W. et al. MIMIC-IV, a freely accessible electronic health record dataset . Scientific Data 10 , 1 ( 2023 ). doi: 10.1038/s41597-022-01899-x OpenUrl CrossRef PubMed ↵ McInnes , L. , Healy , J. & Melville , J . Umap: Uniform manifold approximation and projection for dimension reduction . arXiv preprint arXiv: 1802.03426 ( 2018 ). doi: 10.48550/arXiv.1802.03426 OpenUrl CrossRef ↵ Kim , J. et al. Deep learning-based long-term risk evaluation of incident type 2 diabetes using electrocardiogram in a non-diabetic population: a retrospective, multicentre study . eClinicalMedicine 68 ( 2024 ). doi: 10.1016/j.eclinm.2024.102445 OpenUrl CrossRef ↵ Kim , J. et al. Pretrained patient trajectories for adverse drug event prediction using common data model-based electronic health records . Communications Medicine 5 , 232 ( 2025 ). doi: 10.1038/s43856-025-00914-7 OpenUrl CrossRef ↵ Lundberg , S. M. & Lee , S.-I. in Proceedings of the 31st International Conference on Neural Information Processing Systems 4768 – 4777 ( Curran Associates Inc. , Long Beach, California, USA , 2017 ). ↵ Vaswani , A. et al. Attention is all you need . Advances in neural information processing systems 30 ( 2017 ). ↵ Ryan , S . Mechanisms of cardiovascular disease in obstructive sleep apnoea . J Thorac Dis 10 , S4201 – s4211 ( 2018 ). doi: 10.21037/jtd.2018.08.56 OpenUrl CrossRef PubMed ↵ Jean-Louis , G. , Zizi , F. , Clark , L. T. , Brown , C. D. & McFarlane , S. I . Obstructive sleep apnea and cardiovascular disease: role of the metabolic syndrome and its components . J Clin Sleep Med 4 , 261 – 272 ( 2008 ). OpenUrl CrossRef PubMed ↵ Soteriades , E. S. et al. Incidence and Prognosis of Syncope . New England Journal of Medicine 347 , 878 – 885 ( 2002 ). doi: 10.1056/NEJMoa012407 OpenUrl CrossRef PubMed Web of Science ↵ Koene , R. J. , Adkisson , W. O. & Benditt , D. G . Syncope and the risk of sudden cardiac death: Evaluation, management, and prevention . J Arrhythm 33 , 533 – 544 ( 2017 ). doi: 10.1016/j.joa.2017.07.005 OpenUrl CrossRef PubMed ↵ Powell-Wiley , T. M. et al. Obesity and Cardiovascular Disease: A Scientific Statement From the American Heart Association . Circulation 143 , e984 – e1010 ( 2021 ). doi: 10.1161/CIR.0000000000000973 OpenUrl CrossRef PubMed ↵ Ebong , I. A. , Goff , D. C. , Jr. , Rodriguez , C. J. , Chen , H. & Bertoni , A. G . Mechanisms of heart failure in obesity . Obes Res Clin Pract 8 , e540 – 548 ( 2014 ). doi: 10.1016/j.orcp.2013.12.005 OpenUrl CrossRef PubMed ↵ Sin , D. D. & Man , S. F . Chronic obstructive pulmonary disease as a risk factor for cardiovascular morbidity and mortality . Proc Am Thorac Soc 2 , 8 – 11 ( 2005 ). doi: 10.1513/pats.200404-032MS OpenUrl CrossRef PubMed ↵ Razvi , S. , Shakoor , A. , Vanderpump , M. , Weaver , J. U. & Pearce , S. H . The influence of age on the relationship between subclinical hypothyroidism and ischemic heart disease: a metaanalysis . J Clin Endocrinol Metab 93 , 2998 – 3007 ( 2008 ). doi: 10.1210/jc.2008-0167 OpenUrl CrossRef PubMed Web of Science ↵ Macdonald , J. E. & Struthers , A. D . What is the optimal serum potassium level in cardiovascular patients? J Am Coll Cardiol 43 , 155 – 161 ( 2004 ). doi: 10.1016/j.jacc.2003.06.021 OpenUrl FREE Full Text ↵ Klip , I. T. et al. Iron deficiency in chronic heart failure: an international pooled analysis . Am Heart J 165 , 575 – 582 .e573 ( 2013 ). doi: 10.1016/j.ahj.2013.01.017 OpenUrl CrossRef PubMed Web of Science ↵ Dukes , J. W. et al. Ventricular Ectopy as a Predictor of Heart Failure and Death . J Am Coll Cardiol 66 , 101 – 109 ( 2015 ). doi: 10.1016/j.jacc.2015.04.062 OpenUrl FREE Full Text ↵ Baman , T. S. et al. Relationship between burden of premature ventricular complexes and left ventricular function . Heart Rhythm 7 , 865 – 869 ( 2010 ). doi: 10.1016/j.hrthm.2010.03.036 OpenUrl CrossRef PubMed Web of Science ↵ Thygesen , K. et al. Fourth Universal Definition of Myocardial Infarction ( 2018 ). Circulation 138 , e618 – e651 (2018). doi: 10.1161/cir.0000000000000617 OpenUrl CrossRef PubMed ↵ Tsang , T. S. , Barnes , M. E. , Gersh , B. J. , Bailey , K. R. & Seward , J. B . Left atrial volume as a morphophysiologic expression of left ventricular diastolic dysfunction and relation to cardiovascular risk burden . Am J Cardiol 90 , 1284 – 1289 ( 2002 ). doi: 10.1016/s0002-9149(02)02864-3 OpenUrl CrossRef PubMed Web of Science ↵ Levy , D. , Garrison , R. J. , Savage , D. D. , Kannel , W. B. & Castelli , W. P . Prognostic implications of echocardiographically determined left ventricular mass in the Framingham Heart Study . N Engl J Med 322 , 1561 – 1566 ( 1990 ). doi: 10.1056/nejm199005313222203 OpenUrl CrossRef PubMed Web of Science ↵ Tesfaye , S. et al. Diabetic neuropathies: update on definitions, diagnostic criteria, estimation of severity, and treatments . Diabetes Care 33 , 2285 – 2293 ( 2010 ). doi: 10.2337/dc10-1303 OpenUrl Abstract / FREE Full Text ↵ Parshall , M. B. et al. An official American Thoracic Society statement: update on the mechanisms, assessment, and management of dyspnea . Am J Respir Crit Care Med 185 , 435 – 452 ( 2012 ). doi: 10.1164/rccm.201111-2042ST OpenUrl CrossRef PubMed Web of Science ↵ Thadani , U . Nitrate tolerance, rebound, and their clinical relevance in stable angina pectoris, unstable angina, and heart failure . Cardiovasc Drugs Ther 10 , 735 – 742 ( 1997 ). doi: 10.1007/bf00053031 OpenUrl CrossRef PubMed Web of Science ↵ Heidenreich , P. A. et al. 2022 AHA/ACC/HFSA Guideline for the Management of Heart Failure: A Report of the American College of Cardiology/American Heart Association Joint Committee on Clinical Practice Guidelines . Circulation 145 , e895 – e1032 ( 2022 ). doi: 10.1161/cir.0000000000001063 OpenUrl CrossRef PubMed ↵ Lee , H. Y. & Oh , B. H . Fimasartan: A New Angiotensin Receptor Blocker . Drugs 76 , 1015 – 1022 ( 2016 ). doi: 10.1007/s40265-016-0592-1 OpenUrl CrossRef PubMed ↵ Granger , C. B. et al. Effects of candesartan in patients with chronic heart failure and reduced left-ventricular systolic function intolerant to angiotensin-converting-enzyme inhibitors: the CHARM-Alternative trial . Lancet 362 , 772 – 776 ( 2003 ). doi: 10.1016/s0140-6736(03)14284-5 OpenUrl CrossRef PubMed Web of Science ↵ Shepherd , J. et al. Pravastatin in elderly individuals at risk of vascular disease (PROSPER): a randomised controlled trial . Lancet 360 , 1623 – 1630 ( 2002 ). doi: 10.1016/s0140-6736(02)11600-x OpenUrl CrossRef PubMed Web of Science ↵ Yusuf , S. et al. Effects of the angiotensin-receptor blocker telmisartan on cardiovascular events in high-risk patients intolerant to angiotensin-converting enzyme inhibitors: a randomised controlled trial . Lancet 372 , 1174 – 1183 ( 2008 ). doi: 10.1016/s0140-6736(08)61242-8 OpenUrl CrossRef PubMed Web of Science ↵ Stone , G. W. et al. Relationship Between Infarct Size and Outcomes Following Primary PCI: Patient-Level Analysis From 10 Randomized Trials . J Am Coll Cardiol 67 , 1674 – 1683 ( 2016 ). doi: 10.1016/j.jacc.2016.01.069 OpenUrl FREE Full Text ↵ Mangrum , J. M. & DiMarco , J. P . The evaluation and management of bradycardia . N Engl J Med 342 , 703 – 709 ( 2000 ). doi: 10.1056/nejm200003093421006 OpenUrl CrossRef PubMed Web of Science ↵ Böhm , M. et al. Heart rate as a risk factor in chronic heart failure (SHIFT): the association between heart rate and outcomes in a randomised placebo-controlled trial . Lancet 376 , 886 – 894 ( 2010 ). doi: 10.1016/s0140-6736(10)61259-7 OpenUrl CrossRef PubMed Web of Science ↵ Surawicz , B. et al. AHA/ACCF/HRS recommendations for the standardization and interpretation of the electrocardiogram: part III: intraventricular conduction disturbances: a scientific statement from the American Heart Association Electrocardiography and Arrhythmias Committee, Council on Clinical Cardiology; the American College of Cardiology Foundation; and the Heart Rhythm Society: endorsed by the International Society for Computerized Electrocardiology . Circulation 119 , e235 – 240 ( 2009 ). doi: 10.1161/circulationaha.108.191095 OpenUrl FREE Full Text ↵ Fluss , R. , Faraggi , D. & Reiser , B . Estimation of the Youden Index and its associated cutoff point . Biom J 47 , 458 – 472 ( 2005 ). doi: 10.1002/bimj.200410135 OpenUrl CrossRef PubMed Web of Science ↵ Rosenbacke , R. , Melhus , Å. , McKee , M. & Stuckler , D . How Explainable Artificial Intelligence Can Increase or Decrease Clinicians’ Trust in AI Applications in Health Care: Systematic Review . JMIR AI 3 , e53207 ( 2024 ). doi: 10.2196/53207 OpenUrl CrossRef ↵ Hong , Y. & Kahn , C. E. , Jr . . Content analysis of reporting templates and free-text radiology reports . J Digit Imaging 26 , 843 – 849 ( 2013 ). doi: 10.1007/s10278-013-9597-4 OpenUrl CrossRef PubMed ↵ Gow , B. et al. MIMIC-IV-ECHO: Echocardiogram matched subset (version 0.1) . PhysioNet ( 2023 ). doi: 10.13026/ef48-v217 OpenUrl CrossRef ↵ Oseran , A. S. et al. Assessment of Prices for Cardiovascular Tests and Procedures at Top-Ranked US Hospitals . JAMA Intern Med 182 , 996 – 999 ( 2022 ). doi: 10.1001/jamainternmed.2022.2602 OpenUrl CrossRef PubMed ↵ Burke , J. F . Cost and utility in the diagnostic evaluation of stroke . Continuum (Minneap Minn ) 20 , 436 – 440 ( 2014 ). doi: 10.1212/01.Con.0000446112.05291.35 OpenUrl CrossRef PubMed ↵ Tran , T. X. M. , Kim , S. , Cha , C. & Park , B . Temporal Trend in Uptake of the National General Health Checkups and Cancer Screening Program among Korean Women with Breast Cancer . crt 56 , 522 – 530 ( 2023 ). doi: 10.4143/crt.2023.729 OpenUrl CrossRef ↵ Sundararajan , M. , Taly , A. & Yan , Q. in Proceedings of the 34th International Conference on Machine Learning Vol. 70 (eds Precup Doina & Teh Yee Whye ) 3319 –– 3328 ( PMLR, Proceedings of Machine Learning Research , 2017 ). View the discussion thread. Back to top Previous Next Posted November 11, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Multimodal Electronic Health Record Foundation Models with Electrocardiogram for Cardiovascular Disease Prediction Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Multimodal Electronic Health Record Foundation Models with Electrocardiogram for Cardiovascular Disease Prediction Junmo Kim , Young-Kwan Kim , Kwangsoo Kim medRxiv 2025.11.10.25339886; doi: https://doi.org/10.1101/2025.11.10.25339886 Share This Article: Copy Citation Tools Multimodal Electronic Health Record Foundation Models with Electrocardiogram for Cardiovascular Disease Prediction Junmo Kim , Young-Kwan Kim , Kwangsoo Kim medRxiv 2025.11.10.25339886; doi: https://doi.org/10.1101/2025.11.10.25339886 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Cardiovascular Medicine Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (300) Cardiovascular Medicine (4435) Dentistry and Oral Medicine (444) Dermatology (382) Emergency Medicine (608) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1509) Epidemiology (15229) Forensic Medicine (30) Gastroenterology (1124) Genetic and Genomic Medicine (6600) Geriatric Medicine (668) Health Economics (997) Health Informatics (4536) Health Policy (1368) Health Systems and Quality Improvement (1613) Hematology (541) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15916) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (146) Nephrology (667) Neurology (6599) Nursing (346) Nutrition (998) Obstetrics and Gynecology (1144) Occupational and Environmental Health (957) Oncology (3332) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (663) Pediatrics (1693) Pharmacology and Therapeutics (691) Primary Care Research (711) Psychiatry and Clinical Psychology (5447) Public and Global Health (9232) Radiology and Imaging (2198) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (593) Sexual and Reproductive Health (712) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a00c789bdecef047',t:'MTc3OTYyNzQ5OA=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.