Full text
45,662 characters
· extracted from
preprint-html
· click to expand
An unbiased comparison of 14 epigenetic clocks in relation to 10-year onset of 174 disease outcomes in 18,859 individuals | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search An unbiased comparison of 14 epigenetic clocks in relation to 10-year onset of 174 disease outcomes in 18,859 individuals Christos Mavrommatis , View ORCID Profile Daniel W Belsky , Kejun Ying , View ORCID Profile Mahdi Moqri , Archie Campbell , Anne Richmond , Vadim N Gladyshev , Tamir Chandra , Daniel L McCartney , Riccardo E Marioni doi: https://doi.org/10.1101/2025.07.14.25331494 Christos Mavrommatis 1 Centre for Genomic and Experimental Medicine, Institute of Genetics and Cancer, University of Edinburgh , UK 5 Robert and Arlene Kogod Center on Aging, Mayo Clinic , Rochester, MN, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Daniel W Belsky 2 Robert N Butler Columbia Aging Center & Department of Epidemiology , New York, NY, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Daniel W Belsky Kejun Ying 3 Department of Medicine, Brigham and Women’s Hospital, Harvard Medical School , Boston, MA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Mahdi Moqri 3 Department of Medicine, Brigham and Women’s Hospital, Harvard Medical School , Boston, MA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Mahdi Moqri Archie Campbell 1 Centre for Genomic and Experimental Medicine, Institute of Genetics and Cancer, University of Edinburgh , UK 4 Centre for Medical Informatics, Usher Institute, University of Edinburgh , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Anne Richmond 1 Centre for Genomic and Experimental Medicine, Institute of Genetics and Cancer, University of Edinburgh , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Vadim N Gladyshev 3 Department of Medicine, Brigham and Women’s Hospital, Harvard Medical School , Boston, MA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Tamir Chandra 5 Robert and Arlene Kogod Center on Aging, Mayo Clinic , Rochester, MN, USA 6 Department of Biochemistry and Molecular Biology, Mayo Clinic , Rochester, MN, USA 7 Department of Quantitative Health Sciences, Mayo Clinic , Rochester, MN, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Daniel L McCartney 1 Centre for Genomic and Experimental Medicine, Institute of Genetics and Cancer, University of Edinburgh , UK 8 bioXcelerate, Optima Partners , Edinburgh, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Riccardo E Marioni 1 Centre for Genomic and Experimental Medicine, Institute of Genetics and Cancer, University of Edinburgh , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: riccardo.marioni{at}ed.ac.uk Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Epigenetic Clocks have been trained to predict chronological age, healthspan and lifespan. Such clocks are often analysed in relation to disease outcomes – typically using small datasets and a limited number of clocks. Here, we present the first large-scale (n=18,849), unbiased comparison of 14 widely used clocks as predictors of 174 incident disease outcomes and all-cause mortality. Second-generation clocks significantly outperformed first-generation clocks, which have limited applications in disease settings. Of the 176 Bonferroni significant (P<0.05/174) associations, there were 27 diseases (including primary lung cancer and diabetes) where the hazard ratio for the clock exceeded the clock’s association with all-cause mortality. Furthermore, there were 35 instances where adding a clock to a null classification model with traditional risk factors increased the classification accuracy by >1% with an AUC full > 0.80. Second-generation epigenetic clocks show promise for disease risk prediction, particularly in relation to respiratory and liver-based conditions. Main We all age at the same chronological rate; everyone gets a year older every 12 months. But we experience the passage of time differently. Some of us maintain our health into our later years, while others develop chronic disease and disability by midlife. However, defining the biological differences that underlie this heterogeneity is complex. There is no gold standard measurement of biological aging [ 1 ]. However, there are now a number of candidate biomarkers of aging derived from integrating high-dimensional molecular data with machine-learning methods that have accumulated substantial validation evidence [ 2 ]. Among these, the best studied are a family of DNA methylation (DNAm) algorithms known as epigenetic clocks [ 3 ]. The first generation of epigenetic clocks were developed by comparing DNA methylation data between older and younger people to develop algorithms predictive of chronological age (e.g., the Horvath and Hannum clocks [ 4 ], [ 5 ]). A second generation of epigenetic clocks were subsequently developed by modelling differences between individuals in mortality risk and phenotypes that track general health [ 6 ], [ 7 ]. Finally, a third generation were developed by modelling differences between individuals of the same chronological age in their rate of multi-organ system deterioration [ 8 ]. The later generation clocks are therefore trained to predict complex outcomes, compared to chronological age. They often include two-step processes whereby DNAm proxies of health-related biomarkers (e.g., smoking, protein levels) are considered in place of individual DNAm CpG sites that are typically used to derive first-generation clocks. While this incorporation of broader biological information may enhance the utility for clinical outcome prediction, it also complicates interpretability compared to first-generation clocks, which may remain more suitable for investigating the mechanisms underlying cellular ageing. A key question in evaluating the clinical utility of epigenetic clock biomarkers of aging is their capacity to predict the future incidence of aging-related disease. However, while there are now a large number of studies reporting clock associations with different disease outcomes in a range of datasets [ 9 ], [ 10 ] no large-scale systematic comparison of many clocks predicting many diseases has been conducted. Here, we provide an unbiased assessment of 14 leading clocks ( Table 1 ) in relation to 10-year onset of a comprehensive set of 174 disease outcomes within one of the world’s single-largest DNAm datasets, the Generation Scotland cohort (n=18,859) [ 11 ]. There was a minimum of 30 incident cases per disease (median=108, max=1,527 cases for hypertension, see Table S1 ). View this table: View inline View popup Download powerpoint Table 1. Overview of the 14 epigenetic clocks considered as disease risk predictors Cox proportional hazards regression was run for each clock-disease pairing, adjusting for age, sex, body mass index, smoking, alcohol consumption, education, and socioeconomic deprivation ( Table S2 ). Age, estimated cell proportions and relatedness were regressed out of each clock prior to the Cox regression analyses. This covariate setup might directly capture information that is included in the clocks e.g., a DNAm proxy for smoking is included in the construction of GrimAge, a predictor of mortality [ 7 ]. However, these covariates are easy to assess and commonly collected in clinical settings. Thus, in terms of disease prediction, it is valuable to note what added information epigenetic clocks might contribute. A total of 176 Bonferroni significant associations were found for 13 of the clocks across 57 diseases (P < 2.9 x10 −4 ). In addition to the Cox regressions, logistic regression 10-year classification was conducted using the same covariates (null model). The differences in AUC between these models and full models (adding in an epigenetic clock) were then calculated. An R ShinyApp displays the results from both the Cox and logistic regression analyses ( https://shiny.igc.ed.ac.uk/Epigenetic_Clock_and_Disease_Association/ ). Users can visualise findings for specific or multiple clocks and disease outcomes or diseases within a grouping e.g, psychiatric or cardiovascular traits. There were 9 Bonferroni significant disease associations for the first-generation clocks, representing ~5% of all significant findings. Across all 174 diseases that were considered, and using GrimAge v1 as the reference category, the average log hazards ( Figure 1 , Table S3 and S4 ) of the first-generation clocks were around 50% smaller in magnitude (P≤2.9×10 −10 ). Smaller effect sizes were also noted for PhenoAge (P=6.3×10 −3 ) and DNAm telomere length (P0.05) apart from Zhang10 (P=0.042). Download figure Open in new tab Figure 1. Distribution of log hazard ratios for each epigenetic clock across all 174 incident disease outcomes. Clocks are presented in descending order of the median effect size. Median and interquartile range presented within the violins. First generation clocks are highlighted in pink, second generation in green, third generation clocks in purple and telomere length (where log HR effect sizes have been multiplied by −1 for visual display purposes) in turquoise. To help contextualise the magnitude and significance of the clock-disease associations, we first ran survival models for 10-year all-cause mortality (n cases = 842; Table S2 ) – one of the best-established health outcomes to be related to epigenetic age acceleration [ 12 ]. The largest and most significant association was with GrimAge v2 (Hazard Ratio (HR) per SD of age acceleration = 1.54, 95% CI [1.46, 1.62], P = 7.1×10 −62 ). All clocks had significant associations at P<0.05 apart from Horvath’s skin and blood clock, Ying’s AdaptAge and Lin’s age predictor. Using logistic regression, an AUC of 0.851 was obtained for the model with covariates only. This increased by up to 0.014 (1.4%) upon the addition of GrimAge v2 (AUC=0.865) as a covariate. There were 27 unique disease outcomes where the clock-disease hazard ratio was Bonferroni-significant and exceeded the magnitude of the corresponding clock-mortality association ( Table S5 ). A diverse set of diseases were highlighted, however there was a strong focus on respiratory/smoking-related and liver-related outcomes, including primary lung cancer (HR GrimAgev1 per SD = 1.56 [1.42, 1.72], P = 5.3×10 −19 ) and cirrhosis (HR GrimAgev2 = 1.86 [1.57, 2.21], P = 8.9×10 −13 ). Also of note, were associations with diabetes (HR DunedinPACE = 1.44 [1.33, 1.57], P = 9.6×10 −19 ), Crohn’s disease (HR PhenoAge = 1.39 [1.19, 1.64], P = 4.7×10 −5 ) and delirium (HR Zhang10 = 1.44 [1.23, 1.68], P = 6.7×10 −6 ). Logistic regression models were then run for all clock-disease analysis using a null model (covariates only) and a full model where a clock was added as a predictor of interest. After filtering to the 176 clock-disease associations that were Bonferroni significant in the Cox models, there were 35 instances where the AUC from the full model exceeded 0.8 (indicative of being clinically meaningful) and the AUC improvement between the null and full model was greater than 0.01 ( Figure 2 and Table S6 ). Download figure Open in new tab Figure 2. AUC increments for disease – clock associations where the hazard ratio from the Cox regression was Bonferroni significant, the AUC of the full model was >0.8 and the improvement to the AUC upon adding the clock to the null model was >0.01. Null model covariates include: age, sex, education, alcohol, smoking, BMI and deprivation. The full models also included the relevant epigenetic clock. Again, several clocks were linked to respiratory/smoking and alcohol-related disease outcomes, including COPD, primary oesophageal and lung cancer, respiratory failure and cirrhosis. In addition, PhenoAge and DunedinPACE improved classification of Parkinson’s disease and ischaemic stroke, respectively. Hannum’s clock and Horvath’s skin and blood clock improved the classification of primary uterine and pancreatic cancer, respectively. Our findings clearly indicate that second- and third-generation epigenetic clocks should be prioritised for disease association studies. These clocks showed particularly strong links to respiratory and liver-related disease outcomes, including primary lung and oesophageal cancers and cirrhosis. Furthermore, the findings are present after adjusting for key risk factors such as deprivation, self-reported smoking behaviour and alcohol consumption as covariates. The 162 Bonferroni significant second- and third-generation clock disease associations were evenly spread across the clocks, with a maximum of 37 associations from GrimAge v2 i.e., there is no clear “best” clock for pan-disease analyses. The construction of both v1 and v2 of GrimAge includes a DNAm surrogate for smoking, which may help to drive downstream associations with respiratory diseases. Similarly, the inclusion of longitudinal changes in BMI, waist-hip ratio and HbA1c in DunedinPACE may contribute to its predictive utility for diabetes. Our study contains certain limitations. For example, we related DNAm profiling from whole-blood samples against multi-tissue diseases and non-blood tissue specific diseases in a Scottish-based cohort. Our data analysis did not exhaustively adjust for covariates that might track disease risk and multi-morbidity, such as family history of disease, genetic risk scores (polygenic scores), medication usage, social interactions and blood pressure. However, bespoke covariate setups are not feasible when studying such a broad range of disease outcomes. Smoking status and alcohol consumption data were self-reported and may therefore carry biases. Future studies could consider the addition of epigenetic proxies for these measures as covariates. It is also crucial to highlight that epigenetic clocks do not provide insights into the mechanisms of action of diseases. Lastly, despite the longitudinal data utilized in this study to compute incident disease outcomes, serial biosamples were not available. Replication of our findings using longitudinal samples across diverse cohorts is needed. The time from blood draw to disease onset varied in this study. Investigations of specific time windows e.g., in increments of 5 years, could yield different strengths of associations. Future research should also consider the training and testing of disease-specific clocks. For example, we have previously shown that a DNAm predictor for incident Type 2 Diabetes augments models containing traditional risk factors [ 13 ]. Finally, our disease phenotyping approach, whilst consensus-based, might be too broad in some instances e.g., the all-cause dementia phenotype captures both Alzheimer’s disease and vascular dementia, as well as other, less common dementia sub-types. Here, we performed a comprehensive and unbiased comparison of leading epigenetic clocks as putative biomarkers for 174 incident disease outcomes. We identified 176 disease associations across 13 clocks with 57 unique diseases. By anchoring our findings to well-established associations with all-cause mortality, we highlighted multiple novel associations with large effect sizes. We also focus on outcomes where classification gains may lead to clinical impact. These results form a starting point for the targeted selection of epigenetic clocks for consideration in clinical risk prediction models. Methods Generation Scotland Cohort Generation Scotland (GS) is a family-based research study comprised of 24,084 volunteers [ 14 ]. Volunteers joined the cohort between 2006 and 2011 with the majority of recruitment taking place via invitation from the individuals’ general practitioners (GPs). Initially, individuals aged 35-65 years were recruited from across five geographic areas (Glasgow, Aberdeen, Dundee, Ayr and Arran). They were then encouraged to recruit family members living in Scotland to join the study. This resulted in a baseline cohort aged between 17 and 99 years. All individuals were invited to complete questionnaires and to attend a baseline clinic visit for further questionnaires and testing, resulting in a detailed collection of lifestyle, clinical, health, cognitive and sociodemographic data. The majority also agreed to provide biosamples, including blood, from which DNA has been extracted and profiled for genetic and epigenetic data. Most individuals also provided consent for researchers to access their medical records via data linkage to primary and secondary care codes. Ethics and Consent All components of Generation Scotland received ethical approval from the NHS Tayside Committee on Medical Research Ethics (REC Reference Number: 05/S1401/89). All participants provided broad and enduring written informed consent for biomedical research. Generation Scotland has also been granted Research Tissue Bank status by the East of Scotland Research Ethics Service (REC Reference Number: 15/0040/ES), providing generic ethical approval for a wide range of uses within medical research. This study was performed in accordance with the Helsinki declaration. DNA Methylation Profiling Methylation data have been quantified for 18,413 GS volunteers at a total of 752,722 genomic (CpG) sites after quality control via the Illumina EPIC850k array [ 11 ]. Thereafter, epigenetic age and age acceleration estimates were derived via the Biolearn platform. Biolearn is an open-source python library that enables easy and versatile analyses of biomarkers of aging data. It provides tools to easily load data from publicly available sources and contains reference implementations for common aging clocks such as the Horvath clock, DunedinPACE, and many others that can easily be run in only a few lines of code [ 15 ]. Age acceleration for each clock/predictor was calculated as the residual from a linear mixed model where the clock/predictor was regressed on age and estimated cell proportions (derived from the Biolearn platform). To avoid collinearity (as the cell proportions sum to one), basophil proportion was not included as a covariate. A pedigree kinship matrix was included as a random effect to control for the family structure present in the cohort. The regression models were run using the lmekin function from the coxme R package [ 16 ]. Disease Coding Using a list of consensus definitions based on primary and secondary care codes [ 17 ], 308 disease outcomes were derived from the electronic health records data in Generation Scotland from January 1980 to April 2022. Despite having volunteer consent to access primary care data, these were only accessible for ~40% of the cohort due to consent constraints with individual GP surgeries (the data holders). These data were subsequently filtered to only consider the first diagnosis for each disease, which could be made in either a primary or secondary care setting. Those with a diagnosis prior to joining the study were excluded from downstream analyses for that specific disease outcome, in order to ensure investigation of incident as opposed to prevalent disease outcomes. Not all diseases were observed in the cohort. The latest date of linkage with primary and secondary healthy records was April 2022. Filtering to diseases with at least 30 cases over the first 10-years of follow-up resulted in 174 outcomes for the main analyses. A list of the 174 diseases observed and the number of incident events (events occurring after the blood draw) along with mean age at diagnosis are presented in Table S1 . Mortality Records Mortality records were obtained via Community Health Index linkage to the National Records of Scotland. These data formed part of our censoring criteria where individuals either survived and remained unaffected by a disease or died during the follow up period to April 2022. Covariates Demographic, lifestyle and health variables were considered as covariates in the regression models with each clock and disease outcome. These included: age, sex, body mass index (BMI, calculated as weight in kg divided by squared height in metres), smoking pack years (calculated by self-reported packs per day multiplied by number of years as a smoker), alcohol units consumed over the last week, years of education (an ordinal variable with 11 categories: (1) 0 years, (2) 1–4 years, (3) 5–9 years, (4) 10–11 years, (5) 12–13 years, (6) 14–15 years, (7) 16–17 years, (8) 18–19 years, (9) 20–21 years, (10) 22–23 years, (11) 24 or more years), and an area-based rank of socioeconomic deprivation (Scottish Index of Multiple Deprivation, SIMD). SIMD measures relative deprivation across 6,976 data zones, calculated across seven domains: income, employment, education, health, access to services, crime and housing. K-nearest neighbours’ imputation – using k=10 and a maximum missingness per person of 4/7 of variables – was used to generate complete data for covariates. There was complete data on age and sex with a range of missingness for the other variables (SIMD: n = 1,152, BMI: n = 120, Education: n = 1,012, Pack years: n = 395, Alcohol: n = 1,734). Natural log transformations were applied to alcohol and pack years (adding a constant of 1 to all values to account for non-drinkers/smokers) and BMI. All covariates were then standardised to mean zero and unit variance prior to imputation. Association between age acceleration and disease outcomes Cox proportional hazards regression models, adjusting for the aforementioned covariates, were used to relate age acceleration for each epigenetic clock to 10-year onset for the list of 174 incident disease outcomes. The analyses were subset to the most frequently affected by sex where the proportion of male or female cases was >90% for any given disease. A total of 174 models were run for each of the 14 clocks, giving 2,436 models in total. P-value filtering was conducted per individual clock-regression model, resulting in a Bonferroni threshold of P < 0.05/174 = 2.9 × 10 −4 . A further set of analyses were run where time to all-cause mortality was the outcome. The proportional hazards assumption was tested by examining the Schoenfeld residuals. A test of the residuals for both the overall model and the predictor variable of interest (age acceleration) was performed using the cox.zph function in the survival package. A formal comparison of the log Hazard Ratios for the clocks across all 174 disease outcomes was then conducted using a linear mixed effects model. The logHR was the outcome while the clock was the predictor (GrimAge v1 was the reference level) and disease was included as a random effect on the intercept. In addition to the Cox models, logistic regression was used to generate area under the curve (AUC) estimates for 10-year disease classification. Null models contained the aforementioned covariates, while a full model also included an age acceleration measure. Code and Data Availability Fully annotated copies of the analysis scripts are available at: https://github.com/marioni-group/Epigenetic_Clocks_and_Disease_GS . The source data that were analysed during the current study are not publicly available due to them containing information that could compromise participant consent and confidentiality. Data can be obtained from the data owners. Instructions for accessing Generation Scotland data can be found here: https://www.ed.ac.uk/generation-scotland/for-researchers/access ; the ‘GS Access Request Form’ can be downloaded from this site. Completed request forms must be sent to access{at}generationscotland.org to be approved by the Generation Scotland Access Committee. Ethics approval and consent to participate All components of Generation Scotland received ethical approval from the NHS Tayside Committee on Medical Research Ethics (REC Reference Number: 05/S1401/89). GS has also been granted Research Tissue Bank status by the East of Scotland Research Ethics Service (REC Reference Number: 20-ES-0021), providing generic ethical approval for a wide range of uses within medical research. All participants provided written informed consent. The study was performed in accordance with the Helsinki declaration. Competing interests R.E.M is an advisor to the Epigenetic Clock Development Foundation and Optima Partners Ltd. D.L.M. is employed by Optima Partners Ltd. D.W.B is an inventor of DunedinPACE, which is licensed to TruDiagnostic. The remaining authors declare no competing interests. List of Supplementary Tables Table S1 . Descriptive statistics for the 174 disease outcomes Table S2 . Cox regression and logistic regression results for 14 clocks and 174 incident disease outcomes plus all-cause mortality. HR = Hazard Ratio, LCI = lower 95% confidence interval, UCI = upper 95% confidence interval, P = p-value, Schoenfeld local p = p-value for the Shoenfeld residual test for the predictor (clock) of interest, Schoenfeld global p = p-value for the Shoenfeld residual test for all predictors in the model, auc null = area under the curve for the logistic regression model with covariates only, auc full = area under the curve for the logistics regression model with covariates and the clock of interest, auc diff = difference between the auc_null and auc_full Table S3 . Mean and standard deviation of the log hazard ratios for each clock, averaged across all 174 disease associations. Table S4 . Linear mixed effects model output contrasting the mean log hazard ratio for each clock against GrimAge v1 (reference category). Table S5 . Subset of Table S2 showing Bonferroni significant associations where the log hazard ratio is greater for the respective disease-clock association compared to the mortality-clock association. Table S6 . Subset of Table S2 showing Bonferroni significant associations where the AUC of the fully-adjusted model exceeded 0.8 and the difference in AUC with the basic-adjusted model is greater than 0.01 (1%). Acknowledgements This research was funded in whole, or in part, by the Wellcome Trust (104036/Z/14/Z and 221890/Z/20/Z). For the purpose of open access, the author has applied a CC BY public copyright license to any Author Accepted Manuscript version arising from this submission. Generation Scotland received core support from the Chief Scientist Office of the Scottish Government Health Directorates (CZD/16/6) and the Scottish Funding Council (HR03006). DNA methylation profiling of the Generation Scotland samples was carried out by the Genetics Core Laboratory at the Edinburgh Clinical Research Facility, Edinburgh, Scotland, and was funded by the Medical Research Council UK and Wellcome (Wellcome Trust Strategic Award STratifying Resilience and Depression Longitudinally (STRADL; Reference 104036/Z/14/Z). DNA methylation data for Generation Scotland was also funded by a 2018 NARSAD Young Investigator Grant from the Brain & Behavior Research Foundation (Ref: 27404; awardee: Dr David M Howard) and by a John, Margaret, Alfred and Stewart Sim Fellowship from the Royal College of Physicians of Edinburgh (Awardee: Dr Heather C Whalley). D.W.B a fellow of the CIFAR CBD Network and is supported in part by R01AG073402 and R01AG087158. T.C and C.M are funded by the Mayo Clinic Robert and Arlene Kogod Center on Aging. Footnotes ↵ * These authors contributed jointly. References 1. ↵ Ferrucci , L. , Gonzalez-Freire , M. , Fabbri , E. , Simonsick , E. , Tanaka , T. , Moore , Z. , Salimi , S. , Sierra , F. and de Cabo , R. ( 2020 ) ‘ Measuring biological aging in humans: A quest’ , Aging Cell , 19 ( 2 ), p. e13080 . doi: 10.1111/acel.13080 . OpenUrl CrossRef PubMed 2. ↵ Moqri , M. , Herzog , C. , Poganik , J.R. , Biomarkers of Aging Consortium , Justice , J. , Belsky , D.W. , Higgins-Chen , A. , Moskalev , A. , Fuellen , G. , Cohen , A.A. , Bautmans , I. , Widschwendter , M. , Ding , J. , Fleming , A. , Mannick , J. , Han , J.J. , Zhavoronkov , A. , Barzilai , N. , Kaeberlein , M. , Cummings , S. , Kennedy , B.K. , Ferrucci , L. , Horvath , S. , Verdin , E. , Maier , A.B. , Snyder , M.P. , Sebastiano , V. and Gladyshev , V.N. ( 2023 ) ‘ Biomarkers of aging for the identification and evaluation of longevity interventions’ , Cell , 186 ( 18 ), pp. 3758 – 3775 . doi: 10.1016/j.cell.2023.08.003 . OpenUrl CrossRef PubMed 3. ↵ Teschendorff , A.E. and Horvath , S. ( 2025 ) ‘ Epigenetic ageing clocks: statistical methods and emerging computational challenges’ , Nature Reviews Genetics , 26 ( 5 ), pp. 350 – 368 . doi: 10.1038/s41576-024-00807-w . OpenUrl CrossRef PubMed 4. ↵ Hannum , G. , Guinney , J. , Zhao , L. , Zhang , L. , Hughes , G. , Sadda , S. , Klotzle , B. , Bibikova , M. , Fan , J.B. , Gao , Y. , Deconde , R. , Chen , M. , Rajapakse , I. , Friend , S. , Ideker , T. and Zhang , K. ( 2013 ) ‘ Genome-wide methylation profiles reveal quantitative views of human aging rates’ , Molecular Cell , 49 ( 2 ), pp. 359 – 367 . doi: 10.1016/j.molcel.2012.10.016 . OpenUrl CrossRef PubMed Web of Science 5. ↵ Horvath , S. ( 2013 ) ‘ DNA methylation age of human tissues and cell types’ , Genome Biology , 14 ( 10 ), p. R115 . doi: 10.1186/gb-2013-14-10-r115 . OpenUrl CrossRef PubMed 6. ↵ Levine , M.E. , Lu , A.T. , Quach , A. , Chen , B.H. , Assimes , T.L. , Bandinelli , S. , Hou , L. , Baccarelli , A.A. , Stewart , J.D. , Li , Y. , Whitsel , E.A. , Wilson , J.G. , Reiner , A.P. , Aviv , A. , Lohman , K. , Liu , Y. , Ferrucci , L. and Horvath , S. ( 2018 ) ‘ An epigenetic biomarker of aging for lifespan and healthspan’ , Aging , 10 ( 4 ), pp. 573 – 591 . doi: 10.18632/aging.101414 . OpenUrl CrossRef PubMed 7. ↵ Lu , A.T. , Quach , A. , Wilson , J.G. , Reiner , A.P. , Aviv , A. , Raj , K. , Hou , L. , Baccarelli , A.A. , Li , Y. , Stewart , J.D. , Whitsel , E.A. , Assimes , T.L. , Ferrucci , L. and Horvath , S. ( 2019 ) ‘ DNA methylation GrimAge strongly predicts lifespan and healthspan’ , Aging , 11 ( 2 ), pp. 303 – 327 . doi: 10.18632/aging.101684 . OpenUrl CrossRef PubMed 8. ↵ Belsky , D.W. , Caspi , A. , Corcoran , D.L. , Sugden , K. , Poulton , R. , Arseneault , L. , Baccarelli , A. , Chamarti , K. , Gao , X. , Hannon , E. , Harrington , H.L. , Houts , R. , Kothari , M. , Kwon , D. , Mill , J. , Schwartz , J. , Vokonas , P. , Wang , C. , Williams , B.S. and Moffitt , T.E. ( 2022 ) ‘ DunedinPACE, a DNA methylation biomarker of the pace of aging’ , eLife , 11 , p. e73420 . doi: 10.7554/eLife.73420 . OpenUrl CrossRef PubMed 9. ↵ Chervova , O. , Panteleeva , K. , Chernysheva , E. , Widayati , T.A. , Baronik , Ž.F. , Hrbková , N. , Schneider , J.L. , Bobak , M. , Beck , S. and Voloshin , V. ( 2024 ) ‘ Breaking new ground on human health and well-being with epigenetic clocks: A systematic review and meta-analysis of epigenetic age acceleration associations’ , Ageing Research Reviews , 102 , p. 102552 . doi: 10.1016/j.arr.2024.102552 . OpenUrl CrossRef PubMed 10. ↵ Oblak , L. , van der Zaag , J. , Higgins-Chen , A.T. , Levine , M.E. and Boks , M.P. ( 2021 ) ‘ A systematic review of biological, social and environmental factors associated with epigenetic clock acceleration’ , Ageing Research Reviews , 69 , p. 101348 . doi: 10.1016/j.arr.2021.101348 . OpenUrl CrossRef PubMed 11. ↵ Walker , R.M. , McCartney , D.L. , Carr , K. , Barber , M. , Shen , X. , Campbell , A. , Bernabeu , E. , Aitken , E. , Fawkes , A. , Wrobel , N. , Murphy , L. , Whalley , H.C. , Howard , D.M. , Adams , M.J. , Rawlik , K. , Navarro , P. , Tenesa , A. , Sudlow , C.L. , Porteous , D.J. , Marioni , R. , McIntosh , A.M. and Evans , K.L. ( 2024 ) ‘ Data Resource Profile: Whole Blood DNA Methylation Resource in Generation Scotland (MeGS)’ , medRxiv [Preprint] . Available at : doi: 10.1101/2024.04.30.24306314 (Accessed: 7 March 2025 ). OpenUrl Abstract / FREE Full Text 12. ↵ Marioni , R.E. , Shah , S. , McRae , A.F. , Chen , B.H. , Colicino , E. , Harris , S.E. , Gibson , J. , Henders , A.K. , Redmond , P. , Cox , S.R. , Pattie , A. , Corley , J. , Murphy , L. , Martin , N.G. , Montgomery , G.W. , Feinberg , A.P. , Fallin , M.D. , Multhaup , M.L. , Jaffe , A.E. , Joehanes , R. , Schwartz , J. , Just , A.C. , Lunetta , K.L. , Murabito , J.M. , Starr , J.M. , Horvath , S. , Baccarelli , A.A. , Levy , D. , Visscher , P.M. , Wray , N.R. and Deary , I.J. ( 2015 ) ‘ DNA methylation age of blood predicts all-cause mortality in later life’ , Genome Biology , 16 , p. 25 . doi: 10.1186/s13059-015-0584-6 . OpenUrl CrossRef PubMed 13. ↵ Cheng Y , Gadd DA , Gieger C , Monterrubio-Gómez K , Zhang Y , Berta I , Stam MJ , Szlachetka N , Lobzaev E , Wrobel N , Murphy L , Campbell A , Nangle C , Walker RM , Fawns-Ritchie C , Peters A , Rathmann W , Porteous DJ , Evans KL , McIntosh AM , Cannings TI , Waldenberger M , Ganna A , McCartney DL , Vallejos CA , Marioni RE . Development and validation of DNA methylation scores in two European cohorts augment 10-year risk prediction of type 2 diabetes . Nat Aging . 2023 Apr ; 3 ( 4 ): 450 – 458 . doi: 10.1038/s43587-023-00391-4 . Epub 2023 Apr 6. PMID: 37117793 . OpenUrl CrossRef PubMed 14. ↵ Milbourn , H. , McCartney , D. , Richmond , A. , Campbell , A. , Flaig , R. , Robertson , S. , Fawns-Ritchie , C. , Hayward , C. , Marioni , R.E. , McIntosh , A.M. , Porteous , D.J. , Whalley , H.C. and Sudlow , C. ( 2024 ) ‘ Generation Scotland: an update on Scotland’s longitudinal family health study’ , BMJ Open , 14 ( 6 ), p. e084719 . doi: 10.1136/bmjopen-2024-084719 . OpenUrl CrossRef PubMed 15. ↵ Ying , K. , Paulson , S. , Eames , A. , Tyshkovskiy , A. , Li , S. , Perez-Guevara , M. , Emamifar , M. , Martínez , M.C. , Kwon , D. , Kosheleva , A. , Snyder , M.P. , Gobel , D. , Herzog , C. , Poganik , J.R. , Biomarker of Aging Consortium , Moqri , M. and Gladyshev , V.N. ( 2023 ) ‘ A Unified Framework for Systematic Curation and Evaluation of Aging Biomarkers’ , bioRxiv [Preprint] . Available at : doi: 10.1101/2023.12.02.569722 (Accessed: 26 June 2025 ). OpenUrl Abstract / FREE Full Text 16. ↵ Therneau , T.M. ( 2024 ) coxme: Mixed Effects Cox Models. R package version 2 . 2 – 22 . Available at: https://CRAN.R-project.org/package=coxme . 17. ↵ Kuan , V. , Denaxas , S. , Gonzalez-Izquierdo , A. , Direk , K. , Bhatti , O. , Husain , S. , Sutaria , S. , Hingorani , M. , Nitsch , D. , Parisinos , C.A. , Lumbers , R.T. , Mathur , R. , Sofat , R. , Casas , J.P. , Wong , I.C.K. , Hemingway , H. and Hingorani , A.D. ( 2019 ) ‘ A chronological map of 308 physical and mental health conditions from 4 million individuals in the English National Health Service’ , The Lancet Digital Health , 1 ( 2 ), pp. e63 – e77 . doi: 10.1016/S2589-7500(19)30012-3 . OpenUrl CrossRef 18. Lin , Q. , Weidner , C.I. , Costa , I.G. , Marioni , R.E. , Ferreira , M.R. , Deary , I.J. and Wagner , W. ( 2016 ) ‘ DNA methylation levels at individual age-associated CpG sites can be indicative for life expectancy’ , Aging , 8 ( 2 ), pp. 394 – 401 . doi: 10.18632/aging.100908 . OpenUrl CrossRef PubMed 19. Zhang , Y. , Wilson , R. , Heiss , J. , Breitling , L.P. , Saum , K.U. , Schöttker , B. , Holleczek , B. , Waldenberger , M. , Peters , A. and Brenner , H. ( 2017 ) ‘ DNA methylation signatures in peripheral blood strongly predict all-cause mortality’ , Nature Communications , 8 , p. 14617 . doi: 10.1038/ncomms14617 . OpenUrl CrossRef PubMed 20. Horvath , S. , Oshima , J. , Martin , G.M. , Lu , A.T. , Quach , A. , Cohen , H. , Felton , S. , Matsuyama , M. , Lowe , D. , Kabacik , S. , Wilson , J.G. , Reiner , A.P. , Maierhofer , A. , Flunkert , J. , Aviv , A. , Hou , L. , Baccarelli , A.A. , Li , Y. , Stewart , J.D. , Whitsel , E.A. , Ferrucci , L. , Matsuyama , S. and Raj , K. ( 2018 ) ‘ Epigenetic clock for skin and blood cells applied to Hutchinson Gilford Progeria Syndrome and ex vivo studies’ , Aging , 10 ( 7 ), pp. 1758 – 1775 . doi: 10.18632/aging.101508 . OpenUrl CrossRef PubMed 21. Lu , A.T. , Seeboth , A. , Tsai , P.C. , Sun , D. , Quach , A. , Reiner , A.P. , Kooperberg , C. , Ferrucci , L. , Hou , L. , Baccarelli , A.A. , Li , Y. , Harris , S.E. , Corley , J. , Taylor , A. , Deary , I.J. , Stewart , J.D. , Whitsel , E.A. , Assimes , T.L. , Chen , W. , Li , S. , Mangino , M. , Bell , J.T. , Wilson , J.G. , Aviv , A. , Marioni , R.E. , Raj , K. and Horvath , S. ( 2019 ) ‘ DNA methylation-based estimator of telomere length’ , Aging , 11 ( 16 ), pp. 5895 – 5923 . doi: 10.18632/aging.102173 . OpenUrl CrossRef PubMed 22. Belsky , D.W. , Caspi , A. , Arseneault , L. , Baccarelli , A. , Corcoran , D.L. , Gao , X. , Hannon , E. , Harrington , H.L. , Rasmussen , L.J.H. , Houts , R. , Huffman , K. , Kraus , W.E. , Kwon , D. , Mill , J. , Pieper , C.F. , Prinz , J.A. , Poulton , R. , Schwartz , J. , Sugden , K. , Vokonas , P. , Williams , B.S. and Moffitt , T.E. ( 2020 ) ‘ Quantification of the pace of biological aging in humans through a blood test, the DunedinPoAm DNA methylation algorithm’ , eLife , 9 , p. e54870 . doi: 10.7554/eLife.54870 . OpenUrl CrossRef PubMed 23. Lu , A.T. , Binder , A.M. , Zhang , J. , Yan , Q. , Reiner , A.P. , Cox , S.R. , Corley , J. , Harris , S.E. , Kuo , P.L. , Moore , A.Z. , Bandinelli , S. , Stewart , J.D. , Wang , C. , Hamlat , E.J. , Epel , E.S. , Schwartz , J.D. , Whitsel , E.A. , Correa , A. , Ferrucci , L. , Marioni , R.E. and Horvath , S. ( 2022 ) ‘ DNA methylation GrimAge version 2’ , Aging , 14 ( 23 ), pp. 9484 – 9549 . doi: 10.18632/aging.204434 . OpenUrl CrossRef PubMed 24. Ying , K. , Liu , H. , Tarkhov , A.E. , Sadler , M.C. , Lu , A.T. , Moqri , M. , Horvath , S. , Kutalik , Z. , Shen , X. and Gladyshev , V.N. ( 2024 ) ‘ Causality-enriched epigenetic age uncouples damage and adaptation’ , Nature Aging , 4 ( 2 ), pp. 231 – 246 . doi: 10.1038/s43587-023-00557-0 . OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted July 15, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following An unbiased comparison of 14 epigenetic clocks in relation to 10-year onset of 174 disease outcomes in 18,859 individuals Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share An unbiased comparison of 14 epigenetic clocks in relation to 10-year onset of 174 disease outcomes in 18,859 individuals Christos Mavrommatis , Daniel W Belsky , Kejun Ying , Mahdi Moqri , Archie Campbell , Anne Richmond , Vadim N Gladyshev , Tamir Chandra , Daniel L McCartney , Riccardo E Marioni medRxiv 2025.07.14.25331494; doi: https://doi.org/10.1101/2025.07.14.25331494 Share This Article: Copy Citation Tools An unbiased comparison of 14 epigenetic clocks in relation to 10-year onset of 174 disease outcomes in 18,859 individuals Christos Mavrommatis , Daniel W Belsky , Kejun Ying , Mahdi Moqri , Archie Campbell , Anne Richmond , Vadim N Gladyshev , Tamir Chandra , Daniel L McCartney , Riccardo E Marioni medRxiv 2025.07.14.25331494; doi: https://doi.org/10.1101/2025.07.14.25331494 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Epidemiology Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (297) Cardiovascular Medicine (4421) Dentistry and Oral Medicine (443) Dermatology (382) Emergency Medicine (606) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15212) Forensic Medicine (30) Gastroenterology (1121) Genetic and Genomic Medicine (6581) Geriatric Medicine (667) Health Economics (996) Health Informatics (4520) Health Policy (1366) Health Systems and Quality Improvement (1611) Hematology (539) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15906) Intensive Care and Critical Care Medicine (1103) Medical Education (620) Medical Ethics (144) Nephrology (667) Neurology (6580) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1141) Occupational and Environmental Health (956) Oncology (3324) Ophthalmology (970) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1689) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5432) Public and Global Health (9212) Radiology and Imaging (2193) Rehabilitation Medicine and Physical Therapy (1368) Respiratory Medicine (1194) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (288) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9ff3965ba868ad07',t:'MTc3OTM2NjU3Mw=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.