LDSC++: Improving linkage disequilibrium score regression estimation of heritability and genetic correlation for multivariate GWAS analysis

doi:10.1101/2025.04.07.25324946

LDSC++: Improving linkage disequilibrium score regression estimation of heritability and genetic correlation for multivariate GWAS analysis

2025 · doi:10.1101/2025.04.07.25324946

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 51,056 characters · extracted from preprint-html · click to expand

LDSC++: Improving linkage disequilibrium score regression estimation of heritability and genetic correlation for multivariate GWAS analysis | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var 
i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search LDSC++: Improving linkage disequilibrium score regression estimation of heritability and genetic correlation for multivariate GWAS analysis View ORCID Profile Johan Zvrskovec , View ORCID Profile Alexandra Gillett , Michel Nivard , View ORCID Profile Jonathan R I Coleman , View ORCID Profile Christopher Hübel , Raquel Iniesta , View ORCID Profile Gerome Breen doi: https://doi.org/10.1101/2025.04.07.25324946 Johan Zvrskovec 1 Institute of Psychiatry, Psychology and Neuroscience, King’s 
College London , Denmark Hill, Camberwell, London, UK 2 National Institute for Health and Care Research (NIHR) Maudsley Biomedical Research Centre, South London and Maudsley NHS Foundation Trust , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Johan Zvrskovec For correspondence: johan.zvrskovec{at}gmail.com Alexandra Gillett 1 Institute of Psychiatry, Psychology and Neuroscience, King’s College London , Denmark Hill, Camberwell, London, UK 2 National Institute for Health and Care Research (NIHR) Maudsley Biomedical Research Centre, South London and Maudsley NHS Foundation Trust , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Alexandra Gillett Michel Nivard 5 Medical Research Council Integrative Epidemiology Unit, University of Bristol, Bristol, UK 6 Population Health Sciences, University of Bristol , Bristol, UK 7 Dept of biological psychology, Vrije Universiteit Amsterdam , the Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jonathan R I Coleman 1 Institute of Psychiatry, Psychology and Neuroscience, King’s College London , Denmark Hill, Camberwell, London, UK 2 National Institute for Health and Care Research (NIHR) Maudsley Biomedical Research Centre, South London and Maudsley NHS Foundation Trust , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jonathan R I Coleman Christopher Hübel 1 Institute of Psychiatry, Psychology and Neuroscience, King’s College London , Denmark Hill, Camberwell, London, UK 3 Clinic for Child and Adolescent Psychiatry, Psychotherapy and Psychosomatics, German Red Cross Hospitals Berlin Westend , Berlin, Germany 4 National Centre for Register-based Research, Aarhus University , Aarhus, Denmark 1 Institute of Psychiatry, Psychology and 
Neuroscience, King’s College London , Denmark Hill, Camberwell, London, UK 2 National Institute for Health and Care Research (NIHR) Maudsley Biomedical Research Centre, South London and Maudsley NHS Foundation Trust , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Christopher Hübel Raquel Iniesta 1 Institute of Psychiatry, Psychology and Neuroscience, King’s College London , Denmark Hill, Camberwell, London, UK 2 National Institute for Health and Care Research (NIHR) Maudsley Biomedical Research Centre, South London and Maudsley NHS Foundation Trust , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Gerome Breen 1 Institute of Psychiatry, Psychology and Neuroscience, King’s College London , Denmark Hill, Camberwell, London, UK 2 National Institute for Health and Care Research (NIHR) Maudsley Biomedical Research Centre, South London and Maudsley NHS Foundation Trust , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Gerome Breen Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Introduction Linkage disequilibrium (LD) score regression is widely used for estimating common variant heritability and genetic correlations from genome-wide association study (GWAS) summary statistics. We hypothesise that segmented regression (also known as piecewise regression) improves on previous LD score regression implementations, when estimating both genetic covariance and its standard error. Methods We present novel extensions to LD score regression (LDSC++) improving I.) handling of varying numbers of shared genetic variants across trait pairs and reference panels, II.) estimation of genetic covariance and its variance, and III.) handling of imputation quality. 
We propose supporting statistical tests that use our novel extensions to improve sensitivity, and are further aimed at comparing parameter estimates that are highly correlated, such as those obtained from the same trait but from different methods. We validate LDSC++ first on real-world individual level data from the Genetic Links to Anxiety and Depression study and the United Kingdom National Institute of Health and Social Care Research BioResource (N: 14,190 - 20,144), second on simulated data with different degrees of shared QTL, and third on a battery of publicly available GWASs of ten diverse traits of varying statistical power and heritability. Results Using variance-component method (GCTA-GREML) estimates for reference, LDSC++ extensions were found to yield heritability estimates with a bias of about -10% to -20% while standard LD score regression yielded a bias of -30%, and heritability variability estimates with a bias of -1% to -7% while standard LD score regression yielded a bias of 8%. For ten external trait GWASs, LDSC++ was shown to recover 5% to 8% larger heritabilities with 4% smaller variability on average compared to standard LD score regression. Weighting by imputation quality in the model, rather than excluding genetic variants of low imputation quality, contributed to retaining information. Our supporting statistical tests enabled us to detect statistically significant differences in genetic covariance and its standard error while considering the varying number of shared genetic variants across bivariate trait pairs. Conclusion LDSC++ was confirmed to produce less biassed estimates of genetic covariance and its variability in our GLAD+ sample compared to standard LD score regression, using GCTA-REML as reference. This performance was supported by results from external trait GWASs of varying character, also implying an important performance of our extended weighting schemes. 
Our proposed extensions to LD score regression, among which genome-wide parameters are constructed as aggregates of heterogeneous local parameters, may prove important for large-scale multivariate studies such as genomic structural equation models or local genetic covariance analyses. 1 INTRODUCTION Genome-wide association study (GWAS) summary statistics are readily available to researchers worldwide compared to individual level genotyped or sequenced data, which typically require considerable cost and time to access due to data sharing restrictions 1 , 2 . This prevents the use of optimal methods that use individual level genotype data to estimate components of variance, such as GCTA-GREML 3 , 4 , BOLT-REML 5 , 6 and REML in LDAK 7 . Popular alternatives 8 are Linkage Disequilibrium (LD) score regression 9 (LDSR) and SumHer 10 , which instead use GWAS summary statistics and an LD reference panel to obtain common genetic variant covariance (covG) and heritability (h 2 ), which are standardised to estimate genetic correlations 11 (r g ). LDSR was later re-implemented for calculation of large-scale bivariate trait pair analyses to obtain covG matrices and variance estimates of the elements of these for genomic structural equation modelling in Genomic SEM 12 . However, available implementations of LDSR do not: 1.) explicitly account for varying numbers of genetic variants between association statistics from contributing GWASs, 2.) consider local association and LD patterns in GWASs, or 3.) adjust for imputation quality differences. In bivariate LDSR, genetic variant overlap between two traits and the LD score panel is usually drastically smaller compared to the regressions performed on single traits (supplementary tab. S6), due to differing patterns of missingness across datasets. This limits the power to carry out many downstream multivariate GWAS analyses, such as in Genomic SEM 12 , and related methods such as mtCOJO 13 , 4 , MTAG 14 , and METAL 15 . 
These methods rely on the covG estimates from LDSR, and/or use the LDSR intercept to adjust associations (genomic control) for spurious associations due to confounding from population stratification or sample overlap. In comparison, the variance-component REML method in LDAK 7 is both assuming a variable contribution to heritability across the genome and includes an information score weighting 16 to differentially treat variants of varying genotyping or imputation quality. It may be of interest to bring this functionality over to an LDSR setting to be applicable to summary level data rather than individual level data. Standard LDSR further assumes there to exist a heteroskedastic relationship between genome-wide covG and its standard error, mainly due to the expected larger variability of variants in high LD regions. Despite a weighting correction to account for genome-wide covG heteroskedasticity, it also served as justification 9 for employing resampling to estimate standard errors that are robust to bias from heteroskedasticity. It may therefore be of interest to investigate whether this assumption can be relaxed when estimating covG standard errors, to allow for sampling across the genome. Here we present an enhanced version of LDSR, LDSC++, extended to improve on 1.) the handling of varying numbers of shared genetic variants across trait pairs and reference panels, 2.) the estimation of genetic covariance and its standard error, and 3.) the handling of imputation quality of imputed genotypes or genetic associations. Finally, through our extensions we aim to allow for tractable statistical tests of covG, its standard error, or differences between them, also accounting for high correlations between compared variables. 
We validate the performance of our extensions to LDSR, first using simulations, second on real-world data in the form of GWASs performed on selected measurements in the Genetic Links to Anxiety and Depression study and the United Kingdom National Institute of Health and Social Care Research BioResource, and third on a selection of ten GWAS summary statistics representing a wide variety of traits. We hypothesise the accuracy of estimating both covG and its standard error may be improved and the average measured variability of covG estimates across a sample of multiple diverse traits will be reduced when applying our extensions in LDSC++ individually or in combination, as compared to standard LDSR. 2 MATERIALS AND METHODS To enable more precise covG estimation from GWAS summary statistics, we extend the LDSR method based on the multivariate implementation included in Genomic SEM. We have named this extension LDSC++ (supplementary info. 1.8). The extensions to LDSR are: ❖ Extension 1 - Variable block-count: Allowing the number of blocks to vary when estimating covG and covG standard error, in contrast to a fixed number of blocks. ❖ Extension 2 - Extended block definitions to allow for variable block-count: Block definitions to be used while allowing the number of blocks to vary with Extension 1. These are based on either a set number of variants or a recombination distance in cM. ❖ Extension 3 - Variable block-count sampling: A novel approach to sample across genome blocks to estimate genome-wide covG and covG variance, rather than performing block jackknife resampling. ❖ Extension 4 - Extended weighting scheme for imputation quality: An addition to the standard LDSR weighting scheme to also control for imputation quality. 
❖ Extension 5 - Adjusted weighting scheme to correct for the correlation between LD score and association statistic: We adjusted the standard weighting scheme in LDSR to correct for correlation between the regression variables, to allow for LD scores smaller than one while preventing influences by extreme LD score values (close to zero) due to noise. LDSC++ alongside standard LDSR (emulated in our LDSC++ code) were validated in both real-world data and simulated traits, using REML covG estimates for reference. An individual level sample from cohorts part of the National Institute of Health Research (NIHR) BioResource was used for assessing genetic associations with phenotypes and for simulation. This selection included participants of European ancestry from the Genetic Links to Anxiety and Depression study (GLAD) 17 , the United Kingdom Eating Disorders Genetics Initiative (EDGI) 18 , 19 , the NIHR BioResource Inflammatory Bowel Disease BioResource panel and the NIHR BioResource General Population panel, which together form a collection of cohorts colloquially referred to as GLAD+ (N=36,746). We selected the traits height, weight, neuroticism measured by the Eysenck Personality Questionnaire-Revised Short form (EPQR-S) 20 , and negative affect measured by the PID-5 Brief Form 21 , 22 , in the GLAD+ cohort. Additionally, we simulated two phenotypes (further referred to as SIM1 and SIM2 respectively) created to have 20% heritability and a genetic correlation of 0.4 with each other, in four pairs with fractions of 100%, 75%, 50%, and 25% shared quantitative trait loci (QTL) respectively. A simulation was performed in GCTA 4 for each phenotype and fraction combination, using 30,000 QTL and GLAD+ as an individual level sample. We used GCTA-GREML 3 implemented in GCTA 4 to estimate variance component covG for our individual level GLAD+ samples. Association tests were performed in GCTA fastGWA 23 . 
The covariates included in the association analysis were: genotyping array type/version, tissue source, genotyping batch, and the first seven principal component scores of participant genotypes as computed by the genetic principal component eigenvalues of the 1000 Genome Project 24 Phase 3 (1kG3) reference panel projected on the genetic variants of GLAD+. Additionally, ten external GWAS summary statistics covering a range of traits of various statistical power, h 2 , and genome coverage in terms of the number of variants included were selected for validating methods ( Tab. 1 ). All summary statistics were documented to be based on samples with predominantly European ancestry. View this table: View inline View popup Download powerpoint Table 1. Selected external GWAS summary statistics A selection of ten diverse publicly available GWAS summary statistics. The table describes the dataset reference, the number of cases or total number of participants, and for binary traits; the number of controls, the sample prevalence estimate, and the population prevalence estimate used throughout the study. ‘INFO range’ describes the range of the provided imputation quality information score. To match GCTA-GREML, we used GCTA 4 , 25 to generate the GLAD+ LD scores, using a window of 1 Mb and a prior filter on minor allele frequency (MAF) > 0.01. For our external GWAS summary statistics, we instead created LD scores based on the European ancestry subset of the 1kG3 26 , not including Finnish ancestry. For this second LD score library, we used a 1 cM window and 250 blocks setting in LDSC 9 , 27 . GWAS summary statistics were first harmonised using our Supermunge routine part of the shru 28 package for the R language [ https://github.com/tnggroup/tng_fork_shru_jz2024 ], based on the original LDSC munge routine 9 , the Genomic SEM routines for munging and preparation for latent factor GWAS 12 , and the MungeSumstats routine 29 (supplementary info. 1.4.4). 
To account for heteroskedastic relationships for comparisons of covG inferential uncertainty (sampling variance and thus standard errors) across traits of varying heritabilities, we applied the coefficient of variation (CV) of covG rather than comparing direct estimates (supplementary info. 1.5.1). We formulated simple parametric statistical tests specifically accounting for the novel varying number of blocks in the LDSR sampling and resampling methods and non-independent variables (supplementary info. 1.10), supported by paired samples Wilcoxon signed-rank tests 30 (supplementary info. 1.10.5). Test results were corrected for multiple comparisons using the Benjamini & Hochberg 31 method (q-values, also called false discovery rate; FDR), additionally and unconventionally taking the effective number of comparisons from correlated variables 32 – 34 into account (supplementary info. 1.10.6). 3 RESULTS We estimated REML h 2 and r g of our four selected GLAD+ traits and their bivariate combinations. The REML h 2 of the simulated traits SIM1 and SIM2 were estimated in the range from 13% to 15%, and the REML r g between traits in a pair to 0.43, 0.24, 0.19, and 0.2 for the QTL sharing fractions 100%, 75%, 50%, and 25% respectively. Deviations of LDSR method results from GCTA-REML estimates were obtained, run on both the selected GLAD+ traits ( Tab. 2 , supplementary tab. S7A, S7B) and the simulated traits (supplementary tab. S8A, S8B). Most deviations between covG and covG variance estimates by our LDSR method extensions compared to standard LDSR were seen to be statistically significant, supporting our extensions to yield empirically distinct results. As results were quite different comparing results from diagonal and off-diagonal elements of covG matrices, we decided to stratify them accordingly. View this table: View inline View popup Download powerpoint Table 2. 
LDSR estimate deviation from a REML ideal measured over four GLAD+ traits The table shows deviations of LD score regression (LDSR) method estimates of genetic covariance (covG) and covG SE (converted to coefficient of variation, CV) from the chosen ideal; estimates from GCTA-GREML using individual level data. We used the LDSC++ implementation of LDSR applied to our selection of four real-world traits from the GLAD+ sample: height, weight, neuroticism measured by the Eysenck Personality Questionnaire-Revised Short form (EPQR-S), and negative affect measured by the PID-5 Brief Form. Deviation was measured as average relative difference (Avg. Δ) and root-mean-square error (RMSE). LDSR method combinations were defined by their configuration in regard to block definition, (re)sampling method, alternative correlation correction weighting, and imputation quality weighting. Estimates are stratified in diagonal (heritability) and off-diagonal (bivariate genetic covariance) estimates from a genetic covariance matrix. Only significant covG values (q<0.05) were considered. Only considering h 2 estimates (diagonal elements in the covG or covG SE matrix), the top performing LDSR method combination was variable block-count sampling using the recombination distance block-definition, which yielded average relative h 2 differences as small as -11% and average relative h 2 CV differences of -1% compared to GCTA-GREML in GLAD+. The same pattern was seen for the simulated traits only using the 100% QTL sharing fraction, while for lesser sharing fractions the performance among methods was mixed with the standard LDSR block jackknife or LDSC++ variable block-count sampling with recombination distance blocks yielding, on average, the most accurate and least biassed estimates. In the GLAD+ data, all LDSR methods under-estimated diagonal covG with about -30% for block jackknife resampling and -10% to -20% for variable block-count sampling. 
Block jackknife resampling was also consistently seen to over-estimate diagonal variability estimates from 5% to 9%, while variable block-count sampling seemed to under-estimate diagonal variability estimates with about -1% to -7%. Our weighting extensions were seen to have only tiny effects on the differences (in the preferred direction) for the GLAD+ traits, primarily detectable for h 2 estimates and when using block jackknife resampling and imputation quality weighting. Off-diagonal deviations were markedly larger by about a factor of two to four for average relative covG estimates and a factor of ten to sixty for average relative covG CV estimates, compared to the corresponding diagonal matrix element results for the GLAD+ traits. A similar but attenuated pattern was seen for the simulated traits. As for the diagonal elements, the LDSR methods under-estimated off-diagonal covG estimates with about -60% for block jackknife resampling and -40% to -50% for variable block-count sampling in the GLAD+ traits. Off-diagonal covG CVs were consistently and grossly over-estimated by all LDSR methods. For block jackknife resampling, the recombination distance block definition brought the off-diagonal covG CV difference to about 100% compared to 120% when using number-of-variants defined blocks. Variable block-count sampling produced off-diagonal covG CV estimates with deviations from about 60% with the recombination distance block definition to 80% with the number-of-variants block definition. We applied the different LDSR method combinations in our selection of ten external trait GWASs ( Tab. 1 ) for which samples we did not have individual level data (supplementary tab. S9A, S9B). Default block-size settings resulted in block-counts in the range of 249 - 405 for the number-of-variants block definition and 338 - 364 for the recombination distance block definition, without INFO filter. 
Estimates from method combinations using our extensions were first assessed independently in reference to suitable baselines (supplementary tab. S9A). Compared to standard LDSR, applying our block definitions and sampling extensions yielded 4% to 8% larger h 2 estimates, 3% smaller h 2 CV estimates using number-of-variants blocks, but 7% larger h 2 CV estimates using recombination distance blocks. The weighting extensions made a relatively small contribution to average differences in estimates compared to the block and sampling extensions, but specific traits showed statistically significant results. Applying imputation score weighting resulted in an approximate gain of 4% to 5% (q<0.05) in BIPD h 2 and a 1% to 7% (q<0.02) reduction in BIPD bivariate covG CV with specific traits across block and sampling methods. Similarly, applying alternative correlation correction weighting yielded an approximate gain of 3% to 4% (q<0.05) in BMI h 2 and multiple significant bivariate BMI covG CV reductions in the range of 1% to 10% (q<0.05). Applying all extensions in concert and comparing to standard LDSR yielded 5% to 8% larger h 2 estimates, 4% smaller h 2 CV estimates using number-of-variants blocks, but 6% larger h 2 CV estimates using recombination distance blocks. 4 DISCUSSION We have adapted the LDSR routine from Genomic SEM into a modified implementation called LDSC++, which performs LDSR with extensions specifically aimed at improving covG estimation in large-scale multivariate analyses with varying genomic overlaps among trait GWAS datasets and reference panels. For this purpose, we created a variable block-count sampling routine in LDSC++ aimed to be applied with a variable number of blocks to discriminate between situations with a varying number of participating genetic variants, which further makes it possible to use this information in statistical tests. 
Variable block-count sampling performs segmented (also called piecewise) regression using one of our two block definitions, which putatively makes the aggregate genome-wide parameter estimates (averages of segmented regression parameters) robust to heteroskedasticity and outliers. The most obvious and important assumption for both the variable block-count sampling method and the statistical tests is that the estimated genome-wide covG can be assumed to have the same variance across the genome, or rather can be estimated as an aggregate of piecewise estimates. While resampling techniques 49 , 50 traditionally have been used to obtain robust covG standard errors in LDSR, a sufficiently better model from the segmented regression is in our project theorised to make robust standard errors superfluous 51 . LDSC++ further takes advantage of imputation quality information to weight the LDSR, instead of relying on filters which otherwise reduce the overall information content in the analysis. Variable block-count sampling may be interpreted as applying a slightly different h 2 model, allowing for a different contribution to h 2 across the genome similar to the LDAK h 2 model 7 , 16 , 52 , in contrast to the standard LDSR heritability model 9 , 16 , 52 . We additionally proposed statistical tests in which the varying number of blocks from our extensions can be applied to translate statistical power from a large number of genetic variants in a GWAS into statistical power for LDSR covG and covG variance, and thus making these tests more sensitive and differentiating in collections of bivariate trait pairs proportional to the variability in genetic variant overlap. 
Our LDSR extensions were shown to yield more accurate results as validated by GCTA-GREML than standard LDSR settings, both when using each extension independently and when applied in concert, yielding average relative deviations from about -10% to -20% for h 2 and -1% to -6% for h 2 CV compared to the corresponding deviations of -30% and 8% respectively for standard LDSR. This performance was seen in estimates made in the individual level GLAD+ sample and replicated to a lesser extent in simulated data using GCTA-GREML. The performance increase when using the combined extensions could be attributed to allowing the number of blocks to vary and using our new block definitions or using our variable block-count sampling, and only a small fraction could be attributed to the weighting extensions in this setting. Applying our extensions to a set of ten trait GWASs external to our individual level sample, supported the above validations through convergent results primarily for h 2 estimates rather than off-diagonal covG estimates and when using number-of-variants block definitions. In this diverse selection of GWASs of varying power and coverage our combined LDSC++ extensions yielded on average up to 8% larger and 4% less variable h 2 estimates compared to standard LDSR. Larger h 2 estimates were convergent with the previous individual level data validations, but only the number-of-variants block definition was seen to produce smaller average h 2 CV estimates compared to standard LDSR, while using the recombination distance block definition instead yielded larger average h 2 CV estimates - contrary to the previous validation results. This may indicate a sensitivity of the recombination distance block definition to missingness patterns or other factors that were not represented by our four GLAD+ trait GWASs. 
The external GWASs also allowed us to explore other imputation score ranges and highly polygenic trait GWASs of high power, which indicated putatively improved estimates when applying the imputation score weighting to the BIPD GWAS and when applying the alternate correlation correction weighting to the BMI GWAS. Our proposed explanation for these results is that the BIPD GWAS has a wide distribution of imputation quality INFO scores in contrast to other included datasets which the corresponding weighting extension would be able to leverage, and the BMI GWAS is relatively well-powered and represents a highly polygenic trait for which the alternative correlation correction weighting may be able to correct bias due to tiny LD scores to a higher degree. The major strength in our simulations came from using a relatively large sample size of 36,746 individuals from the GLAD+ cohort, in contrast to the Bulik-Sullivan study which simulated associations based on a sample of 2,062 individuals. We additionally simulated whole genome associations, where the Bulik-Sullivan study only simulated chromosome 2. Unfortunately, we did not manage to perform sufficiently many repetitions in our simulations for them to appear trustworthy, with an effective number of GCTA simulations of 2.5 for any randomly sampled QTL compared to 100 repetitions done in a previous study by Bulik-Sullivan 53 . Our effort to investigate the influence of effect QTL overlap on REML and LDSR estimates was interesting, but proved practically challenging enough to be one of the reasons why we did not manage to repeat the simulations to a higher degree. The discrepancy between validation results from diagonal and off-diagonal covG elements was identified as a cause for concern about the LDSR method in general. Because of this we were inclined to trust off-diagonal validation results less. 
Off-diagonal covG estimates from bivariate LDSR are, however, the foundation for genetic correlation analyses, and also provide the majority of, and arguably the more important, information for analyses performed on covG such as Genomic SEM, underscoring the importance of accurate off-diagonal covG estimation and the need to critically investigate bivariate LDSR further. Our results provide support for the accuracy of statistical models where genome-wide $h^2$ and covG parameters are constructed as aggregates of heterogeneous local parameters. The recombination distance block definition was part of the method combination displaying the strongest performance in our individual-level real-world and simulated GCTA-GREML validations. In the external GWASs, the recombination distance block definition also recovered some of the largest covG estimates on average compared to the number-of-variants block definition and standard LDSR. We would suggest that these properties are promising and may prompt further research into block definitions for LDSR that are consistent across traits and bivariate trait pairs, in the way our recombination distance definition was made or in the way local genetic correlation methods such as LAVA 54 define consistent genomic blocks. The arbitrary definition of blocks is a general limitation of LDSR. Creating more optimised block definitions is indeed an active research area 55 , 56 . Reconciling the recombination-based block definition approach with the utility of the number-of-variants block definition may be important to advance LDSR and similar methods further. 5 CONFLICT OF INTEREST Prof Breen has received honoraria, research or conference grants and consulting fees from Illumina, Otsuka, and COMPASS Pathfinder Ltd. 7 DATA AVAILABILITY All data produced in the present study are available upon reasonable request to the authors. 
While some data is contained in the manuscript, an attempt has been made to additionally present results in table format in the accompanying supplementary tables. GWAS summary statistics of our traits used for validation are available upon reasonable request. LD scores based on the GLAD+ sample are available upon reasonable request. The analysis code will be made available at https://github.com/tnggroup/jz-phd-c2c3-2024 . The software package ‘shru’ will be made available on https://github.com/johanzvrskovec/shru . 8 ETHICS APPROVAL STATEMENT The London—Fulham Research Ethics Committee approved the GLAD Study on 21st August 2018 (REC reference: 18/LO/1218). The London—Fulham Research Ethics Committee approved the EDGI UK Study on 29th July 2019 (REC reference: 19/LO/1254). The East of England— Cambridge Central Committee approved the NIHR BioResource as a Research Tissue Bank (REC reference: 17/EE/0025). The South West—Central Bristol Research Ethics Committee approved the COVID-19 Psychiatry and Neurological Genetics study on 27th April 2020 (REC reference: 20/SW/0078). 6 ACKNOWLEDGEMENTS This study/research is funded by the National Institute for Health and Care Research (NIHR) Maudsley Biomedical Research Centre (BRC). The views expressed are those of the author(s) and not necessarily those of the NIHR or the Department of Health and Social Care. Christopher Hübel acknowledges funding by Lundbeckfonden (R276-2018-4581). Alexandra Gillett is supported by the Medical Research Council (MR/X009815/1). The authors acknowledge use of the research computing facility at King’s College London, King’s Computational Research, Engineering and Technology Environment (CREATE) ( https://doi.org/10.18742/rnvf-m076 ) 57 . Footnotes Updated descriptions of Extension 5 in Materials and Methods and in the supplementary information, clarifying how we circumvent the capping of small LD scores to one. 
Removed some mentions of sampling distributions in the supplementary information to make these distinct from the distributions of test variables. Some other minor cosmetic changes. 9 REFERENCES 1. ↵ Abdellaoui , A. & Verweij , K. J. H. Dissecting polygenic signals from genome-wide association studies on human behaviour . Nat. Hum. Behav . 1 – 9 ( 2021 ) doi: 10.1038/s41562-021-01110-y . OpenUrl CrossRef PubMed 2. ↵ Pasaniuc , B. & Price , A. L. Dissecting the genetics of complex traits using summary association statistics . Nat. Rev. Genet . 18 , 117 – 127 ( 2017 ). OpenUrl CrossRef PubMed 3. ↵ Yang , J. et al. Common SNPs explain a large proportion of the heritability for human height . Nat. Genet . 42 , 565 – 569 ( 2010 ). OpenUrl CrossRef PubMed Web of Science 4. ↵ Yang , J. , Lee , S. H. , Goddard , M. E. & Visscher , P. M. GCTA: A tool for genome-wide complex trait analysis . Am. J. Hum. Genet . 88 , 76 – 82 ( 2011 ). OpenUrl CrossRef PubMed 5. ↵ Loh , P.-R. et al. Contrasting genetic architectures of schizophrenia and other complex diseases using fast variance-components analysis . Nat. Genet . 47 , 1385 – 1392 ( 2015 ). OpenUrl CrossRef PubMed 6. ↵ Loh , P.-R. et al. Efficient Bayesian mixed-model analysis increases association power in large cohorts . Nat. Genet . 47 , 284 – 290 ( 2015 ). OpenUrl CrossRef PubMed 7. ↵ Speed , D. , Hemani , G. , Johnson , M. R. & Balding , D. J. Improved Heritability Estimation from Genome-wide SNPs . Am. J. Hum. Genet . 91 , 1011 – 1021 ( 2012 ). OpenUrl CrossRef PubMed 8. ↵ Barry , C.-J. S. et al. How to estimate heritability: a guide for genetic epidemiologists . Int. J. Epidemiol . 52 , 624 – 632 ( 2023 ). OpenUrl CrossRef PubMed 9. ↵ Bulik-Sullivan , B. K. et al. LD Score regression distinguishes confounding from polygenicity in genome-wide association studies . Nat. Genet . 47 , 291 – 295 ( 2015 ). OpenUrl CrossRef PubMed 10. ↵ Speed , D. & Balding , D. J. 
SumHer better estimates the SNP heritability of complex traits from summary statistics . Nat. Genet . 51 , 277 – 284 ( 2019 ). OpenUrl PubMed 11. ↵ van Rheenen , W. , Peyrot , W. J. , Schork , A. J. , Lee , S. H. & Wray , N. R. Genetic correlations of polygenic disease traits: from theory to practice . Nat. Rev. Genet . 20 , 567 – 581 ( 2019 ). OpenUrl PubMed 12. ↵ Grotzinger , A. D. et al. Genomic structural equation modelling provides insights into the multivariate genetic architecture of complex traits . Nat. Hum. Behav . 3 , 513 – 525 ( 2019 ). OpenUrl PubMed 13. ↵ Zhu , Z. et al. Causal associations between risk factors and common diseases inferred from GWAS summary data . Nat. Commun . 9 , 224 ( 2018 ). OpenUrl CrossRef PubMed 14. ↵ Turley , P. et al. Multi-trait analysis of genome-wide association summary statistics using MTAG . Nat. Genet . 50 , 229 – 237 ( 2018 ). OpenUrl CrossRef PubMed 15. ↵ Willer , C. J. , Li , Y. & Abecasis , G. R. METAL: fast and efficient meta-analysis of genomewide association scans . Bioinformatics 26 , 2190 – 2191 ( 2010 ). OpenUrl CrossRef PubMed Web of Science 16. ↵ Speed , D. , Cai , N. , Johnson , M. R. , Nejentsev , S. & Balding , D. J. Reevaluation of SNP heritability in complex human traits . Nat. Genet . 49 , 986 – 992 ( 2017 ). OpenUrl CrossRef PubMed 17. ↵ Davies , M. R. et al. The Genetic Links to Anxiety and Depression (GLAD) Study: Online recruitment into the largest recontactable study of depression and anxiety . Behav. Res. Ther . ( 2019 ) doi: 10.1016/j.brat.2019.103503 . OpenUrl CrossRef 18. ↵ Monssen , D. et al. The United Kingdom Eating Disorders Genetics Initiative . Int. J. Eat. Disord . 57 , 1145 – 1159 ( 2024 ). OpenUrl PubMed 19. ↵ Bulik , C. M. et al. The Eating Disorders Genetics Initiative (EDGI): study protocol . BMC Psychiatry 21 , 234 ( 2021 ). OpenUrl CrossRef PubMed 20. ↵ Eysenck , H. J. & Eysenck , M. W. Personality and Individual Differences . Plenum Press N. Y . 
( 1985 ) doi: 10.1007/978-1-4613-2413-3 . OpenUrl CrossRef 21. ↵ Krueger , R. F. , Derringer , J. , Markon , K. E. , Watson , D. & Skodol , A. E. Initial construction of a maladaptive personality trait model and inventory for DSM-5 . Psychol. Med . 42 , 1879 – 1890 ( 2012 ). OpenUrl CrossRef PubMed 22. ↵ Maples , J. L. et al. Supplemental Material for Testing Whether the DSM-5 Personality Disorder Trait Model Can Be Measured With a Reduced Set of Items: An Item Response Theory Investigation of the Personality Inventory for DSM-5 . Psychol. Assess . 27 , 1195 – 1210 ( 2015 ). OpenUrl PubMed 23. ↵ Jiang , L. et al. A resource-efficient tool for mixed model association analysis of large-scale data . Nat. Genet . ( 2019 ) doi: 10.1038/s41588-019-0530-8 . OpenUrl CrossRef PubMed 24. ↵ Altshuler , D. M. et al. An integrated map of genetic variation from 1,092 human genomes . Nat. 2012 4917422 491 , 56 – 65 ( 2012 ). OpenUrl 25. ↵ Yang , J. et al. Genetic variance estimation with imputed variants finds negligible missing heritability for human height and body mass index . Nat. Genet . 47 , 1114 – 1120 ( 2015 ). OpenUrl CrossRef PubMed 26. ↵ Auton , A. et al. A global reference for human genetic variation . Nature 526 , 68 – 74 ( 2015 ). OpenUrl CrossRef PubMed 27. ↵ Bulik-Sullivan , B. K. LDSC (LD SCore) . ( 2015 ). 28. ↵ Zvrskovec , J. shru . https://github.com/johanzvrskovec/shru ( 2023 ). 29. ↵ Murphy , A. E. & Skene , N. G. MungeSumstats: A Bioconductor package for the standardisation and quality control of many GWAS summary statistics . bioRxiv 2021.06.21.449239 ( 2021 ) doi: 10.1101/2021.06.21.449239 . OpenUrl Abstract / FREE Full Text 30. ↵ Wilcoxon , F. Individual Comparisons by Ranking Methods . Biom. Bull . 1 , 80 – 83 ( 1945 ). OpenUrl CrossRef 31. ↵ Benjamini , Y. & Hochberg , Y. Controlling the False Discovery Rate: A Practical and Powerful Approach to Multiple Testing . J. R. Stat. Soc. Ser. B Methodol . 57 , 289 – 300 ( 1995 ). OpenUrl CrossRef 32. 
↵ Gao , X. , Starmer , J. & Martin , E. R. A multiple testing correction method for genetic association studies using correlated single nucleotide polymorphisms . Genet. Epidemiol . 32 , 361 – 369 ( 2008 ). OpenUrl CrossRef PubMed Web of Science 33. Nyholt , D. R. A Simple Correction for Multiple Testing for Single-Nucleotide Polymorphisms in Linkage Disequilibrium with Each Other . Am. J. Hum. Genet . 74 , 765 – 769 ( 2004 ). OpenUrl CrossRef PubMed Web of Science 34. ↵ Cheverud , J. M. A simple correction for multiple comparisons in interval mapping genome scans . Heredity 87 , 52 – 58 ( 2001 ). OpenUrl CrossRef PubMed Web of Science 35. Purves , K. L. et al. A major role for common genetic variation in anxiety disorders . Mol. Psychiatry ( 2019 ) doi: 10.1038/s41380-019-0559-1 . OpenUrl CrossRef PubMed 36. Kessler , R. C. et al. The global burden of mental disorders: An update from the WHO World Mental Health (WMH) Surveys . Epidemiol. Psichiatr. Soc . 18 , 23 – 33 ( 2009 ). OpenUrl CrossRef PubMed Web of Science 37. Stahl , E. A. et al. Genome-wide association study identifies 30 loci associated with bipolar disorder . Nat. Genet . 51 , 793 – 803 ( 2019 ). OpenUrl CrossRef PubMed 38. Kessler , R. C. , Petukhova , M. , Sampson , N. A. , Zaslavsky , A. M. & Wittchen , H.-U. Twelve-month and lifetime prevalence and lifetime morbid risk of anxiety and mood disorders in the United States . Int. J. Methods Psychiatr. Res . 21 , 169 – 184 ( 2012 ). OpenUrl CrossRef PubMed 39. Pulit , S. L. et al. Meta-analysis of genome-wide association studies for body fat distribution in 694 649 individuals of European ancestry . Hum. Mol. Genet . 28 , 166 – 174 ( 2019 ). OpenUrl CrossRef PubMed 40. Wray , N. R. et al. Genome-wide association analyses identify 44 risk variants and refine the genetic architecture of major depression . Nat. Genet . 50 , 668 – 681 ( 2018 ). OpenUrl CrossRef PubMed 41. Kessler , R. C. & Bromet , E. J. The Epidemiology of Depression Across Cultures . 
Annu. Rev. Public Health 34 , 119 – 138 ( 2013 ). OpenUrl CrossRef PubMed Web of Science 42. Howard , D. M. et al. Genome-wide meta-analysis of depression identifies 102 independent variants and highlights the importance of the prefrontal brain regions . Nat. Neurosci . 22 , 343 – 352 ( 2019 ). OpenUrl CrossRef PubMed 43. Lee , J. J. et al. Gene discovery and polygenic prediction from a genome-wide association study of educational attainment in 1.1 million individuals . Nat. Genet. 2018 508 50 , 1112 – 1121 ( 2018 ). OpenUrl CrossRef PubMed 44. Jansen , P. R. et al. Genome-wide analysis of insomnia in 1,331,010 individuals identifies new risk loci and functional pathways . Nat. Genet . 51 , 394 – 403 ( 2019 ). OpenUrl CrossRef PubMed 45. Morphy , H. , Dunn , K. M. , Lewis , M. , Boardman , H. F. & Croft , P. R. Epidemiology of Insomnia: a Longitudinal Study in a UK Population . Sleep 30 , 274 – 280 ( 2007 ). OpenUrl PubMed Web of Science 46. Nagel , M. et al. Meta-analysis of genome-wide association studies for neuroticism in 449,484 individuals identifies novel genetic loci and pathways . Nat. Genet. 2018 507 50 , 920 – 927 ( 2018 ). OpenUrl CrossRef PubMed 47. Pardiñas , A. F. et al. Common schizophrenia alleles are enriched in mutation-intolerant genes and in regions under strong background selection . Nat. Genet . 50 , 381 – 389 ( 2018 ). OpenUrl CrossRef PubMed 48. McGrath , J. , Saha , S. , Chant , D. & Welham , J. Schizophrenia: A Concise Overview of Incidence, Prevalence, and Mortality . Epidemiol. Rev . 30 , 67 – 76 ( 2008 ). OpenUrl CrossRef PubMed Web of Science 49. ↵ Friedl , H. & Stampfer , E. Jackknife Resampling . Encycl. Environmetrics 2 , ( 2001 ). 50. ↵ Efron , B. Nonparametric estimates of standard error: The jackknife, the bootstrap and other methods . Biometrika 68 , 589 – 599 ( 1981 ). OpenUrl CrossRef Web of Science 51. ↵ King , G. & Roberts , M. E. 
How Robust Standard Errors Expose Methodological Problems They Do Not Fix, and What to Do About It . Polit. Anal . 23 , 159 – 179 ( 2015 ). OpenUrl CrossRef 52. ↵ Speed , D. , Holmes , J. & Balding , D. J. Evaluating and improving heritability models using summary statistics . Nat. Genet . 52 , 458 – 462 ( 2020 ). OpenUrl CrossRef PubMed 53. ↵ Bulik-Sullivan , B. Relationship between LD Score and Haseman-Elston Regression. 018283 Preprint at doi: 10.1101/018283 ( 2015 ). OpenUrl Abstract / FREE Full Text 54. ↵ Werme , J. , Sluis , S. van der , Posthuma , D. & Leeuw , C. A. de. LAVA: An integrated framework for local genetic correlation analysis . bioRxiv ( 2021 ) doi: 10.1101/2020.12.31.424652 . OpenUrl Abstract / FREE Full Text 55. ↵ Privé , F. Optimal linkage disequilibrium splitting . Bioinformatics 38 , 255 – 256 ( 2022 ). OpenUrl 56. ↵ Muggeo , V. M. R. Estimating regression models with unknown break-points . Stat. Med . 22 , 3055 – 3071 ( 2003 ). OpenUrl CrossRef PubMed Web of Science 57. ↵ King’s College London. King’s Computational Research, Engineering and Technology Environment (CREATE) . ( 2022 ) doi: 10.18742/rnvf-m076 . OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted May 13, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following LDSC++: Improving linkage disequilibrium score regression estimation of heritability and genetic correlation for multivariate GWAS analysis Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. 
Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share LDSC++: Improving linkage disequilibrium score regression estimation of heritability and genetic correlation for multivariate GWAS analysis Johan Zvrskovec , Alexandra Gillett , Michel Nivard , Jonathan R I Coleman , Christopher Hübel , Raquel Iniesta , Gerome Breen medRxiv 2025.04.07.25324946; doi: https://doi.org/10.1101/2025.04.07.25324946 Share This Article: Copy Citation Tools LDSC++: Improving linkage disequilibrium score regression estimation of heritability and genetic correlation for multivariate GWAS analysis Johan Zvrskovec , Alexandra Gillett , Michel Nivard , Jonathan R I Coleman , Christopher Hübel , Raquel Iniesta , Gerome Breen medRxiv 2025.04.07.25324946; doi: https://doi.org/10.1101/2025.04.07.25324946 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Genetic and Genomic Medicine Subject Areas All Articles Addiction Medicine (570) Allergy and Immunology (864) Anesthesia (302) Cardiovascular Medicine (4445) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1515) Epidemiology (15236) Forensic Medicine (30) Gastroenterology (1127) Genetic and Genomic Medicine (6610) Geriatric Medicine (669) Health Economics (1000) Health Informatics (4549) Health Policy (1370) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1266) Infectious Diseases (except HIV/AIDS) (15926) Intensive Care and Critical Care Medicine (1104) Medical Education (623) Medical Ethics (147) Nephrology (668) Neurology (6613) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1147) Occupational and Environmental Health (957) Oncology (3341) Ophthalmology (975) Orthopedics (369) 
Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1694) Pharmacology and Therapeutics (693) Primary Care Research (714) Psychiatry and Clinical Psychology (5458) Public and Global Health (9244) Radiology and Imaging (2205) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1197) Rheumatology (596) Sexual and Reproductive Health (715) Sports Medicine (530) Surgery (713) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a02386ab8a3edfa9',t:'MTc3OTg2OTI0Nw=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00