Assessing the genetic contribution of cumulative behavioral factors associated with longitudinal type 2 diabetes risk highlights adiposity and the brain-metabolic axis

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 66,246 characters · extracted from preprint-html · click to expand
Assessing the genetic contribution of cumulative behavioral factors associated with longitudinal type 2 diabetes risk highlights adiposity and the brain-metabolic axis | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Assessing the genetic contribution of cumulative behavioral factors associated with longitudinal type 2 diabetes risk highlights adiposity and the brain-metabolic axis Nuno R. G. Carvalho , Yixuan He , Patrick Smadbeck , Jason Flannick , Josep M. Mercader , Miriam Udler , Arjun K Manrai , View ORCID Profile Jordi Moreno , View ORCID Profile Chirag J. Patel doi: https://doi.org/10.1101/2024.01.30.24302019 Nuno R. G. Carvalho 1 School of Biological Sciences; Georgia Institute of Technology ; Atlanta, GA, 30332, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Yixuan He 2 Programs in Metabolism and Medical and Population Genetics, Broad Institute of Harvard and MIT , Boston, MA, 02142, USA 3 Stanley Center for Psychiatric Research, Broad Institute of MIT and Harvard , Cambridge, MA, 02142, USA 4 Analytic and Translational Genetics Unit, Massachusetts General Hospital , Boston, MA, 02114, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Patrick Smadbeck 2 Programs in Metabolism and Medical and Population Genetics, Broad Institute of Harvard and MIT , Boston, MA, 02142, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jason Flannick 2 Programs in Metabolism and Medical and Population Genetics, Broad Institute of Harvard and MIT , Boston, MA, 02142, USA 5 Division of Genetics and Genomics, Boston Children’s Hospital , Boston, MA, 02115, USA 6 Department of Pediatrics, Harvard Medical School , Boston, MA, 02115, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Josep M. Mercader 2 Programs in Metabolism and Medical and Population Genetics, Broad Institute of Harvard and MIT , Boston, MA, 02142, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Miriam Udler 2 Programs in Metabolism and Medical and Population Genetics, Broad Institute of Harvard and MIT , Boston, MA, 02142, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Arjun K Manrai 9 Department of Biomedical Informatics, Harvard Medical School , Boston, MA, 02115, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jordi Moreno 2 Programs in Metabolism and Medical and Population Genetics, Broad Institute of Harvard and MIT , Boston, MA, 02142, USA 7 Department of Medicine, Harvard Medical School , Boston, MA, 02115, USA 8 Diabetes Unit and Center for Genomic Medicine, Massachusetts General Hospital , Boston, MA, 02114, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jordi Moreno Chirag J. Patel 9 Department of Biomedical Informatics, Harvard Medical School , Boston, MA, 02115, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Chirag J. Patel For correspondence: chirag_patel{at}hms.harvard.edu Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract While genetic factors, behavior, and environmental exposures form a complex web of interrelated associations in type 2 diabetes (T2D), their interaction is poorly understood. Here, using data from ∼500K participants of the UK Biobank, we identify the genetic determinants of a “polyexposure risk score” (PXS) a new risk factor that consists of an accumulation of 25 associated individual-level behaviors and environmental risk factors that predict longitudinal T2D incidence. PXS-T2D had a non-zero heritability (h 2 = 0.18) extensive shared genetic architecture with established clinical and biological determinants of T2D, most prominently with body mass index (genetic correlation [r g ] = 0.57) and Homeostatic Model Assessment for Insulin Resistance (r g = 0.51). Genetic loci associated with PXS-T2D were enriched for expression in the brain. Biobank scale data with genetic information illuminates how complex and cumulative exposures and behaviors as a whole impact T2D risk but whose biology have been elusive in genome-wide studies of T2D. Diabetes is a complex disease with many genetic, environmental, and behavioral factors hypothesized to have a role in etiology and disease progression. However, most studies focus on a single modality and the complex interplay between these factors across domains in diabetes onset has not been systematically characterized. 1 – 3 While genetic and environmental factors are traditionally modeled as independent axes of physiological variation, they are, in fact, correlated. 1 , 2 Work to uncover the correlation between genetic, environment, and behavioral factors has highlighted the importance of studying the “exposome.” 4 The exposome is a classification of non-genetically measured variables belonging to domains of lifestyle behavior (e.g., as diet, physical activity, and smoking), social standing (e.g., income, education), and physical-chemical (e.g., pollution) 5 . 6 – 8 Previously, we investigated domains of the exposome such as lifestyle behaviors and social factors, in prediction of incident type 2 diabetes (T2D). 9 , 10 We called individual factors of the exposome within the domains “ exposures. ” We developed a “polyexposure score” (PXS) composed from 12 individual-level exposures that were indicators of lifestyle, social standing, and physical-chemical factors, executing a longitudinal exposure-wide association study (ExWAS) to identify variables with robust statistical support. 6 The PXS played a complementary and independent role to a polygenic risk score (PRS) and traditional clinical risk factors (e.g., glycated hemoglobin A1C), body mass index [BMI], blood pressure, family history of disease, and cholesterol levels) in predicting incident T2D. Finding the role of antecedent exposures in diabetes physiology would complement recent advances in elucidating the biological function of genetic findings from large-scale GWAS. 11 , 12 However, the mechanistic role of the PXS in T2D and its genetic architecture have not been interrogated. In the following, we derive a new cumulative risk factor for T2D, called the PXS-T2D, and investigate the extent to which the composite PXS for incident T2D (PXS-T2D) and its individual-level behaviors are genetically heritable. We also investigate whether their genetic architectures are similar to that of clinical risk factors for disease. We focus on the subset of the exposome pertaining to individually-measured behaviors and study the phenomena of gene-exposure correlation (e.g. 13 ) to understand the relationship between the totality of exposure behaviors, as ascertained by the PXS, in T2D. We estimate the heritability and genetic correlations between behaviors and metabolic measurements and map associated variants to genes and tissue expression patterns, revealing the PXS is heritable and shares genetic architecture with antecedents of the disease and its complications. We show that elucidation of gene-exposure correlation at biobank scale enhances the identification of causal connections between exposures and physiological factors that are elusive in current day diabetes research. Results Here, we systematically investigated the network of type 2 diabetes etiology ( Figure 1A-C ). We expanded on the model of He et al. 9 ( Figure 1B ) by estimating the longitudinal risk for diabetes as a function of multiple behavior factors, creating a new cumulative score called PXS-T2D ( Figure 1A , C). Next, we calculated the correlation between PXS-T2D and the polygenic risk score as well as the genetic correlation between PXS-T2D and clinical risk factors of type 2 diabetes ( Figure 1B ). We identified the genetic variants associated with the PXS-T2D and its component behaviors, for which we also compute genetic correlations with clinical risk factors ( Figure 1C ). The mean time to T2D diagnosis (incident T2D) was 2,741 days (7.51 years, range: 2–5242 days, standard deviation: 1174.4 days). Download figure Open in new tab Fig. 1. Model for the etiology of type 2 diabetes. Our model for type 2 diabetes (T2D) risk (A). The central columns (B) consists of the polygenic risk score (PRS), polyexposure score (PXS-T2D), and clinical risk factors (CRFs), which were considered in He et al. 9 to predict incident T2D in the UK Biobank participants. In this paper, we investigate the genetic components of PXS-T2D and the 25 behavioral components that make it up (C), and how they correlate with clinical risk factors. Arrows shown in a darker shade of blue consist of relationships explored in this paper, and the methods employed are listed. Exposure-wide association study and PXS derivation After false-discovery rate (FDR) correction, 14 84 variables remained with FDR-adjusted p-value less than 0.05 (Table S1). The final PXS-T2D model consisted of linear weights for 25 behavior variables in addition to age, sex, and 40 genetic principal components (Table S2) and predicted future diabetes with an area under the curve (AUC) of 0.74. Factors in the PXS-T2D included alcohol intake (Hazard Ratio = 1.2, p = 2 x 10 -43 ), frequency of daytime naps (HR = 1.25, p = 6 x 10 -15 ), current smoker (vs. non-smokers; HR = 1.2, p = 1 x 10 -10 ), diet variety (HR = 1.3, p = 7 x 10 -15 ) and time watching television (HR = 1.2, p = 3 x 10 -8 ) associated with increased risk of future T2D. We also found factors such as walking pace (HR = 0.7, p = 4 x 10 -34 ) and moderate physical activity (HR = 0.97, p = 9 x 10 -5 ) associated with decreased risk for T2D. We note these were independently associated with T2D. The 25 behavioral exposures were weakly correlated with each other (Figure S1). The Polyexposure Score (PXS) is weakly correlated with the T2D Polygenic Risk Score, but is causally associated with Type 2 Diabetes We used the PRS for T2D present in the UK Biobank 15 to compute the correlation between the PRS and PXS for T2D. The correlation between the two variables was low, but significant given the large sample size (r = 0.0422, p < 2.2 x 10 -16 , Figure S2). We were next interested in the potential causal relationship between the PXS-T2D and T2D. We used an approach called “Mendelian Randomization,” 16 a method that associates genetic variants as proxies for exposures to disease outcomes, mitigating confounding that is common in observational/non-experimental studies. We input GWAS-significant SNP summary statistics for PXS-T2D (obtained via a GWAS in the UK Biobank, results discussed below) and GWAS summary statistics for T2D incidence in an inverse variance weighted Mendelian Randomization. 17 PXS-T2D was associated causally for incident T2D (effect size = 0.072, 95% CI [0.065, 0.079], p < 1E-3). We also tested the reverse direction and had no statistically significant evidence to support that the association was reverse causal (effect size = -0.176 [-0.389, 0.037], p = 0.104). When using a broader definition for T2D that included cases before the first assessment, we found T2D to have a slightly stronger and significant causal association with PXS-T2D (effect size = 0.082 [0.030, 0.133], p = 0.002). PXS-T2D and its individual component exposure behaviors are heritable We estimated SNP-based heritabilities for PXS-T2D and its 25 behavioral components. PXS-T2D has a heritability of 0.184 (95% CI [0.178, 0.190]), greater than the heritability of broadly defined (both incident and cross-sectional cases combined) T2D (h 2 =0.109, [0.106, 0.113]) and of incident T2D (h 2 =0.038, [0.034, 0.041]). We estimated the heritability of BMI-adjusted PXS-T2D and found a modest decrease in heritability compared to its non-adjusted counterpart (h 2 = 0.144 [0.138, 0.149] vs. h 2 = 0.184). The heritability of 25 individual behaviors ranged from h 2 = 0.0127 [0.00946, 0.0159] for “Renting for private landlord or letting agency” to h 2 = 0.143 [0.138, 0.147] for “Time spent watching television.” The most heritable behaviors also included “Alcohol intake frequency” (h 2 = 0.120, [0.116, 0.124]) and “Nap during day” (h 2 = 0.119, [0.115, 0.123]). Heritability of all behaviors are in Table 1 . No individual behavior had a higher heritability than PXS-T2D, even after adjusting it for BMI. View this table: View inline View popup Download powerpoint Table 1: Number of samples collected per time interval. Genetic markers associated with PXS-T2D and behaviors Using the PXS-T2D model, we computed the PXS score for each subject in the UK Biobank and performed a Genome-Wide Association Study (GWAS) for PXS-T2D and all its component exposure behaviors ( Table 1 ). For PXS-T2D, we identified 6,306 SNPs below the genome-wide significance threshold (p < 5 x 10 -8 ), which mapped to 342 genes and 88 genomic loci ( Figure 2 , Table S3). The most significant locus was rs13135092 (beta = -0.0276, p = 3.5 x 10 -20 ), an intronic variant found in chromosome 4. This SNP maps closely onto the SLC39A8 gene, which encodes the manganese solute carrier ZIP8 and is associated with neurological disorders like congenital disorder of glycosylation type II. 18 SLC39A8 was not found to be associated with T2D in the T2DKP 19 , 20 (z = 1.53, p = 0.063), but the gene includes SNPs that have achieved GWAS-significant association with body mass index (BMI), diastolic blood pressure, triglycerides, and high density lipoprotein (HDL) cholesterol, and Insulin Growth Factor-1 (IGF-1). 19 SLC39A8 was also associated with behavior variables such as walking pace (beta = 0.0205, p = 9.2 x 10 -16 ), Alcohol intake (beta = -0.0384, p = 7.8 x 10 -11 ), “Sleep duration” (beta = 0.0297, p = 1.5 x 10 -10 ), and “Time watching TV” (beta = -0.0192, p = 1.9 x 10 -9 ); all associations were directionally consistent with those for PXS-T2D and T2D. Another gene within the same locus as rs13135092 is the BANK1 gene, associated with systemic sclerosis 21 and other autoimmune diseases 22 but not T2D in the T2DKP (p = 0.823). Download figure Open in new tab Fig. 2. Manhattan plot for the polyexposure score for type 2 diabetes. Results of genome-wide association study performed on the polyexposure score for type 2 diabetes. Of the 19,400,443 SNPs plotted, 6,306 exceed the Bonferroni significance threshold (p < 5 x 10 -8 ). The genomic inflation factor (λ GC ) is 1.22.. Significant loci with p < 10 -10 that were distant enough from other loci are labeled with their lead SNP and closest gene. We also found a missense variant, rs1260326, strongly associated with higher PXS-T2D scores (beta = 0.01, risk allele: T). This locus maps to GCKR (Glucokinase regulatory protein, Table S3, Figure 2 ), expressed both in the liver and pancreatic beta cells. The variant has strong prior association in GWASs for T2D (OR = 1.1, p < 7 x 10 - 52 ) and concordant in direction with respect to the risk allele (e.g., higher odds for T2D for individuals with the T allele). Interestingly, the variant is also associated with clinical risk factors, such as total cholesterol (p < 5 x 10 -324 ), triglycerides (p < 5 x 10 -324 ) and fasting glucose (adjusted for BMI, p < 7 x 10 -91 ). While the risk allele is associated with higher glucose levels (concordant with PXS-T2D and T2D), it is also associated with lower cholesterol and triglyceride levels. Other top loci included rs4587178 (beta = 0.0017, p = 3.8 x 10 -18 ), which was previously found to be associated with the first principal component of dietary patterns in the UK Biobank 23 (p = 9.7 x 10 -10 ) and is associated with higher urinary sodium excretion (p = 6.8 x 10 -9 ) in the T2DKP. Interestingly, it was not associated with T2D itself (p = 0.09, OR = 1.008). The next top locus was rs2280406 (beta = -0.0136, p = 1.8 x 10 -16 ), which has been associated with HDL cholesterol (p = 7.4 x 10 -56 ), BMI (p = 5.90 x 10 -42 ), and plasma C-reactive protein (2.25 x 10 -26 ), but narrowly misses genome-wide significance for type 2 diabetes (p = 6.78 x 10 -8 ). The locus maps to multiple genes, including MST1R , CTD-2330K9.3 , MON1A , TRAIP , and CAMKV . 18:21101658_TC_T (p = 4.70 x 10 -16 ) is also strongly associated with lower triglyceride levels (p = 8.34 x 10 -13 ). Across the 342 genes associated with PXS-T2D, 42 (12.4%) had a previous association with T2D, as currently documented by the T2DKP. Body Mass Index, FTO locus, and PXS-T2D A locus associated with FTO , rs9937521, known for its strong association with both obesity 24 and T2D (p = 3.5 x 10 -80 in the T2DKP), was significant in 8 of our component behavior GWAS including “White bread consumption”, “No recent dietary change”, and “Sleep Duration”. However, none of the SNPs that mapped onto the FTO gene were identified as genome-wide significant in our PXS-T2D GWAS (most significant SNP: rs9937521, p = 4.3 x 10 -6 ), although the SNP effect sizes in the FTO region were directionally consistent with their effects in T2D. SNPs found near the FTO region were significantly enriched for association with PXS-T2D (p = 3.9 x 10 -34 , Figure S3), with 19 SNPs reaching the threshold of suggestive significance (p < 10 -5 ). Colocalization analyses of GWAS results in the FTO region show strong posterior probability that PXS-T2D has the same causal variant as the other behaviors for which FTO was found to be significant in (Figure S4). A full list of all genomic loci and genes associated with PXS-T2D is shown in Table S3. BMI was by far the most replicated trait among our behaviors’ associated SNPs, followed by insomnia and T2D. Since the GWAS Catalog does not have standardized names for traits, we grouped the top 150 traits by replicated SNPs into 9 groups (traits within each group listed in Table S4). The most replicated trait group was “metabolic traits”, followed by “anthropometric traits” (mostly consisting of BMI and related metrics) and “cognitive/behavior traits” (see Tables S5 and S6). PXS-T2D exhibits genetic correlation with clinical risk factors and metabolic traits We estimated the genetic correlation between the PXS-T2D and six CRFs (BMI, glucose, triglycerides, systolic blood pressure, HDL, and HbA1c; Figure 3 ). All genetic correlations were significant. PXS-T2D had a moderate mean absolute genetic correlation (mean |r g | = 0.25) across the six CRFs, with BMI being its strongest correlation (r g = 0.57). We also estimated the same genetic correlations with our 25 component behaviors. “Usual walking pace” had the highest mean absolute genetic correlation (mean |r g | = 0.21) while also being the third most significant component of the PXS-T2D. For BMI, triglycerides, and HDL, the genetic correlation with the highest absolute value was with PXS-T2D (and not an individual behavior component). Download figure Open in new tab Fig. 3. Genetic correlation between PXS-T2D plus individual behaviors and T2D clinical risk factors. Genetic correlations (r g ) between T2D-associated behaviors (including PXS-T2D itself) and clinical risk factors for T2D as estimated by BOLT-REML. Only Bonferroni-adjusted significant genetic correlations have text displayed in the plot. Behaviors listed higher in the y-axis are also more strongly associated with incident T2D as reflected by their p-values in the PXS. We also estimated the genetic correlation using LD-score correlation using PXS-T2D summary statistics and from summary statistics in the T2DKP (e.g., 25 Figure S8) to more broadly examine T2D-related physiological traits, including fasting insulin and proxies of insulin resistance (e.g., HOMA-IR). First, we found that LD-score-based genetic correlations between PXS-T2D and CRFs were not significantly different in the T2DKP vs. UKBB, with the exception of HbA1c (r g = 0.123, [0.090, 0.156] in UK Biobank vs. r g = 0.242, [0.192, 0.292] in T2DKP) and random glucose (r g = 0.055, [0.0003, 0.1096] vs. r g = 0.181, [0.1102, 0.253]). This is likely due to our inclusion criteria for the PXS generation: we removed individuals who had HbA1c values above 48 mmol/mol (see Methods). Furthermore, we found that the observational correlation between HbA1c and glucose is significantly smaller when individuals with higher baseline HbA1c are removed (r = 0.617, [0.615, 0.619] vs. r = 0.212, [0.209, 0.215]). We found that PXS-T2D and incident T2D were moderately genetically correlated (r g = 0.474). Next, we correlated the PXS-T2D with fasting glucose, fasting insulin, HbA1c, BMI, HOMA-IR, and HOMA-B. We found strong genetic correlations between PXS-T2D and HOMA-IR (r g = 0.512, [0.360, 0.664]) and HOMA-B (r g = 0.295, [0.181, 0.410]). On the other hand, we found weaker and non-significant correlations with fasting glucose (r g = -0.006, [-0.091, 0.079]) and 2-hour glucose (r g = 0.056, [-0.058, 0.170]). Compared to fasting glucose and 2-hour glucose, we found higher and significant correlations with fasting insulin (r g = 0.143, [0.0599, 0.226]) and HbA1c (r g = 0.168, [0.0949, 0.241]. Interestingly, BMI had a significantly stronger genetic correlation with PXS-T2D than with T2D itself (r g = 0.57 vs. r g = 0.42 respectively), while the opposite was true for glucose, HbA1c, HDL, and systolic blood pressure (Figure S5). We provide a broad atlas of genetic correlation for traits in the T2DKP (Table S7, n = 628). In addition to BMI and HOMA-IR, the phenotypes with the largest genetic correlation with PXS-T2D included Non-Alcoholic Fatty Liver Disease ([NAFLD] r g = 0.75, p = 1.4 x 10 -21 ) and gastroesophageal reflux disease (r g = 0.72, p < 1 x 10 -20 ). Tissue expression of behavior-associated genes Given that PXS-T2D shares genetic architecture with metabolic traits, we hypothesized that associated variant’s mapped genes should have similar expression patterns. After Bonferroni correction, the only tissue types of the 30 in GTEx to be significantly enriched in expression for any behavior’s or PXS-T2D’s associated genes are the brain and the pituitary ( Figure 4 , Figure S6), with the exception of the association between “Major dietary changes in the last 5 years because of illness” and testis tissue (p = 0.0183). Brain tissue was most strongly enriched for expression for the traits “Nap during day” (p = 5.10 x 10 -10 ), “Sleep duration” (p = 4.11 x 10 -9 ), and “Time spent watching television” (p = 6.89 x 10 -9 ). Adjusting PXS-T2D for BMI still yielded significant expression enrichment in brain tissue (p = 6.42 x 10 -5 ). Download figure Open in new tab Fig. 4. Enriched expression of behaviors’ associated genes across 30 tissue types. GWAS summary statistics for PXS-T2D and its 25 behaviors components were fed into FUMA to calculate the significance of differential expression in 30 tissue types and 53 specific tissues in GTEx. Within each of the two analyses, we further Bonferroni-adjusted the p-values for the number of traits tested. The heatmap colors were set such that p = 0.05 appeared as white, p > 0.05 appeared as red, and p < 0.05 appeared as green. Only tissue types (left section) and specific tissues (right section) with significant expression in at least one trait are shown and combined into one plot. The top row consists of tissue expressions for PXS-T2D, and behaviors listed higher in the y-axis are also more strongly associated with incident T2D as reflected by their p-values in the PXS. For the full expression heatmaps for all tissue types and specific tissues, see Figures S5 and S6 respectively. We found similar results when looking across GTEx’s 53 specific tissues, some of which overlap with tissue types tested above. Only brain-related tissue, the pituitary, and the testis are enriched for expression in any behavior (Figure S7). Among brain tissues, PXS-T2D is most strongly enriched in the cerebellum (p = 3.97 x 10 -8 ), frontal cortex (p = 4.39 x 10 -7 ), and hippocampus (p = 4.21 x 10 -6 ). Discussion In summary, we interrogated the genetic determinants of cumulative exposure behaviors that are predictive of longitudinal type 2 diabetes. Findings from longitudinal diabetes studies have shown that risk may manifest 10 years or greater before onset 26 , but not readily apparent via glucose levels 27 . Study of longitudinal exposures is important, but a challenge to understand how they exert their impact. Here, we conduct massive gene-by-exposure correlations to identify behavior exposures related to physiological components of T2D. Overall, we find (1) the genetic basis of a new latent behavior risk factor (the PXS-T2D) (2) the genetic architecture of the feature is connected with adiposity and insulin resistance, but not to glucose levels, complementary but distinct from current day T2D GWAS. We provide data resources for others to interrogate other components of T2D physiology. T2D is caused by a combination of decreased insulin sensitivity (i.e., increase in insulin resistance) and secretion or a “decanalization” of the steady state. 28 , 29 The underlying biological mechanisms by which behavioral exposure antecedents impact the steady state of insulin sensitivity and secretion, and ultimately T2D, are understudied. Re-analysis of GWAS of T2D and glycemic traits have recovered genetic signals that are associated with resistance and secretion to a varying degree. 11 , 30 , 31 A major contributor to insulin resistance includes higher BMI. 32 By comparing the genetic architecture of PXS-T2D with adiposity (e.g., BMI), cardiometabolic (e.g., triglycerides, cholesterol, blood pressure), and glycemic traits (e.g., hemoglobin A1c, glucose, insulin), we find that indeed the genetic architecture is largely shared between PXS-T2D and BMI (r g = 0.57). Notably, the correlation between PXS-T2D and BMI is greater than the correlation between PXS-T2D and T2D itself (r g = 0.47). We also found significant genetic correlation between PXS-T2D and HOMA-IR, HOMA-B, and triglyceride levels. In contrast, we observed smaller shared genetic architecture between glucose control and overall glucose levels. Our data on the PXS-T2D suggests that the role of PXS-captured behavior in T2D is via higher adiposity and potentially insulin resistance. Since these same clinical risk factors are associated with other detrimental health outcomes, estimation of genetic liability of cumulative unhealthy (or healthy) behavior can be potentially extended to diseases outside of diabetes. 33 Human behavior, such as physical activity and dietary intake, is a result of the complex interactions between individuals agents and the specific environmental contexts they are in. 13 , 23 , 34 , 35 Behavior is partly heritable, 36 with estimates ranging from 5-15% in SNP-based heritability estimates 37 to 30-60% in twin studies. 37 – 39 We believe that the genetic variants associated with PXS-T2D are effective at capturing shared genetic architecture across behavioral traits. This builds on efforts that examine behavior factors one at a time in GWAS. For example, Merino and colleagues recently identified genetic variants associated with dietary intake behavior and cardiometabolic traits. 13 Given that the PXS is a composite score of T2D risk-associated behavior, its genetic architecture could be understood as a measure of genetic liability of latent unhealthy behavior, or, in other words, behavior that is not directly measured by individual components, analogous “latent” traits in psychiatric research. 40 , 41 For example, first, we found the GWAS-based heritability of the PXS-T2D to be 19%, greater than any one of the behavioral components alone. Second, exploring the genetic component of PXS-T2D offers insights that are not found when interrogating T2D directly. This is evidenced by PXS-T2D and T2D only sharing about half of their genetic architecture (r g = 0.474) and that an overwhelming majority of genes associated with the former are not associated with latter phenotype. We found functional enrichment of PXS-T2D in brain tissue, particularly in the cerebellum and cortex. This is inline with personality- and dietary-related variants being expressed in the brain, 13 , 42 – 46 and recent studies have shown the important effect that brain-related variants have on metabolic health outcomes. 47 The only other tissue type enriched in expression among PXS-T2D-associated genes was the pituitary gland. Our paper comes with limitations. First, our GWAS had inflated genomic inflation factors ( Table 1 ), which can be a sign of population stratification. 48 We attempted to remedy this by using genetic principal components as covariates 49 in linear mixed model software optimized for controlling for population structure, 50 , 51 as well restricting our sample to self-reported “White British.” We therefore posit that the inflated lambdas in our GWAS are resulting from the high polygenicity 48 often found in personality traits. 43 , 46 A downside of filtering the genetic ancestral group used is that our results are less generalizable to other ancestral groups, compounded by the finding that lifestyle and psychological traits especially lack portability. 52 In order to equitably share the benefits of research to all, we acknowledge that genomics research needs to diversify the samples used in studies. 53 Furthermore, like all UK Biobank studies, our cohort is not entirely representative of the socioeconomic status and health outcomes of the general UK population. 54 UK Biobank participants also lack extensive fasting or oral glucose tolerance testing measurements to estimate insulin sensitivity and secretion, two critical axes of diabetes etiology. In future studies, we aim to perform extensive exposome-wide assessment along the axes of fasting insulin and glucose to pin down what behaviors matter, and when they matter, for beta cell function and insulin resistance. In this study, we attempt to disentangle the complex and correlated nature of behavioral exposures via a new computational construct, the polyexposure score (PXS). The PXS is an indicator of complex behavior exposures, summarizing activity, diet, and social exposure variables and is heritable, potentially impacting CRFs before T2D onset. Additionally, PXS may have implications for mental factors not previously linked to T2D, which merits further investigation. The trait correlations, associated genetic loci, and the tissues where variants impact expression largely align with those connected to adiposity. However, there are additional findings that include both established T2D risk factors (e.g., triglycerides) and potentially novel risk factors that could provide greater specificity and potency to existing models, such as complex associations in GCKR . 55 , 56 Highlighting these novel genetic loci may offer new insights into the intricate relationship between PXS and T2D risk. Online Methods All code and methods for reproducing the results of this paper is publicly available on our github repository. We deposit the PXS-T2D summary statistics in FigShare (doi: 10.6084/m9.figshare.24975564). The UK Biobank project number for this project was 2288; the Harvard University IRB approved of this study (IRB: IRB16-245). Study Participants The UK Biobank (UKBB) is a cohort consisting of ∼500,000 individuals recruited across 22 assessment centers in the United Kingdom between 2006 and 2010. 57 The UKBB assessed participants through questionnaires, physical measurements, and biological samples at the assessment center. Disease diagnoses were also attained via questionnaires and through linkages to participant health care provider data. Individuals were genotyped for over 800,000 single nucleotide polymorphisms (SNPs) using the UK BiLEVE Axiom Array or the UK Biobank Axiom Array. Genotypes were imputed to over 96 million SNPs using the Haplotype Reference Consortium, the UK10K panel, and the 1000 Genomes panel. 58 In our analysis, we filtered the sample to the 455,813 individuals with self-identified ethnic background of “White British” in order to reduce population structure which can inflate genetic variant associations with a phenotype. 48 For subsequent analyses, the remaining sample was randomly split into a training and validation group according to a 2:1 ratio. Prospective Type 2 Diabetes Definition We defined incident T2D as whether an individual had an ICD10 code of E11.X (non-insulin-dependent diabetes; T2D) reported for the first time after their first assessment with the UKBB. Those with diagnosed diabetes before their first assessment or HbA1c values above 48 mmol/mol were removed from the analysis. For supplementary analyses, we also defined a broader binary T2D variable purely by E11.X reported or diabetes self-reported at any time point, acknowledging that this may include Type 1 Diabetes cases. We defined time to incident T2D by the number of days between the day of an individual’s first assessment and the day of their T2D diagnosis. A total of 388,452 participants remained, 14,294 of which developed T2D after the first assessment. Building a Polyexposure Risk Score (PXS) for T2D We followed a similar procedure to that employed by He et al. 9 to calculate the PXS for incident T2D on UK Biobank participants. Among He et al.’s 111 UKBB fields representing the exposome, e.g., physical exposures (e.g, air pollution), and “lifestyle” behavior variables (e.g., smoking behavior), with greater than 90% coverage in the UK Biobank, we selected 65 individual-level exposure behavior variables (variables that are measured on individuals as opposed to external measures often measured at the neighborhood or regional level), which are listed in Table S1. We only analyzed behavioral exposures ascertained in the first examination. We used PHESANT, 59 a tool for standardizing UKBB diverse variable types (e.g., continuous, categorical, ordinal), to harmonize phenotypic data, which included dummy encoding categorical variables, yielding a total of 103 variables. Using a modified version of the software package PXStools, 10 we performed an exposure-wide association study (ExWAS) to associate each of the 103 exposome variables with incident T2D using Cox Proportional Hazards regression, controlled for sex, age, and the first 40 genetic principal components (PCs) as covariates. Only exposure variables with an FDR-adjusted p-value below 0.05 and their related binarized variables were passed onto the next step (e.g., for categorical variables that were split into binary variables, only one of these variables needed to be significant for all others to be included). Next, we fit a multivariate regression model as a function of the 84 ExWAS identified fields (which mapped to a total of 98 variables) using LASSO until only independently significant (p < 0.05) variables remain, again also adjusting for age, sex, and the first 40 genetic PCs. The coefficient of each regression term allows us to compute the polyexposure score for type 2 diabetes (PXS-T2D) for individuals with complete data. Polygenic Risk Scores and Mendelian Randomization In order to quantify the relationship between PXS-T2D and polygenic risk scores (PRS) for T2D, we extracted field 26285 from the UK Biobank, which contains a PRS for T2D for over 486,000 participants trained on external data by Thompson et al. 15 We note that the PRS-T2D was not trained on the exact same definition of incident T2D that we used for our PXS. We then calculated the correlation between the PXS-T2D and PRS-T2D of an individual. Furthermore, we used the inverse-variance weighted (IVW) method in the MendelianRandomization R package 60 to estimate causal relationships between PXS-T2D and incident T2D. We used significantly associated variants for each phenotype derived from our genome-wide association studies (described below) as instrumental variables for Mendelian randomization in each direction. Performing genome wide associations for PXS-T2D and behaviors We used BOLT-LMM v2.3.2 51 , 61 to perform a genome-wide association study (GWAS) on the PXS-T2D phenotype, the 25 behavioral phenotypes that composed it, and incident T2D itself. We filtered the full set of 96 million imputed SNPs to just those with a minor allele frequency (MAF) above 0.001 and an imputation information score (INFO) above 0.3, narrowing the set down to 19,400,443 markers. We used LD scores from the 1000 Genomes Project 62 European cohort. Sex, age, the assessment center where data was collected, and the first 40 PCs were covariates. We calculated the lambda genomic inflation factor (λ GC ) for each GWAS as the ratio of median 2 statistic to the expected median 2 statistic (∼0.455). Annotating GWAS variants to function We used FUMA to annotate variants associated with PXS-T2D, which calls the MAGMA software and inputs GTEx data, which links genetic variants to tissue specific gene expression, and the GWAS Catalog, which is a database of documented variant-phenotype associations. 63 – 69 We also extracted variant- and gene-level associations with the T2D phenotype on the Common Metabolic Disease Knowledge Portal 19 (T2DKP, https://t2d.hugeamp.org/ ), which meta-analyzed 44 individual T2D GWAS. We also used the T2DKP to identify our significant variants’ associations with other biologically relevant phenotypes Estimating heritability of PXS-T2D and behavior variables We used BOLT-REML for estimating narrow-sense GWAS-based heritability of the same set of PXS-T2D and 25 individual behavior constituent variables. We used the same SNP-filtering settings and covariates as in the BOLT-LMM GWAS. We used the --remlNoRefine flag in BOLT-REML, which speeds up computation time by a factor of 2 to 3 at the expense of standard errors being around 1.03 times greater. Computing genetic correlation between PXS-T2D and metabolic risk factors We obtained clinical risk factors including Body Mass Index (BMI), non-fasting glucose, triglycerides, systolic blood pressure, and high density lipoprotein (HDL) cholesterol, and hemoglobin A1c (HbA1c). Genetic correlation is one tool to help elucidate causal relationships between phenotypes in lieu of an experiment or a randomized trial. 70 Here, we wished to demonstrate the genetic correlation between PXS-T2D and T2D-related traits using observational association data and summary statistics. Using individual-level data from participants of the UK Biobank, we used BOLT-REML to estimate the genetic correlation between pairs of phenotypes and T2D-PXS. We used identical SNP-filtering steps, covariates, and --remlNoRefine flag as in the BOLT-LMM GWAS analysis. We performed genetic correlations between T2D-PXS (and a BMI-adjusted PXS-T2D) and the six clinical risk factors listed above. We also used summary statistics data and pipelines from the T2DKP 20 to estimate genetic correlation between PXS-T2D and fasting glucose, fasting insulin, 2-hour glucose, HOMeostatic Assessment of Insulin Resistance (HOMA-IR) and Beta-cell function (HOMA-B) phenotypes. 71 HOMA-IR and -B are predicted estimates of insulin resistance and beta-cell function respectively. 72 To estimate genetic correlation for summary statistics, we used LDsc 70 , 73 with European LD scores as a reference. 62 We also used the coloc R package to perform colocalization analysis to identify overlapping genetic signals between phenotypes in select regions 74 . Data Availability All code and methods for reproducing the results of this paper is publicly available on our github repository. We deposit the PXS-T2D summary statistics in FigShare (doi: 10.6084/m9.figshare.24975564). Author Contributions Conceptualization, N.C and C.P.; Methodology, N.C and C.P.; Formal Analysis, N.C, P.S., and C.P.; Writing - Original Draft, N.C and C.P.; Writing - Review & Editing, N.C, Y.H., P.S., J.F., J.M.M., M.U., J.M, and C.P.; Visualization: N.C and C.P.; Supervision, C.P.; Project Administration, C.P.; Funding Acquisition, C.P. Declaration of Interests The authors declare no competing interests. Figure Legends Fig. S1. Correlation matrix of the 25 behavioral exposures making up the PXS-T2D. A heatmap matrix displaying the correlation between every pair of 25 behavior variables in the UK Biobank. The polycor R package was used to compute correlations between mixed data type variables. The data types of each variable are shown in Table S1. Correlation values are shown on the plot, with positive correlations shaded in green and negative correlations shaded in red. Lower magnitude correlations have a more muted color that is closer to white. The main diagonal is omitted due to all correlations being 1. The matrix is mirrored across the diagonal. Fig. S2. Correlation between PRS-T2D and PXS-T2D. Scatterplot between polygenic risk score for T2D and polyexposure score for T2D for 264,704 individuals in the UK Biobank. Trend line for the two variables is shown. The standard PRS for T2D was used, meaning that the GWAS training data is external to the UK Biobank. Fig. S3. Enrichment of PXS-T2D SNP associations in the FTO region. Manhattan plot for PXS-T2D associations within the FTO region (in dark green; additional 50 kb regions in each direction shown in light green). Despite zero SNPs exceeding the threshold for genome-wide significance (red line, p < 5 x 10 -8 ), 19 SNPs surpass the suggestive significance threshold (blue line, p < 1 x 10 -5 ). Horizontal segmented bars represent the mean -log 10 (P) for SNPs in the region. SNPs in the FTO region have a significantly higher mean -log 10 (P) than surrounding non- FTO SNPs (t = 13.5, p = 3.9 x 10 -34 ). Fig. S4. Pairwise colocalization analysis of GWAS results in the FTO region across 25 behaviors and PXS-T2D. Colocalization analysis of GWAS results in the FTO region (± 50 kb) among all pairs of 25 behaviors and PXS-T2D. The number in each tile is the posterior probability of the two traits having one common causal variant as implemented by the coloc.abf() function in the coloc R package. Axis labels that are bolded denote that the FTO gene was deemed to be significant for that trait, meaning that at least one SNP that maps onto the FTO gene had genome-wide significance. Note that some traits without such a SNP, like PXS-T2D, have a high probability of sharing a common variant with traits that are associated with FTO . Fig. S5. Comparison of genetic correlation between PXS-T2D and T2D. Barplot comparison of the genetic correlation between clinical risk factors and PXS-T2D vs T2D. Error bars shown are 95% confidence intervals, and the asterisks denote non-overlap between intervals within each CRF. Data for T2D’s genetic correlations taken from the T2DKP. HDL is the only clinical risk factor with a negative genetic correlation with PXS-T2D and with T2D. Fig. S6: Enriched expression of behaviors’ associated genes across 30 tissue categories. GWAS results for PXS-T2D and its 25 component behaviors were fed into FUMA to calculate the significance of differential expression in 30 tissue types in GTEx. We further Bonferroni-adjusted the p-values for the number of traits tested. The top row consists of tissue expressions for PXS-T2D, and behaviors listed higher in the y-axis are also more strongly associated with incident T2D as reflected by their p-values in the PXS. Fig. S7. Enriched expression of behaviors’ associated genes across 53 tissues. GWAS results for PXS-T2D and its 25 component behaviors were fed into FUMA to calculate the significance of differential expression in 53 specific tissues in GTEx. Many specific tissues are also listed as tissue types in Figure S6. We further Bonferroni-adjusted the p-values for the number of traits tested. The top row consists of tissue expressions for PXS-T2D, and behaviors listed higher in the y-axis are also more strongly associated with incident T2D as reflected by their p-values in the PXS. Fig. S8. Genetic correlation between behaviors + PXS-T2D and select glycemic traits. Genetic correlations (r g ) between T2D-associated behaviors (including PXS-T2D itself) and select glycemic traits associated with T2D as estimated by LDsc. Only Bonferroni-adjusted significant genetic correlations have text displayed in the plot. Behaviors listed higher in the y-axis are also more strongly associated with incident T2D as reflected by their p-values in the PXS. Acknowledgements We thank Jose Florez and Shamil Sunyaev for providing valuable feedback on the initial findings. This study was funded by NIEHS R01 ESS032470 and NIA RF1AG074372. We thank all participants and contributors of the UK Biobank for making this study possible. References 1. ↵ Abdellaoui , A. , Dolan , C. V. , Verweij , K. J. H. & Nivard , M. G . Gene-environment correlations across geographic regions affect genome-wide association studies . Nat. Genet . 54 , 1345 – 1354 ( 2022 ). OpenUrl CrossRef 2. ↵ Abdellaoui , A. et al. Genetic correlates of social stratification in Great Britain . Nat Hum Behav 3 , 1332 – 1342 ( 2019 ). OpenUrl 3. ↵ Dick , D. M . Gene-environment interaction in psychological traits and disorders . Annu. Rev. Clin. Psychol . 7 , 383 – 409 ( 2011 ). OpenUrl CrossRef PubMed 4. ↵ Wild , C. P . The exposome: from concept to utility . Int. J. Epidemiol . 41 , 24 – 32 ( 2012 ). OpenUrl CrossRef PubMed Web of Science 5. ↵ Vermeulen , R. , Schymanski , E. L. , Barabási , A.-L. & Miller , G. W . The exposome and health: Where chemistry meets biology . Science 367 , 392 – 396 ( 2020 ). OpenUrl Abstract / FREE Full Text 6. ↵ Manrai , A. K. et al. Informatics and Data Analytics to Support Exposome-Based Discovery for Public Health . Annu. Rev. Public Health 38 , 279 – 294 ( 2017 ). OpenUrl PubMed 7. Patel , C. J. , Bhattacharya , J. & Butte , A. J . An Environment-Wide Association Study (EWAS) on type 2 diabetes mellitus . PLoS One 5 , e10746 ( 2010 ). OpenUrl CrossRef PubMed 8. ↵ Patel , C. J. & Ioannidis , J. P. A . Studying the elusive environment in large scale . JAMA 311 , 2173 – 2174 ( 2014 ). OpenUrl CrossRef PubMed 9. ↵ He , Y. et al. Comparisons of Polyexposure, Polygenic, and Clinical Risk Scores in Risk Prediction of Type 2 Diabetes . Diabetes Care 44 , 935 – 943 ( 2021 ). OpenUrl Abstract / FREE Full Text 10. ↵ He , Y. & Patel , C. J . Software Application Profile: PXStools—an R package of tools for conducting exposure-wide analysis and deriving polyexposure risk scores . Int. J. Epidemiol . 52 , 633 – 640 ( 2022 ). OpenUrl 11. ↵ Udler , M. S. et al. Type 2 diabetes genetic loci informed by multi-trait associations point to disease mechanisms and subtypes: A soft clustering analysis . PLoS Med . 15 , e1002654 ( 2018 ). OpenUrl PubMed 12. ↵ Udler , M. S . Type 2 Diabetes: Multiple Genes, Multiple Diseases . Curr. Diab. Rep . 19 , 55 ( 2019 ). OpenUrl PubMed 13. ↵ Merino , J. et al. Genetic analysis of dietary intake identifies new loci and functional links with metabolic traits . Nat Hum Behav 6 , 155 – 163 ( 2022 ). OpenUrl 14. ↵ Benjamini , Y. & Hochberg , Y . Controlling the False Discovery Rate: A Practical and Powerful Approach to Multiple Testing . J. R. Stat. Soc. Series B Stat. Methodol . 57 , 289 – 300 ( 1995 ). OpenUrl 15. ↵ Thompson , D. J. , et al. UK Biobank release and systematic evaluation of optimised polygenic risk scores for 53 diseases and quantitative traits . bioRxiv ( 2022 ) doi: 10.1101/2022.06.16.22276246 . OpenUrl CrossRef 16. ↵ Emdin , C. A. , Khera , A. V. & Kathiresan , S . Mendelian Randomization . JAMA 318 , 1925 – 1926 ( 2017 ). OpenUrl CrossRef PubMed 17. ↵ Burgess , S. , et al. Guidelines for performing Mendelian randomization investigations . Wellcome Open Research vol. 4 186 Preprint at doi: 10.12688/wellcomeopenres.15555.1 ( 2019 ). OpenUrl CrossRef PubMed 18. ↵ Bonaventura , E. et al. Clinical, molecular and glycophenotype insights in SLC39A8-CDG . Orphanet J. Rare Dis . 16 , 307 ( 2021 ). OpenUrl 19. ↵ Phenotype . https://t2d.hugeamp.org/phenotype.html?phenotype=T2D . 20. ↵ Costanzo , M. C. et al. The Type 2 Diabetes Knowledge Portal: An open access genetic resource dedicated to type 2 diabetes and related traits . Cell Metab . 35 , 695 – 710 .e6 ( 2023 ). OpenUrl CrossRef PubMed 21. ↵ Rueda , B. et al. BANK1 functional variants are associated with susceptibility to diffuse systemic sclerosis in Caucasians . Ann. Rheum. Dis . 69 , 700 – 705 ( 2010 ). OpenUrl Abstract / FREE Full Text 22. ↵ Gómez Hernández , G. , Morell , M. & Alarcón-Riquelme , M. E. The Role of BANK1 in B Cell Signaling and Disease . Cells 10 , ( 2021 ). 23. ↵ Cole , J. B. , Florez , J. C. & Hirschhorn , J. N . Comprehensive genomic analysis of dietary habits in UK Biobank identifies hundreds of genetic associations . Nat. Commun . 11 , 1467 ( 2020 ). OpenUrl CrossRef PubMed 24. ↵ Loos , R. J. F. & Yeo , G. S. H . The bigger picture of FTO: the first GWAS-identified obesity gene . Nat. Rev. Endocrinol . 10 , 51 – 61 ( 2014 ). OpenUrl CrossRef PubMed 25. ↵ Chen , J. et al. The trans-ancestral genomic architecture of glycemic traits . Nat. Genet . 53 , 840 – 860 ( 2021 ). OpenUrl CrossRef PubMed 26. ↵ Wang , T. J. et al. Metabolite profiles and the risk of developing diabetes . Nat. Med . 17 , 448 – 453 ( 2011 ). OpenUrl CrossRef PubMed Web of Science 27. ↵ Tabák , A. G. , Herder , C. , Rathmann , W. , Brunner , E. J. & Kivimäki , M . Prediabetes: a high-risk state for diabetes development . Lancet 379 , 2279 – 2290 ( 2012 ). OpenUrl CrossRef PubMed Web of Science 28. ↵ Kahn , S. E. , Hull , R. L. & Utzschneider , K. M . Mechanisms linking obesity to insulin resistance and type 2 diabetes . Nature 444 , 840 – 846 ( 2006 ). OpenUrl CrossRef PubMed Web of Science 29. ↵ Gibson , G . Decanalization and the origin of complex disease . Nat. Rev. Genet . 10 , 134 – 140 ( 2009 ). OpenUrl CrossRef PubMed Web of Science 30. ↵ Speliotes , E. K. et al. Association analyses of 249,796 individuals reveal 18 new loci associated with body mass index . Nat. Genet . 42 , 937 – 948 ( 2010 ). OpenUrl CrossRef PubMed Web of Science 31. ↵ Benjamin F Voight et al. Twelve type 2 diabetes susceptibility loci identified through large-scale association analysis . Nat. Genet . 42 , 579 – 589 ( 2010 ). OpenUrl CrossRef PubMed Web of Science 32. ↵ Kahn , B. B. & Flier , J. S. Obesity and insulin resistance . J. Clin. Invest . 106 , 473 – 481 ( 2000 ). OpenUrl CrossRef PubMed Web of Science 33. ↵ He , Y. & Patel , C. J . Shared exposure liability of type 2 diabetes and other chronic conditions in the UK Biobank . Acta Diabetol . ( 2022 ) doi: 10.1007/s00592-022-01864-5 . OpenUrl CrossRef 34. ↵ Doherty , A. et al. GWAS identifies 14 loci for device-measured physical activity and sleep duration . Nat. Commun . 9 , 5257 ( 2018 ). OpenUrl PubMed 35. ↵ Wang , Z. et al. Genome-wide association analyses of physical activity and sedentary behavior provide insights into underlying mechanisms and roles in disease prevention . Nat. Genet . 54 , 1332 – 1344 ( 2022 ). OpenUrl CrossRef 36. ↵ Goldberg , L. R . The structure of phenotypic personality traits . Am. Psychol . 48 , 26 – 34 . 37. ↵ Sanchez-Roige , S. , Gray , J. C. , MacKillop , J. , Chen , C.-H. & Palmer , A. A . The genetics of human personality . Genes Brain Behav . 17 , e12439 ( 2018 ). OpenUrl CrossRef PubMed 38. Jang , K. L. , Livesley , W. J. & Vernon , P. A . Heritability of the big five personality dimensions and their facets: a twin study . J. Pers . 64 , 577 – 591 ( 1996 ). OpenUrl CrossRef PubMed Web of Science 39. ↵ Vukasović , T. & Bratko , D . Heritability of personality: A meta-analysis of behavior genetic studies . Psychol. Bull . 141 , 769 – 785 ( 2015 ). OpenUrl CrossRef PubMed 40. ↵ Grotzinger , A. D. et al. Genomic structural equation modelling provides insights into the multivariate genetic architecture of complex traits . Nat Hum Behav 3 , 513 – 525 ( 2019 ). OpenUrl 41. ↵ Carey , C. E. , et al. Principled distillation of multidimensional UK Biobank data reveals insights into the correlated human phenome . bioRxiv ( 2022 ) doi: 10.1101/2022.09.02.22279546 . OpenUrl CrossRef 42. ↵ Lo , M.-T. et al. Genome-wide analyses for personality traits identify six genomic loci and show correlations with psychiatric disorders . Nat. Genet . 49 , 152 – 156 ( 2017 ). OpenUrl 43. ↵ Okbay , A. et al. Genetic variants associated with subjective well-being, depressive symptoms, and neuroticism identified through genome-wide analyses . Nat. Genet . 48 , 624 – 633 ( 2016 ). OpenUrl CrossRef PubMed 44. Nagel , M. et al. Meta-analysis of genome-wide association studies for neuroticism in 449,484 individuals identifies novel genetic loci and pathways . Nat. Genet . 50 , 920 – 927 ( 2018 ). OpenUrl CrossRef PubMed 45. Rietveld , C. A. et al. Common genetic variants associated with cognitive performance identified using the proxy-phenotype method . Proc. Natl. Acad. Sci. U. S. A . 111 , 13790 – 13794 ( 2014 ). OpenUrl Abstract / FREE Full Text 46. ↵ de Moor , M. H. M. et al. Meta-analysis of genome-wide association studies for personality . Mol. Psychiatry 17 , 337 – 349 ( 2010 ). OpenUrl PubMed 47. ↵ Zhao , Y. et al. Protein-truncating variants in BSN are associated with severe adult-onset obesity, type 2 diabetes and fatty liver disease . medRxiv ( 2023 ) doi: 10.1101/2023.06.14.23291368 . OpenUrl Abstract / FREE Full Text 48. ↵ Yang , J. et al. Genomic inflation factors under polygenic inheritance . Eur. J. Hum. Genet . 19 , 807 – 812 ( 2011 ). OpenUrl CrossRef PubMed 49. ↵ Price , A. L. et al. Principal components analysis corrects for stratification in genome-wide association studies . Nat. Genet . 38 , 904 – 909 ( 2006 ). OpenUrl CrossRef PubMed Web of Science 50. ↵ Yu , J. et al. A unified mixed-model method for association mapping that accounts for multiple levels of relatedness . Nat. Genet . 38 , 203 – 208 ( 2006 ). OpenUrl CrossRef PubMed Web of Science 51. ↵ Loh , P.-R. et al. Efficient Bayesian mixed-model analysis increases association power in large cohorts . Nat. Genet . 47 , 284 – 290 ( 2015 ). OpenUrl CrossRef PubMed 52. ↵ Carvalho , N. R. G. , Harris , A. M. & Lachance , J . Different genetic architectures of complex traits and their relevance to polygenic score performance in diverse populations . bioRxiv 2022.10.29.514295 ( 2023 ) doi: 10.1101/2022.10.29.514295 . OpenUrl Abstract / FREE Full Text 53. ↵ Popejoy , A. B. & Fullerton , S. M . Genomics is failing on diversity . Nature vol. 538 161 – 164 ( 2016 ). OpenUrl CrossRef PubMed 54. ↵ Fry , A. et al. Comparison of Sociodemographic and Health-Related Characteristics of UK Biobank Participants With Those of the General Population . Am. J. Epidemiol . 186 , 1026 – 1034 ( 2017 ). OpenUrl CrossRef PubMed 55. ↵ Sliz , E. et al. NAFLD risk alleles in PNPLA3, TM6SF2, GCKR and LYPLAL1 show divergent metabolic effects . Hum. Mol. Genet . 27 , 2214 – 2223 ( 2018 ). OpenUrl CrossRef PubMed 56. ↵ Simons , N. et al. A Common Gene Variant in Glucokinase Regulatory Protein Interacts With Glucose Metabolism on Diabetic Dyslipidemia: the Combined CODAM and Hoorn Studies . Diabetes Care 39 , 1811 – 1817 ( 2016 ). OpenUrl Abstract / FREE Full Text 57. ↵ Sudlow , C. et al. UK biobank: an open access resource for identifying the causes of a wide range of complex diseases of middle and old age . PLoS Med . 12 , e1001779 ( 2015 ). OpenUrl CrossRef PubMed 58. ↵ Bycroft , C. et al. The UK Biobank resource with deep phenotyping and genomic data . Nature 562 , 203 – 209 ( 2018 ). OpenUrl CrossRef PubMed 59. ↵ Millard , L. A. C. , Davies , N. M. , Gaunt , T. R. , Davey Smith , G. & Tilling , K . Software Application Profile: PHESANT: a tool for performing automated phenome scans in UK Biobank . Int. J. Epidemiol . 47 , 29 – 35 ( 2018 ). OpenUrl CrossRef PubMed 60. ↵ Yavorska , O. O. & Burgess , S . MendelianRandomization: an R package for performing Mendelian randomization analyses using summarized data . Int. J. Epidemiol . 46 , 1734 – 1739 ( 2017 ). OpenUrl CrossRef PubMed 61. ↵ Loh , P.-R. , Kichaev , G. , Gazal , S. , Schoech , A. P. & Price , A. L . Mixed-model association for biobank-scale datasets . Nat. Genet . 50 , 906 – 908 ( 2018 ). OpenUrl CrossRef PubMed 62. ↵ 1000 Genomes Project Consortium et al. A global reference for human genetic variation . Nature 526 , 68 – 74 ( 2015 ). OpenUrl CrossRef PubMed 63. ↵ Watanabe , K. , Taskesen , E. , van Bochoven , A. & Posthuma , D . Functional mapping and annotation of genetic associations with FUMA . Nat. Commun . 8 , 1826 ( 2017 ). OpenUrl CrossRef PubMed 64. Watanabe , K. , Umićević Mirkov , M. , de Leeuw , C. A. , van den Heuvel , M. P. & Posthuma , D. Genetic mapping of cell type specificity for complex traits . Nat. Commun . 10 , 3222 ( 2019 ). OpenUrl PubMed 65. GTEx Consortium. Human genomics . The Genotype-Tissue Expression (GTEx) pilot analysis: multitissue gene regulation in humans . Science 348 , 648 – 660 ( 2015 ). OpenUrl Abstract / FREE Full Text 66. GTEx Consortium et al. Genetic effects on gene expression across human tissues . Nature 550 , 204 – 213 ( 2017 ). OpenUrl CrossRef PubMed Web of Science 67. Aguet , F. , et al. The GTEx Consortium atlas of genetic regulatory effects across human tissues . bioRxiv 787903 ( 2019 ) doi: 10.1101/787903 . OpenUrl Abstract / FREE Full Text 68. de Leeuw , C. A. , Mooij , J. M. , Heskes , T. & Posthuma , D . MAGMA: generalized gene-set analysis of GWAS data . PLoS Comput. Biol . 11 , e1004219 ( 2015 ). OpenUrl CrossRef PubMed 69. ↵ Buniello , A. et al. The NHGRI-EBI GWAS Catalog of published genome-wide association studies, targeted arrays and summary statistics 2019 . Nucleic Acids Res . 47 , D1005 – D1012 ( 2019 ). OpenUrl CrossRef PubMed 70. ↵ Bulik-Sullivan , B. K. et al. LD Score regression distinguishes confounding from polygenicity in genome-wide association studies . Nat. Genet . 47 , 291 – 295 ( 2015 ). OpenUrl CrossRef PubMed 71. ↵ Dupuis , J. et al. New genetic loci implicated in fasting glucose homeostasis and their impact on type 2 diabetes risk . Nat. Genet . 42 , 105 – 116 ( 2010 ). OpenUrl CrossRef PubMed Web of Science 72. ↵ Wallace , T. M. , Levy , J. C. & Matthews , D. R . Use and abuse of HOMA modeling . Diabetes Care 27 , 1487 – 1495 ( 2004 ). OpenUrl Abstract / FREE Full Text 73. ↵ Bulik-Sullivan , B. et al. An atlas of genetic correlations across human diseases and traits . Nat. Genet . 47 , 1236 – 1241 ( 2015 ). OpenUrl CrossRef PubMed 74. ↵ Wallace , C . A more accurate method for colocalisation analysis allowing for multiple causal variants . PLoS Genet . 17 , e1009440 ( 2021 ). OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted January 31, 2024. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Assessing the genetic contribution of cumulative behavioral factors associated with longitudinal type 2 diabetes risk highlights adiposity and the brain-metabolic axis Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Assessing the genetic contribution of cumulative behavioral factors associated with longitudinal type 2 diabetes risk highlights adiposity and the brain-metabolic axis Nuno R. G. Carvalho , Yixuan He , Patrick Smadbeck , Jason Flannick , Josep M. Mercader , Miriam Udler , Arjun K Manrai , Jordi Moreno , Chirag J. Patel medRxiv 2024.01.30.24302019; doi: https://doi.org/10.1101/2024.01.30.24302019 Share This Article: Copy Citation Tools Assessing the genetic contribution of cumulative behavioral factors associated with longitudinal type 2 diabetes risk highlights adiposity and the brain-metabolic axis Nuno R. G. Carvalho , Yixuan He , Patrick Smadbeck , Jason Flannick , Josep M. Mercader , Miriam Udler , Arjun K Manrai , Jordi Moreno , Chirag J. Patel medRxiv 2024.01.30.24302019; doi: https://doi.org/10.1101/2024.01.30.24302019 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Endocrinology (including Diabetes Mellitus and Metabolic Disease) Subject Areas All Articles Addiction Medicine (574) Allergy and Immunology (865) Anesthesia (304) Cardiovascular Medicine (4462) Dentistry and Oral Medicine (445) Dermatology (383) Emergency Medicine (611) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1517) Epidemiology (15251) Forensic Medicine (31) Gastroenterology (1132) Genetic and Genomic Medicine (6621) Geriatric Medicine (669) Health Economics (1002) Health Informatics (4564) Health Policy (1372) Health Systems and Quality Improvement (1617) Hematology (544) HIV/AIDS (1272) Infectious Diseases (except HIV/AIDS) (15938) Intensive Care and Critical Care Medicine (1107) Medical Education (624) Medical Ethics (147) Nephrology (670) Neurology (6643) Nursing (346) Nutrition (1001) Obstetrics and Gynecology (1149) Occupational and Environmental Health (957) Oncology (3350) Ophthalmology (981) Orthopedics (369) Otolaryngology (421) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1698) Pharmacology and Therapeutics (694) Primary Care Research (714) Psychiatry and Clinical Psychology (5465) Public and Global Health (9259) Radiology and Imaging (2212) Rehabilitation Medicine and Physical Therapy (1372) Respiratory Medicine (1198) Rheumatology (598) Sexual and Reproductive Health (716) Sports Medicine (533) Surgery (715) Toxicology (100) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a03cf4239b8558d3',t:'MTc4MDEzNTg3NQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2024) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00