Analysis of rare coding variants in 470,000 UK Biobank participants reveals genetic associations with childhood asthma predisposition

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 42,197 characters · extracted from preprint-html · click to expand
Analysis of rare coding variants in 470,000 UK Biobank participants reveals genetic associations with childhood asthma predisposition | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Analysis of rare coding variants in 470,000 UK Biobank participants reveals genetic associations with childhood asthma predisposition Zhenzhen Liu , View ORCID Profile David Curtis doi: https://doi.org/10.1101/2025.02.12.25322158 Zhenzhen Liu 1 UCL Genetics Institute, University College London, Darwin Building , Gower Street, London WC1E 6BT, United Kingdom Find this author on Google Scholar Find this author on PubMed Search for this author on this site David Curtis 1 UCL Genetics Institute, University College London, Darwin Building , Gower Street, London WC1E 6BT, United Kingdom Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for David Curtis For correspondence: d.curtis{at}ucl.ac.uk Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Background Previous studies of genetic contributions to risk of childhood asthma have implicated common variants with small effect sizes. Some studies using exome sequence data have reported associations with rare coding variants having larger effects on risk, notably an analysis of 145,000 subjects which found association with loss of function (LOF) variants in FLG , the gene coding for filaggrin. Here we report the results of an analysis of rare nonsynonymous and LOF variants, carried out on the full UK Biobank cohort of 470,000 exome-sequenced participants. Methods The phenotype of childhood asthma was defined as reporting asthma with onset before 18. Regression analysis was applied to gene-wise tests for association LOF and nonsynonymous variants. 45 tests using different pathogenicity predictors were applied to the first cohort of 200,000 participants. Subsequently the 100 genes showing strongest evidence for association were analysed in the second cohort of 270,000 participants, using only the best-performing predictor for each gene. For FLG , separate analyses were carried out for participants with atopic dermatitis. Results Three genes achieved statistical significance, FLG, IL33 and PRKCQ . The effects on asthma risk and frequencies of variants in different functional categories were characterised for these genes. Damaging coding variants were associated with increased risk of asthma in FLG and IL33 but reduced risk in PRKCQ. FLG LOF variants were also associated with risk of atopic dermatitis and their effect on asthma risk was higher in people who reported a diagnosis of atopic dermatitis. Conclusions Rare coding variants in a small number of genes have important effects on asthma risk. Further study of individual variant effects might elucidate mechanisms of pathogenesis. This research has been conducted using the UK Biobank Resource. Introduction Asthma is a chronic inflammatory disease in which environmental risk factors are important but which has high heritability, with estimates ranging from 35% to 95% ( Ober and Yao, 2011 ; Pijnenburg et al ., 2022 ). Asthma can be broadly divided into two endotypes: the T2-high endotype, which is associated with early-onset, allergic asthma, and the T2-low endotype, which is associated with late-onset, non-allergic asthma ( Sansone et al ., 2020 ). The heritability of early-onset asthma is particularly high, at 68% to 92% ( Ma et al ., 2020 ). Genome-wide association studies (GWASs) have implicated hundreds of common variant associations with asthma traits ( Espuela-Ortiz et al., 2023 ). Genes in implicated regions are involved in inflammatory and secondary immune responses, including B-cell and T-cell receptors, immunoglobulin E levels and eosinophil counts, while other studies report genes associated with obesity, mucus secretion, the PI3K/AKT pathway and calcium ion transport ( Han et al ., 2020 ; Zhu et al ., 2021 ; Espuela-Ortiz et al ., 2023 ). Variants identified through GWAS are associated with small effect sizes and it can be difficult to determine their functional effects whereas rarer variants directly impacting coding regions of genes can have larger and more readily interpretable effects. Two low frequency loss of function (LOF) variants, denoted R501X and 2282del4, in FLG , the gene for filaggrin, increase the risk of ichthyosis vulgaris and atopic dermatitis in populations of European ancestry and increase the risk of asthma in children who have atopic dermatitis ( Marenholz et al ., 2006 ; Smith et al ., 2006 ). A subsequent meta-analysis found that LOF FLG variants were associated with asthma only in children with a prior diagnosis of atopic dermatitis ( Rodriguez et al ., 2009 ). A preprint presenting a study of exome sequence data from 24,576 asthma cases and 120,530 controls from the Scandinavian Asthma Genetic Study and UK Biobank also reports that rare LOF in FLG are collectively associated with increased childhood asthma risk ( Cameron-Christie A. Mackay Q. Wang H. Olsson B. Angermann G. Lassi J. Lindgren M. Hühn Y. Ohne M. Gavala J. Wang G. Povysil S. V. V. Deevi G. Belfield I. Dillmann D. Muthas S. Cohen S. Young A. Platt S. Petrovski, 2020 ). An early sequencing study of candidate genes claimed that rare, non-coding variants in IL12RB1 were associated with asthma but this finding has not been replicated ( Torgerson et al ., 2012 ). A study of rare and low frequency coding variants using array genotypes implicated gene-wise association with functional variants in GSDMB significant after correction for multiple testing ( Igartua et al ., 2015 ). However the authors report that this signal was mostly driven by rs12450091in the Mexican American subset of their data and since this variant has a high frequency in Latinos (minor allele frequency (MAF) 0.19) there is a possibility that this finding may be related to the previously identified common variant association at this locus. Whole-genome sequencing and imputation into the Icelandic population led to the identification of a rare canonical splice site variant, rs146597587-C, in the GWAS-implicated gene IL33 which is associated with lower eosinophil counts and reduced risk of asthma in Europeans ( Smith et al ., 2017 ). Exome sequence data has now been made available for 470,000 UK Biobank participants, allowing a more thorough exploration of the effects of rare coding variants on childhood asthma in the general population. Methods The exome sequence data for UK Biobank participants was released in two phases. Data had been downloaded for 200,632 subjects who had undergone exome-sequencing and genotyping by the UK Biobank Exome Sequencing Consortium using the GRCh38 assembly with coverage 20X at 95.6% of sites on average ( Szustakowski et al ., 2021 ). Subsequently, the UK Biobank Research Analysis Platform (RAP) made available the Final Release Population level exome variants in PLINK format for 469,818 exomes which had been produced at the Regeneron Genetics Center based on DNA extracted from stored blood samples and using the protocols described here: https://dnanexus.gitbook.io/uk-biobank-rap/science-corner/whole-exome-sequencing-oqfe-protocol/protocol-for-processing-ukb-whole-exome-sequencing-data-sets ( Backman et al ., 2021 ). Data from the first cohort of 200,000 participants was used for exploratory first stage analyses and then data from the remaining 270,000 participants was used in confirmatory analyses. UK Biobank had obtained ethics approval from the North West Multi-centre Research Ethics Committee which covers the UK (approval number: 11/NW/0382) and had obtained informed consent from all participants. The UK Biobank approved an application for use of the data (ID 51119) and ethics approval for the analyses was obtained from the UCL Research Ethics Committee (11527/003). The phenotype of childhood asthma was based on participants’ responses to the questionnaire item, “Age asthma diagnosed by doctor.” Participants who reported to be diagnosed at or before the age of 18 were categorised as cases, while the remainder served as controls. There was no effort to exclude control subjects who might have had alternative allergic disease diagnoses. Among 469,765 participants, 34,474 cases were identified. This ratio closely approximates the prevalence of childhood asthma in the British population (∼1 in 11 individuals). Attention was restricted to variants with minor allele frequency (MAF) < 0.01. All exonic variants were annotated using Variant Effect Predictor (VEP) ( McLaren et al ., 2016 ). Nonsynonymous variants were additionally annotated using the AlphaMissense plug-in of VEP, which produces a raw score and a categorisation of likely pathogenic, likely benign or ambiguous, these three categories being converted to numerical scores of 2, 0 or 1 respectively ( Cheng et al ., 2023 ). Additionally, rank prediction scores were obtained for an additional 43 different predictors of pathogenicity as provided for all possible nonsynonymous variants in dbNSFP v4 ( Liu et al ., 2020 ). To obtain population principal components reflecting ancestry, version 2.0 of plink ( https://www.cog-genomics.org/plink/2.0/ ) was run with the options --maf 0.1 --pca 20 approx ( Chang et al ., 2015 ; Galinsky et al ., 2016 ). In order to carry out weighted burden analysis, for each LOF or nonsynonymous variant a score was defined. For LOF variants this score used a parabolic function of allele frequency as previously described, with extremely rare variants (MAF ∼ 0) being assigned a score of 10 and less rare variants (MAF=0.01) being assigned a score of 1 ( Curtis, 2012 , 2022). For nonsynonymous variants, this frequency score was assigned in the same way but was then multiplied by the score for a pathogenicity predictor in order to produce an overall score for that variant. For each gene, each participant would receive a LOF score and a nonsynonymous score, consisting of the sums of the scores for the individual variants of each class carried by that participant. To test for association, multiple logistic regression was performed using sex and 20 principal components as covariates. For the null model, asthma phenotype was predicted solely from these covariates. For the alternative model, asthma phenotype was predicted from these covariates along with the LOF and nonsynonymous scores. The likelihoods of these models were compared and a p value obtained assuming that twice the log likelihood difference followed a chi-squared distribution with two degrees of freedom and the statistical evidence for association was summarised as minus log10(p) (MLP). Because previous work had shown that LOF variants and nonsynonymous variants could make different relative contributions to disease risk and because different predictors of pathogenicity had differential performance across different genes, a two-stage approach to analysis was followed ( Curtis, 2024 ). In the first stage, the first cohort of 200,000 exome-sequenced participants was used to carry out 45 different regression analyses as described above for each protein-coding gene using each of the 45 pathogenicity predictors. This yielded 45 MLPs for each gene, the maximum being denoted MaxMLP. In the second stage, the remaining 270,000 participants were used for analyses of only the 100 genes showing the strongest evidence for association in the first phase and each gene was analysed using only the predictor which had produced the maximum MLP for that gene in the first phase. Thus only 100 tests were performed in the second phase, meaning that a gene could be declared statistically significant if it produced a test statistic significant at p < 0.05/100. For each gene achieving statistical significance, the analysis was repeated using the best predictor in all 470,000 participants. In the case of FLG , this analysis was repeated separately in those with and without a diagnosis of atopic dermatitis, determined from having a relevant ICD9 or ICD10 code or a self-report of “eczema/dermatitis”. Additionally, a full logistic regression analysis was carried out in all participants including the same covariates and using the raw counts for all categories of variants as characterised by VEP, along with counts of variants having a dbNSFP rank score for the best performing predictor of more than a threshold value of 0.35. Results In the first stage analysis, MLPs were obtained for 19,008 protein coding genes using 45 different predictors and these are listed in Supplementary Table 1. The 100 genes with the highest MaxMLPs went forward into the second stage analysis and Supplementary Table 2 shows the MLPs obtained in the second cohort of 270,000 participants using the same predictor as had yielded the maximum MLP in the first 200,000 participants. Of these, three genes reached the threshold for statistical significance, FLG, PRKCQ and IL33 , and these results are shown in Table 1 . As can be seen, all three of these genes produced MLPs exceeding the critical threshold of -log10(0.05/100) = 3.3 in the second stage analysis. In the full sample of 470,000, these three genes all also produced MLPs which would exceed a conservative threshold for multiple-testing of -log10(0.05/(19008*45)) = 7.23. View this table: View inline View popup Download powerpoint Table 1. For each gene achieving statistical significance in the second stage analysis, the table shows the maximum -log10(p) (MLP) produced by any of 45 pathogenicity predictors in the first stage analysis of 200,000 participants along with the predictor producing this MLP, results obtained using the same predictor in the second stage using 270,000 participants and in the total sample of 470,000. All results are obtained from multiple logistic regression analyses of childhood asthma with sex and 20 principal components as covariates and MAF-weighted LOF scores and pathogenicity scores as predictors. View this table: View inline View popup Download powerpoint Table 2. Table showing results of multiple logistic regression analysis of childhood asthma using raw counts of LOF and protein altering variants as well as those variants having a score of > 0.35 for the relevant predictor. Analyses were carried out in the full sample of 470,000 participants. For FLG , results were statistically significant for both the 13,828 participants with a diagnosis of eczema and those without, with MLPs of 19.40 and 9.08, respectively. However the estimate for the effect size of LOF variants was higher in those with eczema (beta = 0.0913, SE = 0.0096) than those without (beta = 0.0249, SE = 0.0039). Table 2 shows the results for these genes of analysing the raw counts, not weighted by frequency, of variants in LOF and protein altering categories assigned by VEP along with variants scoring higher than 0.35 with the relevant predictor. Multiple linear regression analysis to quantify the effect on childhood asthma was carried out using all variant counts along with sex and 20 principal components. Other variant categories were included in the analyses, consisting of 3’ and 5’ UTR, splice region, synonymous and intronic but no category was significant even at a nominal level of 0.05 for any gene so results for these other variant categories are not shown. It can be seen that for FLG LOF variants are observed at hundreds of separate locations and are cumulatively not very rare, with an average rare variant load per participant of around 3%. (This does not include the two previously reported common LOF variants, R501X and 2282del4, which were not considered in this analysis.) On average, they exert a modest effect on risk of childhood asthma with OR 1.38. By contrast, there is no detectable effect on risk from nonsynonymous variants, even those with high scores with AlphaMissense, the best performing predictor for this gene. Detailed inspection of the results from the first cohort of 200,000 participants revealed that in fact the overall MLP obtained varied very little between predictors of nonsynonymous variant pathogenicity, consistent with the notion that the observed association was entirely due to LOF rather than nonsynonymous variants. This situation is reversed for IL33 , where the effect on risk is due to nonsynonymous variants with high scores for the BayesDel addAF predictor while LOF variants have no detectable effect ( Feng, 2017 ). The nonsynonymous variants with the high scores have a protective effective, with OR 0.65. Although LOF variants are not associated with any overall effect on risk, detailed inspection of the results revealed that the essential splice site variant rs146597587-C at chr9:6255967 had MAF 0.0045 in controls and 0.0030 in controls, equivalent to 0R = 0.67, uncorrected for covariates, and consistent with the previous reports of a protective effect for this variant ( Smith et al ., 2017 ). Finally, PRKCQ demonstrates clear signals for both LOF variants and those having high scores with AlphaMissense. While the LOF variants variants are rare, they have a larger estimated effect size than those with high AlphaMissense scores, with OR of 3.24 versus 1.09. Discussion The findings from this study of a rare coding variants in a large exome-sequenced sample enlarges our understanding of the role of FLG and IL33 in susceptibility to childhood asthma, while the findings for PRKCQ are novel. For FLG we observe effects for hundreds of rare LOF variants, similar to those previously noted for common LOF variants and we note that nonsynonymous variants do not influence risk. For IL33 we note that although the previously reported essential splice site variant is protective, other LOF variants appear to have no effect whereas some rare nonsynonymous variants are also protective. For PRKCQ, both LOF and nonsynonymous variants increase risk. The findings obtained for FLG are entirely consistent with what is known about its biological function. The gene expressed in the keratohyalin granules of skin keratinocytes codes for profilaggrin is a 400-kDa, highly phosphorylated, inactive polymer that contains 10-12 filaggrin repeats ( Osawa, Akiyama and Shimizu, 2011 ). Upon being secreted into the intercellular space, it is rapidly dephosphorylated and cleaved into multiple filaggrin monomers and these contribute to the epidermal differentiation process and the barrier function of the stratum corneum of the skin. Notably, the C-terminal domain of profilaggrin, approximately 160 amino acids in length, is essential for the proper cleavage and subsequent release of filaggrin monomers ( Shamilov, Robinson and Aneskievich, 2021 ). This means that any LOF variant within FLG will mean that it will yield no filaggrin molecules. By contrast, a single nonsynonymous variant in FLG can only affect one of the filaggrin copies it codes for. This accords with our observation that LOF variants can produce an effect on risk while nonsynonymous variants do not. Notably, FLG is expressed in the outer layers of the oral and nasal mucosae but not in the epithelial cells of the bronchi and bronchioles, which are the primary tissues affected by asthma ( Ying et al ., 2006 ). As previously noted, LOF variants in FLG increase the risk of ichthyosis vulgaris and atopic dermatitis and increase the risk of asthma only in children who have atopic dermatitis ( Marenholz et al ., 2006 ; Smith et al ., 2006 ; Rodriguez et al ., 2009 ). In our own study, we note that the effect of FLG LOF variants on asthma risk is much larger in participants who report a diagnosis of dermatitis or eczema than those who do not. Although the effect is still highly significant in those who do not report this diagnosis, this does not in fact mean that FLG LOF variants can cause asthma in people who do not have atopic dermatitis because some participants might have actually had this diagnosis without reporting it. It remains plausible that FLG LOF variants exert their effect on asthma risk by interfering with the barrier function of the skin, allowing external allergens to enter and provoke allergic responses which can include both atopic dermatitis and asthma ( Hsu, Akiyama and Shimizu, 2008 ). The rare essential splice site variant in IL33 , rs146597587-C, has been previously reported to be protective against childhood asthma and associated with lower blood eosinophil counts ( Smith et al ., 2017 ). IL33 codes for interleukin-33 and common variants in it are also associated with asthma risk ( Queiroz et al ., 2017 ; Saikumar Jayalatha et al ., 2021 ). Alternative splicing of IL33 has been reported to be associated with cytoplasmic localisation in epithelial cells and with markers of increased type 2 inflammation in asthma ( Gordon et al ., 2016 ). Interestingly, in our dataset we note that while rs146597587-C has a protective effect with raw OR = 0.67, overall LOF variants in IL33 have a null effect, with OR (95% CI) = 0.99 (0.80-1.22), suggesting that the effect of rs146597587-C might not be simply due to haploinsufficiency. We also note a substantial protective effect of nonsynonymous variants with high scores for the BaysDel addAF predictor, with OR (95% CI) = 0.65 (0.51-0.84). An inhibitor of interleukin-33 activity, astegolimab, which binds to its receptor has been found to reduce exacerbations in patients with severe asthma but was not effective against atopic dermatitis ( Kelsen et al ., 2021 ; Maurer et al ., 2022 ). Our results enhance the evidence that interleukin-33 activity does have some role in asthma pathogenesis and that further attempts to perturb this activity may have therapeutic potential. PRKCQ encodes the protein kinase C theta (PKCθ), a member of the protein kinase C (PKC) family, which plays a role in the activation and regulation of T cells. PKCθ is involved in T-cell receptor signalling, particularly in the formation of the immune synapse ( Brezar, Tu and Seddiki, 2015 ). Upon recruitment to the immune synapse, PKCθ activates downstream signalling pathways to drive T-cell activation, differentiation, and immune function ( Lin and Wang, 2004 ). ( Lin and Wang, 2004 ). PKCθ also modulates the balance between effector T cells (Teff) and regulatory T cells (Treg), influencing the inflammatory responses in various immune-related conditions ( Brezar, Tu and Seddiki, 2015 ). Studies in PKCθ-deficient mice have demonstrated a reduction in the numbers and activation of type 2 innate lymphoid cells (ILC2s) and TH2 cells, while pharmacological inhibition of PKCθ led to decreased airway inflammation ( Madouri et al ., 2017 ). Additionally, PKCθ-deficient mice showed impaired T-cell responses and reduced cytokine production ( Anderson et al ., 2006 ). Based on expected therapeutic applications, a range of PKCθ inhibitors have been developed ( Curnock et al ., 2014 ; Papa et al ., 2021 ; Crosignani et al ., 2024 ). However taken at face value our own findings suggest that reduced function of PKCθ might not lead to reduction in inflammatory processes, at least in the context of childhood asthma. This is because our results show an association of increased, not reduced, asthma risk for both LOF variants and those scored highly by AlphaMissense. To conclude, this study of rare coding variants in a large exome-sequenced sample provides some further insights into the biological processes involved in susceptibility to childhood asthma. Specific functional studies of the effects of individual variants might provide further illumination and suggest novel therapeutic approaches. Data availability The raw data is available on application to UK Biobank at https://ams.ukbiobank.ac.uk/ams/ . Derived variables will be returned to UK Biobank, from which they will become available in due course. Software and scripts used to perform the analyses is available at https://github.com/davenomiddlenamecurtis . Disclosure statement The authors declare no conflict of interest. Acknowledgments This research has been conducted using the UK Biobank Resource under Application Number 51119. The authors wish to acknowledge the staff supporting the High Performance Computing Cluster, Computer Science Department, University College London. The authors wish to thank the participants who volunteered for the UK Biobank project. This work uses data provided by patients and collected by NHS England as part of their care and support. This research also used data assets made available by National Safe Haven as part of the Data and Connectivity National Core Study, led by Health Data Research UK in partnership with the Office for National Statistics and funded by UK Research and Innovation (grants MC_PC_20029 and MC_PC_20058). For the work to carry out the analyses reported here, the authors did not receive any specific grant from funding agencies in the public, commercial, or not-for-profit sectors. References ↵ Anderson , K. et al. ( 2006 ) ‘Mice deficient in PKC theta demonstrate impaired in vivo T cell activation and protection from T cell-mediated inflammatory diseases’ , Autoimmunity , 39 ( 6 ), pp. 469 – 478 . Available at : doi: 10.1080/08916930600907954 . OpenUrl CrossRef PubMed ↵ Backman , J.D. et al. ( 2021 ) ‘Exome sequencing and analysis of 454,787 UK Biobank participants’ , Nature , 599 ( 7886 ), pp. 628 – 634 . Available at : doi: 10.1038/S41586-021-04103-Z . OpenUrl CrossRef PubMed ↵ Brezar , V. , Tu , W.J. and Seddiki , N. ( 2015 ) ‘PKC-Theta in Regulatory and Effector T-cell Functions’ , Front Immunol . 20151013th edn, 6 , p. 530 . Available at : doi: 10.3389/fimmu.2015.00530 . OpenUrl CrossRef PubMed ↵ Cameron-Christie A. Mackay Q. Wang H. Olsson B. Angermann G. Lassi J. Lindgren M. Hühn Y. Ohne M. Gavala J. Wang G. Povysil S.V.V. Deevi G. Belfield I. Dillmann D. Muthas S. Cohen S. Young A. Platt S. Petrovski , S. ( 2020 ) ‘A broad exome study of the genetic architecture of asthma reveals novel patient subgroups’ , bioRxiv [Preprint] . Available at : doi: 10.1101/2020.12.10.419663 . OpenUrl Abstract / FREE Full Text ↵ Chang , C.C. et al. ( 2015 ) ‘Second-generation PLINK: rising to the challenge of larger and richer datasets’ , GigaScience , 4 ( 1 ), p. 7 . Available at : doi: 10.1186/s13742-015-0047-8 . OpenUrl CrossRef PubMed ↵ Cheng , J. et al. ( 2023 ) ‘Accurate proteome-wide missense variant effect prediction with AlphaMissense’ , Science , 381 ( 6664 ). Available at : doi: 10.1126/SCIENCE.ADG7492 . OpenUrl CrossRef ↵ Crosignani , S. et al. ( 2024 ) ‘Discovery of a novel series of selective macrocyclic PKCTheta inhibitors’ , Bioorg Med Chem Lett . 20240201st edn, 100 , p. 129630 . Available at : doi: 10.1016/j.bmcl.2024.129630 . OpenUrl CrossRef PubMed ↵ Curnock , A. et al. ( 2014 ) ‘Selective protein kinase Ctheta (PKCtheta) inhibitors for the treatment of autoimmune diseases’ , Biochem Soc Trans , 42 ( 6 ), pp. 1524 – 1528 . Available at : doi: 10.1042/BST20140167 . OpenUrl Abstract / FREE Full Text ↵ Curtis , D. ( 2012 ) ‘A rapid method for combined analysis of common and rare variants at the level of a region, gene, or pathway’ , Adv Appl Bioinform Chem , 5 , pp. 1 – 9 . OpenUrl PubMed Curtis , D. ( 2022 ) ‘Exploration of weighting schemes based on allele frequency and annotation for weighted burden association analysis of complex phenotypes’ , Gene , 809 . Available at : doi: 10.1016/J.GENE.2021.146039 . OpenUrl CrossRef ↵ Curtis , D. ( 2024 ) ‘Assessment of ability of AlphaMissense to identify variants affecting susceptibility to common disease’ , European Journal of Human Genetics 2024 , pp. 1 – 9 . Available at : doi: 10.1038/s41431-024-01675-y . OpenUrl CrossRef ↵ Espuela-Ortiz , A. et al. ( 2023 ) ‘Genomics of Treatable Traits in Asthma’ , Genes (Basel) . 20230920th edn, 14 ( 9 ). Available at : doi: 10.3390/genes14091824 . OpenUrl CrossRef ↵ Feng , B.J. ( 2017 ) ‘PERCH: A Unified Framework for Disease Gene Prioritization’ , Human mutation , 38 ( 3 ), pp. 243 – 251 . Available at : doi: 10.1002/HUMU.23158 . OpenUrl CrossRef PubMed ↵ Galinsky , K.J. et al. ( 2016 ) ‘Fast Principal-Component Analysis Reveals Convergent Evolution of ADH1B in Europe and East Asia’ , American Journal of Human Genetics , 98 ( 3 ), pp. 456 – 472 . Available at : doi: 10.1016/j.ajhg.2015.12.022 . OpenUrl CrossRef PubMed ↵ Gordon , E.D. et al. ( 2016 ) ‘Alternative splicing of interleukin-33 and type 2 inflammation in asthma’ , Proc Natl Acad Sci U S A. 20160718th edn , 113 ( 31 ), pp. 8765 – 8770 . Available at : doi: 10.1073/pnas.1601914113 . OpenUrl Abstract / FREE Full Text ↵ Han , Y. et al. ( 2020 ) ‘Genome-wide analysis highlights contribution of immune system pathways to the genetic architecture of asthma’ , Nat Commun. 20200415th edn , 11 ( 1 ), p. 1776 . Available at : doi: 10.1038/s41467-020-15649-3 . OpenUrl CrossRef PubMed ↵ Hsu , C.K. , Akiyama , M. and Shimizu , H. ( 2008 ) ‘Filaggrin: an emerging star in atopic march’ , J Formos Med Assoc , 107 ( 6 ), pp. 429 – 431 . Available at : doi: 10.1016/s0929-6646(08)60149-7 . OpenUrl CrossRef PubMed ↵ Igartua , C. et al. ( 2015 ) ‘Ethnic-specific associations of rare and low-frequency DNA sequence variants with asthma’ , Nat Commun . 20150116th edn, 6, p. 5965 . Available at : doi: 10.1038/ncomms6965 . OpenUrl CrossRef PubMed ↵ Kelsen , S.G. et al. ( 2021 ) ‘Astegolimab (anti-ST2) efficacy and safety in adults with severe asthma: A randomized clinical trial’ , The Journal of allergy and clinical immunology , 148 ( 3 ), pp. 790 – 798 . Available at : doi: 10.1016/J.JACI.2021.03.044 . OpenUrl CrossRef ↵ Lin , X. and Wang , D. ( 2004 ) ‘The roles of CARMA1, Bcl10, and MALT1 in antigen receptor signaling’ , Semin Immunol , 16 ( 6 ), pp. 429 – 435 . Available at : doi: 10.1016/j.smim.2004.08.022 . OpenUrl CrossRef PubMed Web of Science ↵ Liu , X. et al. ( 2020 ) ‘dbNSFP v4: a comprehensive database of transcript-specific functional predictions and annotations for human nonsynonymous and splice-site SNVs’ , Genome Medicine , 12 ( 1 ). Available at : doi: 10.1186/s13073-020-00803-9 . OpenUrl CrossRef PubMed Ma , X.Q. et al. ( 2020 ) ‘Integrative genomics analysis of various omics data and networks identify risk genes and variants vulnerable to childhood-onset asthma’ , Bmc Medical Genomics , 13 ( 1 ). Available at: https://doi.org/ARTN12310.1186/s12920-020-00768-z . ↵ Madouri , F. et al. ( 2017 ) ‘Protein kinase Ctheta controls type 2 innate lymphoid cell and T(H)2 responses to house dust mite allergen’ , J Allergy Clin Immunol. 20161014th edn , 139 ( 5 ), pp. 1650 – 1666 . Available at : doi: 10.1016/j.jaci.2016.08.044 . OpenUrl CrossRef ↵ Marenholz , I. et al. ( 2006 ) ‘Filaggrin loss-of-function mutations predispose to phenotypes involved in the atopic march’ , The Journal of Allergy and Clinical Immunology , 118 ( 4 ), pp. 866 – 871 . Available at : doi: 10.1016/J.JACI.2006.07.026 . OpenUrl CrossRef PubMed Web of Science ↵ Maurer , M. et al. ( 2022 ) ‘Phase 2 randomized clinical trial of astegolimab in patients with moderate to severe atopic dermatitis’ , The Journal of allergy and clinical immunology , 150 ( 6 ), pp. 1517 – 1524 . Available at : doi: 10.1016/J.JACI.2022.08.015 . OpenUrl CrossRef ↵ McLaren , W. et al. ( 2016 ) ‘The Ensembl Variant Effect Predictor.’ , Genome biology , 17 ( 1 ), p. 122 . Available at : doi: 10.1186/s13059-016-0974-4 . OpenUrl CrossRef PubMed ↵ Ober , C. and Yao , T.C. ( 2011 ) ‘The genetics of asthma and allergic disease: a 21st century perspective’ , Immunol Rev , 242 ( 1 ), pp. 10 – 30 . Available at : doi: 10.1111/j.1600-065X.2011.01029.x . OpenUrl CrossRef PubMed ↵ Osawa , R. , Akiyama , M. and Shimizu , H. ( 2011 ) ‘Filaggrin gene defects and the risk of developing allergic disorders’ , Allergol Int . 20111225th edn, 60 ( 1 ), pp. 1 – 9 . Available at : doi: 10.2332/allergolint.10-RAI-0270 . OpenUrl CrossRef PubMed ↵ Papa , P. et al. ( 2021 ) ‘Discovery of the Selective Protein Kinase C-theta Kinase Inhibitor, CC-90005’ , J Med Chem. 20210806th edn , 64 ( 16 ), pp. 11886 – 11903 . Available at : doi: 10.1021/acs.jmedchem.1c00388 . OpenUrl CrossRef ↵ Pijnenburg , M.W. et al. ( 2022 ) ‘Childhood asthma: pathogenesis and phenotypes’ , Eur Respir J . 20220609th edn, 59 ( 6 ). Available at : doi: 10.1183/13993003.00731-2021 . OpenUrl Abstract / FREE Full Text ↵ Queiroz , G.A. et al. ( 2017 ) ‘IL33 and IL1RL1 variants are associated with asthma and atopy in a Brazilian population’ , Int J Immunogenet , 44 ( 2 ), pp. 51 – 61 . Available at : doi: 10.1111/iji.12306 . OpenUrl CrossRef PubMed ↵ Rodriguez , E. et al. ( 2009 ) ‘Meta-analysis of filaggrin polymorphisms in eczema and asthma: robust risk factors in atopic disease’ , J Allergy Clin Immunol , 123 ( 6 ), pp. 1361 – 70 e7 . Available at : doi: 10.1016/j.jaci.2009.03.036 . OpenUrl CrossRef PubMed Web of Science ↵ Saikumar Jayalatha , A.K. et al. ( 2021 ) ‘The central role of IL-33/IL-1RL1 pathway in asthma: From pathogenesis to intervention’ , Pharmacol Ther . 20210402nd edn, 225 , p. 107847 . Available at : doi: 10.1016/j.pharmthera.2021.107847 . OpenUrl CrossRef PubMed ↵ Sansone , F. et al. ( 2020 ) ‘Asthma and Obesity in Children’ , Biomedicines . 20200721st edn, 8 ( 7 ). Available at : doi: 10.3390/biomedicines8070231 . OpenUrl CrossRef ↵ Shamilov , R. , Robinson , V.L. and Aneskievich , B.J. ( 2021 ) ‘Seeing Keratinocyte Proteins through the Looking Glass of Intrinsic Disorder’ , International Journal of Molecular Sciences , 22 ( 15 ). Available at: https://doi.org/ARTN791210.3390/ijms22157912 . ↵ Smith , D. et al. ( 2017 ) ‘A rare IL33 loss-of-function mutation reduces blood eosinophil counts and protects from asthma’ , PLoS Genet . 20170308th edn, 13 ( 3 ), p. e1006659 . Available at : doi: 10.1371/journal.pgen.1006659 . OpenUrl CrossRef PubMed ↵ Smith , F.J. et al. ( 2006 ) ‘Loss-of-function mutations in the gene encoding filaggrin cause ichthyosis vulgaris’ , Nat Genet. 20060129th edn , 38 ( 3 ), pp. 337 – 342 . Available at : doi: 10.1038/ng1743 . OpenUrl CrossRef PubMed Web of Science ↵ Szustakowski , J.D. et al. ( 2021 ) ‘Advancing human genetics research and drug discovery through exome sequencing of the UK Biobank’ , Nature Genetics , 53 ( 7 ), pp. 942 – 948 . Available at : doi: 10.1038/s41588-021-00885-0 . OpenUrl CrossRef PubMed ↵ Torgerson , D.G. et al. ( 2012 ) ‘Resequencing Candidate Genes Implicates Rare Variants in Asthma Susceptibility’ , American Journal of Human Genetics , 90 ( 2 ), pp. 273 – 281 . Available at : doi: 10.1016/j.ajhg.2012.01.008 . OpenUrl CrossRef PubMed ↵ Ying , S. et al. ( 2006 ) ‘Lack of filaggrin expression in the human bronchial mucosa’ , J Allergy Clin Immunol. 20061013th edn , 118 ( 6 ), pp. 1386 – 1388 . Available at : doi: 10.1016/j.jaci.2006.08.030 . OpenUrl CrossRef PubMed ↵ Zhu , Z. et al. ( 2021 ) ‘Investigating asthma heterogeneity through shared and distinct genetics: Insights from genome-wide cross-trait analysis’ , J Allergy Clin Immunol . 20200718th edn, 147 ( 3 ), pp. 796 – 807 . Available at : doi: 10.1016/j.jaci.2020.07.004 . OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted February 13, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Analysis of rare coding variants in 470,000 UK Biobank participants reveals genetic associations with childhood asthma predisposition Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Analysis of rare coding variants in 470,000 UK Biobank participants reveals genetic associations with childhood asthma predisposition Zhenzhen Liu , David Curtis medRxiv 2025.02.12.25322158; doi: https://doi.org/10.1101/2025.02.12.25322158 Share This Article: Copy Citation Tools Analysis of rare coding variants in 470,000 UK Biobank participants reveals genetic associations with childhood asthma predisposition Zhenzhen Liu , David Curtis medRxiv 2025.02.12.25322158; doi: https://doi.org/10.1101/2025.02.12.25322158 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Genetic and Genomic Medicine Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (297) Cardiovascular Medicine (4421) Dentistry and Oral Medicine (443) Dermatology (382) Emergency Medicine (606) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15212) Forensic Medicine (30) Gastroenterology (1121) Genetic and Genomic Medicine (6581) Geriatric Medicine (667) Health Economics (996) Health Informatics (4520) Health Policy (1366) Health Systems and Quality Improvement (1611) Hematology (539) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15906) Intensive Care and Critical Care Medicine (1103) Medical Education (620) Medical Ethics (144) Nephrology (667) Neurology (6580) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1141) Occupational and Environmental Health (956) Oncology (3324) Ophthalmology (970) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1689) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5433) Public and Global Health (9212) Radiology and Imaging (2193) Rehabilitation Medicine and Physical Therapy (1368) Respiratory Medicine (1194) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (288) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9ff4f346dc51aa64',t:'MTc3OTM4MDg2NQ=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00