TRiXi: A Multi-Target Tandem Repeat-Based Method for Accurate Detection of X-Inactivation Skewing in Humans

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 72,413 characters · extracted from preprint-html · click to expand
TRiXi: A Multi-Target Tandem Repeat-Based Method for Accurate Detection of X-Inactivation Skewing in Humans | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search TRiXi: A Multi-Target Tandem Repeat-Based Method for Accurate Detection of X-Inactivation Skewing in Humans Dóra Goldmann , View ORCID Profile Björn Gylemo , View ORCID Profile Maike Bensberg , Ingela Johansson , Svenja Löffert , Júlia Goldmann , View ORCID Profile Lisa Haglund , Magdalena Vitkova , View ORCID Profile Janos Kondri , View ORCID Profile Sandra Hellberg , Engla Haglund , View ORCID Profile Shadi Jafari , View ORCID Profile Johnny Ludvigsson , View ORCID Profile Colm E. Nestor doi: https://doi.org/10.1101/2025.11.24.25340860 Dóra Goldmann 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site Björn Gylemo 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Björn Gylemo Maike Bensberg 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Maike Bensberg Ingela Johansson 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site Svenja Löffert 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site Júlia Goldmann 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site Lisa Haglund 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Lisa Haglund Magdalena Vitkova 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site Janos Kondri 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Janos Kondri Sandra Hellberg 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Sandra Hellberg Engla Haglund 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site Shadi Jafari 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Shadi Jafari Johnny Ludvigsson 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Johnny Ludvigsson Colm E. Nestor 1 Crown Princess Victoria Childreńs Hospital, Department of Biomedical and Clinical Sciences (BKV), Linköping University , Linköping, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Colm E. Nestor For correspondence: colm.nestor{at}liu.se Abstract Full Text Info/History Metrics Supplementary material Preview PDF ABSTRACT Preferential usage of either X-chromosome, skewed X-inactivation (sXCI), can profoundly alter the penetrance and expressivity of X-linked traits in females, often with life-threatening consequences. Despite its clinical relevance, the true frequency, origins, and stability of sXCI in human tissues remain poorly understood, in part due to a lack of effective and sensitive methods for assessing XCI status. Here, we present TRiXi ( T andem R epeat-based Identification of X -Inactivation), a simple and highly sensitive technique capable of detecting sXCI from as little as 10 ng of archived human DNA. Applying TRiXi to over 1,000 neonatal cord blood samples from healthy infants, we demonstrate that extreme sXCI is a common constitutional feature in humans. Use of longitudinal samples from the same donors revealed that sXCI patterns in skewed neonates were stably maintained into adolescence, whereas in non-skewed females, patterns fluctuated considerably over time. Using low-pass short-read sequencing, whole-genome long-read sequencing, and targeted exon sequencing, we exclude most known genetic drivers of sXCI in extremely skewed infants, supporting stochastic processes as the primary origin of skewed XCI. Further, by inferring X-inactivation patterns in 4,571 adult tissues from 264 females in the GTEx cohort, we demonstrate that skewed XCI is not restricted to blood, revealing widespread multi-organ sXCI in females. Our study represents the most comprehensive analysis of constitutional sXCI to date and reveals sXCI as a widespread and stable epigenetic trait. This can profoundly modify the penetrance of X-linked conditions with immediate implications for genetic diagnostics and our understanding of human disease variability. TRiXi provides a convenient and accessible approach to inform diagnosis of X-linked traits by assaying sXCI. Studying individuals with sXCI may yield critical insights into (1) the initiation of XCI and its underlying genomic elements, (2) previously unrecognized lethal X-linked traits and (3) improved polygenic risk prediction through incorporation of X-chromosome variation. INTRODUCTION Typically, human females possess two X-chromosomes (46, XX) whereas males have one X-chromosome and one Y-chromosome (46, XY). To prevent lethality due to a double dose of X-linked genes in females, one X-chromosome is inactivated in all female cells during the peri-implantation stage of human development 1 . X-chromosome inactivation (XCI) is initiated by expression of the long non-coding RNA, XIST , from one X-chromosome. XIST progressively coats the chromosome from which it is expressed, which in turn becomes marked with DNA methylation and repressive histone marks, ultimately resulting in compaction and transcriptional silencing 2 – 4 . The choice of parental X-chromosome to undergo XCI in each cell is random; different cells in the same female will have inactivated the paternal X-chromosome (Xp) or maternal X-chromosome (Xm). Although the initial choice of X-chromosome for inactivation is random in humans, the inactivated X-chromosome is stably inherited in a clonal fashion throughout all subsequent cell divisions 5 . Consequently, women are ‘mosaic’ for XCI, typically exhibiting a ratio of ∼1:1 between cells having inactivated Xp or Xm 6 . The mosaic nature of XCI generally reduces the penetrance and expressivity of traits encoded on the X-chromosome in females, as roughly half of their cells express the wild-type allele, which compensates for the effects of the mutant allele in the remaining cells. In contrast, many X-linked diseases, such as Rett syndrome and Fragile X syndrome, are considerably more severe and often embryonic lethal in males due to mono-allelic expression of the mutated X-linked gene 7 . However, females can manifest similarly severe and life-threatening symptoms of X-linked disorders due to skewed X-inactivation (sXCI), a state in which most, or all, cells within or across tissues have inactivated the same parental X-chromosome. While much of the sXCI observed in adult females results from secondary selection in the form of clonal hematopoiesis, which tends to increase with age, we and others have reported that extreme skewing of XCI may also be a common and potentially constitutional genetic characteristic in humans 6 , 8 – 12 . Clinically, constitutional sXCI would have a more profound and earlier effect on the penetrance and expressivity of X-linked traits in females. The determination of sXCI in bulk tissues such as blood is complex, requiring both an informative (heterozygous) genetic variant and an additional layer of information such as DNA methylation or gene expression. The most commonly used method for detection of skewing, the HUMARA assay, lacks sensitivity, failing to provide a result in 20-30% of samples tested 13 . The lack of an effective and sensitive approach to assay sXCI has limited our ability to characterize the prevalence and origin of XCI skewing in humans, a phenomenon predominantly studied in adult females, where constitutional skewing is often obscured by clonal cell expansion. We introduce T andem R epeat-based Identification of X -chromosome Inactivation (TRiXi), an improved method for high-sensitivity detection of skewed XCI. Applying TRiXi to archived DNA from over 1,000 cord blood samples revealed that constitutional sXCI is surprisingly frequent in humans (>5%). Using a range of whole genome and targeted approaches we further investigate the genetic origin and stability of sXCI during childhood. Finally, through multi-omic analysis of ∼4,500 tissues from the GTEx project, we characterize sXCI patterns across healthy human adult tissues and reveal skewing as a powerful and far more frequent modifier of X-linked traits than previously appreciated. RESULTS TRiXi - an efficient method for high-sensitivity detection of skewed X-inactivation Measuring the degree of sXCI in females requires the use of techniques that combine an informative genetic variant with an additional layer of molecular information such as DNA methylation or gene expression. Whereas a plethora of methods for sXCI detection have been proposed over the last decade 14 – 20 , the HUMARA assay, developed by Allen et al in 1992 21 , remains the gold-standard method in the field. The HUMARA assay involves methyl-sensitive restriction digest (only the unmethylated active X is cut) of the highly polymorphic short tandem repeat (STR) in the androgen receptor gene ( AR ; formerly HUMARA) followed by PCR amplification and electrophoresis to reveal XCI skewing; only the methylated, uncut inactive X allele will be amplified after digestion and the ratio between each allele represents XCI skewing in a given sample ( Supplementary Fig. 1a ). However, the HUMARA assay is uninformative in the 20-30% of females that are homozygous at the AR repeat. Moreover, the accuracy of the HUMARA assay is further affected by locus-specific alterations in DNA methylation, the presence of genetic variants in the target sequence, and preferential PCR amplification of the shorter allele 22 . To overcome the limitations of the HUMARA assay, we developed TRiXi to enhance the detection of sXCI. Using a similar concept to the HUMARA assay we aimed to identify multiple polymorphic tandem repeats across both arms of the X-chromosome and combined these into a single multiplex PCR reaction, thereby increasing assay sensitivity while requiring no additional experimental steps, expense or equipment. Using whole genome sequencing (whole blood) from 50 randomly selected females from the GTEx project and whole genome methylation data (isolated T-cells) from four females in the BLUEPRINT project we identified all X-linked repeat sequences that (i) are highly polymorphic tri- and tetra-nucleotide repeats, (ii) are flanked by at least one Hpa II site, and (iii) are characterized by 50% methylation, indicating that the locus is subject to XCI ( Fig. 1a, b , Supplementary Table 1 ). The AR locus was intentionally omitted from the TRiXi assay, as hyper-expanded AR repeats are common in the general population. Such long expansions are typically undetectable in the HUMARA assay, as they fall outside the expected size range and PCR amplification tends to favor the shorter, non-expanded (healthy) allele. The normal repeat length range of the AR locus is unusually broad (7–27 CAG repeats), often resulting in substantial allele length differences within individuals ( Fig. 1b ), increasing the probability of PCR bias due to size-dependent amplification efficiency 13 . In total, we identified six tri-and nine tetra-nucleotide repeats that satisfied all selection criteria ( Supplementary Table 1 ). Through exhaustive iterative testing we succeeded in multiplexing five informative loci, allowing robust detection of all ten alleles in a single assay ( Fig. 1c, d , Supplementary Table 2 ). We next performed both the HUMARA assay and TRiXi on 50 umbilical cord samples from the All-Babies in Southeast Sweden (ABIS) birth cohort 23 , 24 . Results from TRiXi and HUMARA were highly correlated ( Fig. 1e , Supplementary Table 3 ), but as expected, HUMARA failed to determine sXCI in 12 samples (12/50, 24%) due to homozygosity at the AR locus while TRiXi was informative in all samples ( Fig. 1f ). To further validate TRiXi we performed whole genome Oxford Nanopore Technologies (ONT) long-read sequencing on one highly skewed sample (97% sXCI; blue dot in Fig. 1e, f ). Following phasing of reads based on repeat length, ONT long-read sequencing confirmed the extreme skewing observed in this sample ( Fig. 1g ). Further, using a recently published method for calculating skewing from X-chromosome ONT data 17 , resulted in a global X-chromosome skewing of 88.1%, again highly concordant with that obtained with TRiXi (97%). Download figure Open in new tab Figure 1. Development of T andem R epeat-based Identification of X -chromosome Inactivation (TRiXi) for high-sensitivity detection of skewed X-inactivation. a, forward (blue) and reverse (green) primer binding sites, repeat location (hg38), repeat sequence, PCR product GC content (%) and methylation of CpG sites in TRiXi 1-5 PCR target regions. Hpa II (CCGG) sites are highlighted in red. b , allele length distribution of all five TRiXi repeats estimated from 50 randomly selected female WGS samples from the GTEx dataset. The highly polymorphic AR (X-Linked) and HTT (autosomal) tandem repeats are shown for comparison. c , schematic illustration of the TRiXi method involving methylation-sensitive digest of the alleles on the active X-chromosome followed by multiplex PCR of all 10 alleles (five polymorphic loci) followed by fragment size determination by capillary electrophoresis. d , Representative results of a single TRiXi assay. Top and bottom panels show undigested and digested runs of a highly skewed female sample from the ABIS cohort (sample ABIS 1). e , Scatterplot of XCI skew of 50 neonatal samples determined by HUMARA and TRiXi. Spearman’s rank correlation test; ρ = 0.75, p = 7.1×10 −8 . f , Boxplot of XCI skew of 50 neonatal samples determined by HUMARA and TRiXi. Samples which were uninformative in HUMARA assay are indicated in grey. Two-tailed Wilcoxon rank-sum test; p = 0.68. e , f , light-blue dots highlight sample ABIS 1. g , Clustering of ONT reads by repeat length at all five repeat loci in the ABIS 1 sample. Color gradient indicates CpG DNA methylation level. Red arrows indicate CCGG sites. Over 5% of newborns exhibit extreme XCI skewing We next set out to determine the frequency of constitutional skewing in humans by performing TRiXi on 500 archived umbilical cord blood samples from healthy infants in the ABIS birth cohort 23 , 24 . We determined the true heterozygosity and allele frequencies for all five polymorphic loci, resulting in a TRiXi sensitivity of 99.82%—equivalent to only 1 in 500 females being homozygous at all five repeats ( Supplementary Fig. 1b ). Skewing estimates were highly concordant across all loci within each sample, supporting the use of DNA methylation patterns across both arms of the X-chromosome as reliable proxies for XCI status ( Supplementary Fig. 1c, Supplementary Table 4 ). Whereas including five or more polymorphic repeats in the assay provides the highest sensitivity, fewer repeats can be used. Indeed, estimating sXCI in an additional 683 umbilical cord blood samples incorporating only the two most polymorphic repeats TRiXi 1 and TRiXi 2 offered a detection rate of 97% (21/683 samples homozygous for both repeats), a vast improvement over the HUMARA assay ( Supplementary Table 5 ). Altogether, analyzing skewed X-inactivation in 1,027 neonates revealed that 10.42% of females were highly skewed (mean +1 SD, >71.09% skewing) for XCI at birth and 5.16% exhibited extreme skewing (mean +2 SD, >79.76% skewing) ( Fig. 2a ). To investigate whether repeat length affects the accuracy of XCI skewing measurement by TRiXi, we compared the distributions of the repeat lengths between mosaic, skewed and extremely skewed females, which showed very similar distributions ( Supplementary Fig. 1d ). Furthermore, similar skewing values were obtained for each individual repeat, indicating that, in the case of homozygosity of one or more repeats, TRiXi reliably reveals XCI skew ( Supplementary Fig. 1e ). Download figure Open in new tab Figure 2. The distribution of skewed X-inactivation in 1,000 newborns revealed by TRiXi. a, XCI status of 1,027 neonatal blood samples determined by TRiXi. b, XCI skew of longitudinal samples collected between 0-1 years of age and between 14-16 years of age. c , Frequency of mosaic, highly or extremely skewed XCI at 0-1 and 14-16 years of age. d , classification and change (%) in skewing between timepoints for samples that were highly or extremely skewed at 14-16 years of age. e , XIST promoter region and first exon of 7 skewed samples (ABIS 1-7) and 3 controls (ABIS 8-10) investigated with sanger sequencing. Sequences spanning a previously reported variant (C-43G) associated with constitutional skewing highlighted in red. f, copy number analysis using low-pass whole genome sequencing data for the same skewed females. g, targeted exon sequencing of clonal hematopoiesis-associated genes revealed no mutations in any of the genes included in the oncoReveal™ Myeloid Panel. To determine whether the observed skewing represented a stable, intrinsic property of the hematopoietic lineage or a transient phenomenon, we analyzed follow-up samples from 50 individuals at 14–16 years of age ( Fig. 2b , Supplementary Table 6 ). The majority of females were classified as mosaic at both timepoints as 39 out of 50 (78%) females were mosaic at both at 0-1 and 14-16 years of age. Interestingly, the degree of XCI skew changed considerably (≤5%) in 16 out of 50 (32%) females, leading to an almost doubling of extremely and highly skewed females ( Fig. 2c ). Further, females that were classified as extremely skewed or skewed at age 0-1 exhibited relatively small changes in XCI skew, maintaining their skewed status into adolescence ( Fig. 2d ). These results suggest that in up to 30% of females, considerable selection of X-allele usage is occurring from birth. No clear genetic basis for skewed X-inactivation in neonates The observation of pronounced skewing at birth, that is subsequently maintained throughout childhood suggests a primary or constitutional etiology. Organism-wide, extreme skewing may result from constitutional genetic variants that directly bias the inactivation process toward a specific parental X-chromosome. Examples include mutations in the XIST gene promoter or balanced X:autosome translocations. Similarly, disruptions of the X-inactivation center (XIC) or autosomal elements involved in X-chromosome choice have been implicated in promoting or directly mediating primary skewing of X-inactivation 25 – 27 . Using seven of the most skewed samples (ABIS 1-7) and three mosaic females (ABIS 8-10), we conducted a thorough investigation of the genetic origin of skewed XCI. We first performed tiled sanger sequencing across the XIST promoter but failed to identify previously reported or novel variants that could affect XIST expression ( Fig. 2e ). Similarly, low-pass short-read sequencing failed to identify copy number variations or aneuploidies recently reported in completely skewed females 6 ( Fig. 2f ). The levels of skewing were highly variable during childhood ( Fig. 2b, c, d ), which could indicate an ongoing process of clonal selection that drive XCI skewing. Whereas clonal hematopoiesis (CH) is primarily studied in older individuals, mutations in key CH genes such as TP53 , JAK2 , TET2 and DNMT3A are often observed in childhood malignancies and familial disorders 26 , 28 – 30 . We thus investigated whether the observed extreme skewing could have resulted from intense CH due to a constitutional mutation in CH genes. Again, exon sequencing of the 58 most well-characterized CH genes failed to identify any previously identified CH-associated mutations in these genes ( Fig. 2g , Supplementary Table 7 ). Finally, deep (40X) ONT long-read sequencing of the most skewed sample ( Fig. 1g ), failed to identify any clearly pathogenic X-linked or autosomal mutations that could explain the observed skewing, including an absence of balanced X:autosome translocations. Together, our genetic analysis of skewed females did not identify a definitive underlying cause, suggesting that the observed extreme skewing arose from purely stochastic processes or as of yet unknown genetic modifiers of XCI. Evidence of multi-organ constitutional sXCI in adult females A recent cross-tissue analysis of XCI skewing suggested that XCI initiation occurs before germ-layer specification 31 . Whereas stochastic selection of a limited number of progenitor cells for lineage specification can lead to sXCI within a given tissue, it is highly unlikely that such a process would independently give rise to similar skewing across multiple, distinct tissue types within the same individual. To investigate sXCI across tissues in the same individual, we used the GTEx dataset, which contains RNA-sequencing data for 4,571 individual tissues across 264 female donors. sXCI levels for each tissue were determined by measuring the allele-specific expression of reads arising from genes that undergo XCI, as recently described by us 6 . Whereas the average skewing across tissues per individual was highly similar to that observed at birth; with 12.89% of females highly skewed (median +1 SD, >71.4% skewing) for XCI and 6.25% exhibiting extreme skewing (median +2 SD, >79% skewing) ( Fig. 3a, b ), whole blood exhibited significantly higher levels of sXCI in older adults ( Fig. 3c ), consistent with the selective effects of clonal hematopoiesis. Notably, across all adults tested, constitutional skewing was the likely origin of 23.4% of extremely skewed females and in individuals under 50 years of age, constitutional skewing was still the dominant cause of extreme sXCI ( Fig. 3c ). Unexpectedly, sXCI was also highly prevalent across non-hematopoietic tissues, with 70% of females (181/256) having at least one extremely skewed tissue ( Fig. 3d ). In total, 13.6% (622/4571, ∼1 in 7) of tissues examined exhibited extreme sXCI with adrenal gland, whole blood, liver and pancreas among the most frequently skewed ( Fig. 3e ). Together, these results indicate that multi-tissue constitutive skewing is a common phenomenon in the normal human population. Download figure Open in new tab Figure 3. Allelic-resolution analysis reveals widespread, multi-organ skewing in adults. a,b , XCI status determined by TRiXi in 1,027 neonatal blood samples (a) and by median non-PAR X-linked allelic expression across 4,571 tissues in 264 female donors from the GTEx dataset (b). c , Density plot of skewing in whole blood as determined by TRiXi in newborns and allelic expression in adults from GTEx. d , bar plot showing adults grouped by the number of skewed tissues per individual. e , bar plot of fraction of extremely skewed (skewing >79%) samples per tissue (top) and ridge plot showing the distribution of skewing in all 45 tissues examined (bottom). DISCUSSION We present TRiXi, a novel method for measurement of sXCI that offers considerable improvements over other techniques to detect sXCI, such as the HUMARA assay or next-generation sequencing approaches. TRiXi is highly sensitive (>99% sensitivity), accessible, affordable, and readily scalable for high-throughput use. Because the assay requires minimal DNA input and is compatible with short or degraded fragments, it is well-suited for screening samples with limited or compromised DNA, such as those commonly stored in biobanks. The AR locus was intentionally excluded from the TRiXi assay to avoid PCR bias associated with its broad normal repeat range. This also prevents unintended detection of premutation alleles linked to Kennedy’s disease, which are relatively common in the general population and often missed by the HUMARA assay due to preferential amplification of shorter alleles. Levels of sXCI assessed by TRiXi and HUMARA in the same samples were highly correlated, reinforcing the validity of historical HUMARA-based measurements and addressing persistent concerns about their accuracy 20 , 22 , 32 , 33 . This comparison also underscored the key limitation of the HUMARA assay, with 24% (12/50) of samples being uninformative, representing a substantial waste of resources, including precious and limited patient-derived material. We applied TRiXi to over 1,000 archived umbilical cord blood samples from the ABIS birth cohort; making it the largest study of neonatal XCI status to date. Our findings demonstrate that high (>70%) and extreme (>80%) levels of XCI skewing are common at birth, occurring more frequently than previously recognized (15.55%), validating and expanding upon the results of earlier, smaller studies using the HUMARA assay 34 . Applying TRiXi to peripheral blood samples collected from the same ABIS donors at 14-16 years of age ( N = 50) revealed sXCI to be highly variable throughout childhood with the exception of those females skewed at birth, which were more likely to remain skewed or proceed to extreme skewing, suggesting an ongoing selective process. Thus, even by 14 years of age, ∼10% of healthy females are already highly clonal in their peripheral blood and an additional 14% proceeding clearly proceeding towards clonality. The origin of sXCI in any given individual is often unknown and can have a complex etiology. Skewed XCI can result either from variants that directly influence the XCI process on one of the two X-chromosomes such as mutations in the XIST promoter 25 , balanced X:autosome translocations (primary selection) or indirectly from variants that confer a growth advantage to specific cells or clones, such as those associated with clonal hematopoiesis (secondary selection) 25 – 27 . However, low-pass whole genome sequencing, targeted sequencing of established clonal hematopoiesis genes, Sanger sequencing of the XIST promoter, and ONT long-read sequencing did not identify any known genetic features previously linked to sXCI. Given that the drivers and molecular mechanisms establishing XCI remain incompletely defined, our investigation may not have captured genetic alterations in genes not yet known to be essential for XCI. Further, sXCI can originate stochastically, where, by chance, the small number of progenitor cells establishing a given tissue all independently inactivate the same parental X chromosome 12 , 31 . The absence of identifiable genetic drivers of sXCI at birth may suggest a stochastic origin; however, this interpretation remains tentative without data on XCI patterns across other tissues from the same individual. We assessed multi-organ skewing in humans leveraging the extensive genomic and transcriptomic data available for 264 post-mortem female donors in the GTEx database. Utilizing heterozygous genetic variants in X-linked genes, XCI status could be determined by measuring allele-specific expression levels in each tissue. As expected, we observed increased levels of sXCI in blood, consistent with progressive effects of clonal hematopoiesis over time. Whereas blood was the most frequently skewed tissue in adults, it surprisingly represented only 17% of all skewed tissues, with seven out of ten adult females skewed in at least one tissue. Skewed X-inactivation is an intriguing and poorly understood genetic phenomenon in humans. However, it is also a genetic trait with a profound effect on the lives of thousands of carriers of X-linked disease, often resulting in the unpredictable manifestation of life-threatening symptoms of typically male X-linked disorders in females 35 – 38 . These X-linked diseases show variable symptoms correlated to the degree of XCI skewing with higher expression of the diseased allele resulting in more severe phenotypes 39 , 40 . While most causative X-linked mutations can be detected by genetic testing, their heterozygous nature and possible inactivation during XCI does not currently allow for prediction of disease prognosis. A reliable estimation of sXCI in combination with genetic screening would provide more accurate clinical diagnoses to allow for individual approaches for treatment and interventions. TRiXi will allow for rapid, cost effective, and sensitive assessment of XCI status in carriers of X-linked diseases. Furthermore, TRiXi will facilitate the inclusion of sXCI measures in large-scale studies of genetic association in humans. Our results identify sXCI as a common and often multi-organ feature of humans, with potentially profound implications for our understanding of both the process of XCI, but also the potential impact of X-linked traits in females. Our findings also highlight the importance of studying multiple tissues when trying to understand X-linked process in humans. We further showed that extremely skewed XCI is likely to have a genetic origin, which remains to be identified. It should be considered that such a molecular basis for extreme sXCI is likely to be heritable even though previous studies did not find a heritable component to moderate levels of sXCI 12 , 15 . METHODS Study population Umbilical cord blood samples (n=1,027) were obtained from All Babies in Southeast Sweden (ABIS) cohort. ABIS is a prospective birth cohort study inviting all 21,700 children born between October 1997 and October 1999 in the southeast region of Sweden to participate 23 , 24 . For longitudinal analysis of sXCI, paired whole blood samples collected at 1 year (when cord blood was not available; n= 30 1-year samples/n= 20 cord blood samples) and at 15 years of age were used. This study was approved by the Swedish Ethical Review Authority (#2022-06443-02). Automated DNA isolation Genomic DNA from frozen umbilical cord blood samples was extracted using the QIAcube system with the QIAamp DNA Blood Mini QIAcube Kit (Qiagen, 51126) according to the manufacturer’s instructions. In short, blood samples were thawed at room temperature followed by incubation of 200 µl blood with 20 µl proteinase K and 200 µl lysis buffer for 10 minutes at 56°C. Lysed samples were mixed with 200 µl 99.9% ethanol and transferred to QIAamp spin columns. After two washing steps, DNA was eluted in 200 µl elution buffer. Manual DNA isolation DNA from umbilical cord blood samples that were dried due to long-term storage and from capillary blood at 1 year of age were extracted manually using the QIAamp DNA Blood Mini Kit (Qiagen, 51106). Samples were thawed at room temperature, and a clump of dried blood (approximately 2 mm²) was transferred to a fresh microcentrifuge tube using pipette tips or scalpels, as needed. Each sample was then treated with 20 µL of proteinase K and 200 µL of lysis buffer (Qiagen, 939011), followed by thorough vortexing. The tubes were incubated at 56°C and shaken at 800 rpm for up to 6 hours. Buffer volume and incubation time were adjusted as necessary to ensure complete lysis. Once the blood was fully dissolved and lysed, DNA was purified using spin columns according to the manufacturer’s instructions, with elution performed in 100 µL of elution buffer. DNA quantification and quality assessment DNA was quantified using a NanoDrop™ 2000/2000c Spectrophotometer (Thermo Scientific, ND-2000). For dried blood samples of questionable quality, DNA integrity was evaluated on agarose and only non-or lowly degraded DNA was included in this study. Identification of informative X-linked tandem repeats To identify X-linked repeats that were (i) polymorphic, (ii) within 300 bp of a Hpa II digestion site (CCGG), and (iii) 50% methylated, the human genome reference (hg38) X-chromosome was screened for tri-and tetra-nucleotide repeats (containing one or two C or G combined) with at least six repeats in succession. To assess repeat length variability, we used whole genome sequencing (WGS data from the GTEx database from 50 females. Briefly, WGS CRAM files were downloaded from AnVIL using the Gen3 client. The files were sorted and converted into fastq files using Samtools 41 (v1.9). Reads containing previously identified repeats of interest were extracted through detection of the ten bases upstream of each given repeat and repeat length was calculated for each individual read to identify polymorphic repeats. Repeats with a similar length distribution to the AR repeat were determined as having sufficient heterozygosity. To identify 50% methylated tandem repeat sites 300bp from either end of the repeat, pre-processed whole-genome bisulfite sequencing (WGBS) methylation score and coverage bigwig files from four females were downloaded from BLUEPRINT 42 (CD4+ alpha-beta T cells; S009W451, P586, S007DD51, P582). Bigwigs were converted to Wig and then to bed file format with bigWigToWig 43 and wig2bed 44 , respectively. CpG methylation scores were calculated by taking the mean methylation score per CpG site across all four samples. CpG sites not covered in all samples were removed. Sites with a methylation score between 0.34 and 0.66 were considered as 50% methylated and retained. Repeats lacking a 50% methylated CCGG sites within 300bp of either end of the repeat were excluded. Utilizing this approach we identified 15 repeats (see Supplementary Table 1 ) which were further tested in the lab. From these repeats, we utilized a total of five repeats (TRiXi 1-5) to reduce the chance of completely uninformative samples. Hpa II digestion Genomic DNA (20-40 ng) was digested at 37°C for 60 minutes using 1× rCutsmart buffer and 1U of methylation-sensitive restriction enzyme Hpa II per sample, as per the manufacturer’s instructions (New England Biolabs, NEB-R0171M). The enzyme was inactivated at 80°C for 20 minutes after digestion. Additionally, for each run, a blank sample and a highly skewed sample were included as positive and negative controls, respectively. PCR amplification After Hpa II digestion polymorphic tri- and tetra-nucleotide repeats from digested and undigested samples were amplified by PCR using a Phusion High-Fidelity Polymerase (New England Biolabs, NEB-M0530L). PCR amplification mix contained 1× GC PCR buffer, 8 nM dNTP mix, 3% v/v DMSO, and 0.4 U Phusion Polymerase. 10% v/v TRiXi primer mix was added to the master mix. PCR was performed using the entire volume of digested DNA (2 µl). For each sample 2 µl of undigested DNA (20 – 40 ng) were also PCR amplified as an undigested control. PCR amplification was performed using the following thermocycler protocol: One cycle of 30 seconds at 98°C; 30 cycles of 10 seconds at 98°C, followed by 30 seconds at 63°C, followed by 40 seconds at 72°C; one cycle of 5 minutes at 72°C. Capillary electrophoresis For fragment analysis, 1 µl of the PCR reaction was transferred to a 96-well plate and diluted in 8 µl Hi-Di Formamide (Thermo Fisher, 4311320) and 0.2 µl GeneScan 600 LIZ sizig standard (Thermo Fisher, 4408399) mix. Sample plates were denatured at 95°C for 5 minutes, cooled on ice, and resolved using a 3500 Genetic Analyzer (Thermo Fisher). Calculating skewing and repeat length Peak area, peak height and nucleotide size was utilized to calculate skewing and repeat length was obtained using GeneMapper5 and calculations were performed in R. Briefly, the .fsa files obtained from the Genetic Analyzer 3500 were loaded into GeneMapper v5 (Thermo Fisher). Peaks were called using microsatellite analysis (default setting with LIZ600+normalization as ladder). The resulting table with peak information was exported and loaded into R where skewing was calculated. First, the two highest peaks (separated by at least 2.5 bases) for each undigested sample were identified and matched to the closest sized peaks in the digested sample, obtaining two peaks for both undigested and digested sample. Samples where the peaks were not distinguishable from each other ( i.e., the peaks were not separated by more than 2.5 bases) in the undigested sample were deemed homozygous and the repeat was excluded from skewing calculations for that sample. Skewing was assessed individually for each repeat, and the mean of all informative repeats were used to determine degree of skewing. The skewing calculation itself was performed as previously described 45 : For each sample, the mean XCI percentage (ranging from 0 to 100%) was calculated, with 50% representing perfectly balanced XCI. XCI values were collapsed to a 50–100% range (as the direction of deviation from 50% is uninformative). Finally, the standard deviation and mean of the total data set was used to determine thresholds for skewing and extreme skewing: Where μ is the population mean and σ is the population standard deviation. Consequently, skewed XCI equated to values > 71.09% and extremely skewed XCI to values > 79.76% ( Fig. 2a ). XCI skew values above either threshold were classified as skewed, or extremely skewed, respectively. Finally, the repeat length was determined by comparing the obtained peak size to the expected PCR product length of a sample with a known number of repeats. Analysis of skewed X-inactivation in Genotype-Tissue Expression (GTEx) donors Skewing was assessed from coupled RNA sequencing (RNA-seq) and whole exome sequencing data (WES) as previously described 6 . Briefly, WES BAM files for 256 female donors were downloaded from AnVIL using the Gen3 client. The files were sorted and converted into fastq files using Samtools (v1.9). Raw fastq reads were quality trimmed using FastP 46 (v.0.20.0) with default settings. BWA-MEM 47 was used for mapping reads to the human genome build 38 (hg38, GCA_000001405.15_GRCh38_no_alt_analysis_set.fna) using default settings. Sambamba 48 v0.8.2 was used to mark duplicate reads. The GATK best practice germline short variant discovery pipeline was used to process the aligned reads, using base quality score recalibration and local realignment at known insertions and deletions (indels) (GATK v.4.2.6.1). Default filters were applied to indel and SNP calls using the variant quality score recalibration (VQSR) approach of GATK. All RNA-seq samples available for each participant (total of 4571 RNA-seq samples) were downloaded from AnVIL as aligned BAM files using the Gen3 client. Samtools (v1.9) was used to sort and convert the BAM files to fastq files and quality trimming was done with FastP (v.0.20.0) with default settings. RNA-seq reads were aligned with STAR 49 2-pass mode (v2.7.10a) with GCA_000001405.15_GRCh38_no_alt_analysis_set.fna and --sjdbGTFfile gencode.v40.annotation.gtf index. WASP filtering was performed to reduce reference bias 50 . Briefly, GATK SelectVariants was used to extract hetSNPs (that passed the VQSR filtering) for each individual from the WES VCFs and subsequently passed to STAR via --varVCFfile and–waspOutputMode. Reads failing WASP filtering were removed. Following data pre-processing, allele-specific expression analysis of the allele counts for hetSNPs was retrieved from RNA-seq data using GATK ASEReadCounter. Heterozygous variants that passed VQSR filtering were first extracted for each sample from WES VCFs using GATK SelectVariants. Sample-specific VCFs and RNA-seq BAMs were input to ASEReadCounter requiring minimum base quality of 20 in RNA-seq data. To remove potentially spurious sites, conservative filters were applied to the data (variant call read depth >= 10 per allele and minor allele read count > 10% of the total variant read count for WES data, and an RNA-seq read depth of at least seven reads). If a gene carried multiple hetSNPs, the hetSNP with the highest read count per tissue and individual was kept. Allele-specific expression was calculated as previously described 51 : Skewing can then be calculated by taking the median allele-specific expression of all expressed non-pseudoautosomal (PAR) X-linked genes in each sample. The closer that value is to 0.5, the more preferential use of either parental allele. For instance, a female with a 100% skewed XCI would have a value of 0.5 while a female with a 50/50 usage of parental alleles would have 0. Similarly to how XCI skew was classified using TRiXi, the standard deviation and mean of the total data set was used to determine thresholds for skewing and extreme skewing: Consequently, skewed XCI equated to values >0.214 and extremely skewed XCI to values >0.29 ( Fig.2A ). XCI skew values above either threshold was classified as skewed, or extremely skewed, respectively. Low-pass whole genome sequencing Whole genome DNA sequencing libraries were prepared with the NEBNext Ultra II DNA Library Prep Kit for Illumina (New England Biolabs, E7645S) and the NEBNext Multiplex Oligos for Illumina Index Primers Set 1 (New England Biolabs, E7335S). 200 ng of DNA were diluted to 50 µl in 1X TE (10 mM Tris-HCl (pH 8.0), 0.1 mM EDTA) and fragmented on the Bioruptor sonicator (Diagenode) to an average fragment size of 300 bp. End prep, sequencing adaptor ligation and PCR amplification with indexing primers were conducted according to the manufacturer’s instructions. Adaptor-ligated DNA was cleaned up and size selected for 250 – 400 bp fragments with AMPure XP beads (Beckman Coulter, A63881) by performing a two-step bead clean up with 25 µl beads in step one and subsequently adding 15 µl beads to the supernatant. Libraries were amplified for three PCR cycles. Quality and size of all libraries was assessed on the TapeStation using the D1000 ScreenTape (Agilent, 5067-5582) and corresponding reagents (Agilent, 5067-5583). Quantification was done with the 1X dsDNA High Sensitivity assay (Invitrogen, Q33231) on the Qubit fluorimeter. Libraries were sequenced on Illumina’s MiSeq machine using v2 reagents (Illumina, MS-102-2002) as 150bp paired-end reads. Each library was sequenced for a minimum of 2.4 million reads resulting in a coverage of >0.2x. Copy number analysis was performed using the R-package QDNASeq 52 . Briefly, the low pass WGS data was mapped to hg38 with BWA-MEM2 53 using default parameters. Raw copy numbers were then estimated by counting the number of reads mapped to non-overlapping bins of 500kb. Sanger sequencing Skewed ABIS samples were analyzed for mutations in the XIST minimal promoter region and the first exon by sanger sequencing. Briefly, 200 ng of sample DNA were amplified with FastStart Taq DNA Polymerase at 5 U/μl (Roche Applied Science, 12032902001). Appropriate DNA primers (Integrated DNA Technologies) were used at a concentration of 5 µM per reaction and designed to amplify the promoter region (Forward: 5’ TGG TTG GGGA GCC ATA CAA GG 3’, reverse: 5’ AGA ATG GGG GAA GGG ATA GG 3’) as well as the minimal promoter, including exon 1 (Forward: 5’ GGT GGA GGA GTT ACA AAT TCT GG 3’, reverse: 5’ TGC AGA GAG ATC TTC AGT CAG G 3’). The reaction mix was incubated on a SimpliAmp Thermal Cycler (Applied Biosystems, A24811) at 95°C for 4 minutes to allow enzyme activation. Thereafter, denaturation was performed at 95°C, followed by annealing at 62°C for 30 seconds each, and extension at 72°C for 60 seconds. This cycle profile was repeated 30 times before terminating with a final extension step for 7 minutes at 72°C. Amplified DNA was diluted to 50 ng/µL and cleaned using the DNA Clean & Concentrator-5 Kit (Zymo research, D4014) according to the manufacturers protocol. The DNA was washed twice and eluted in 20 µL of water. DNA concentration was determined using the NanoDrop™ 2000/2000c Spectrophotometer (Thermo Scientific, ND-2000) and adjusted to 5 ng per µL. Sanger Sequencing was performed at Eurofins genomics using the Mix2Seq LightRun service. The quality of the sequences obtained was inspected using Chromas 2.6.6 DNA sequencing software (Technelysium Pty Ltd, Australia). Sequence alignment was performed using the UCSC Genome browser’s BLAT tool as well as NCBI’s BLASTn to identify possible mutations. Identification of clonal hematopoiesis variants by Amplicon Sequencing We performed amplicon sequencing with the help of the Pillar oncoReveal Myeloid Panel (Illumina, HDA-MY-1001-24), which includes 58 genes involved in clonal hematopoiesis 54 following the protocol provided by the manufacturer (version 4.0). In brief, 40 ng of DNA was diluted in nuclease-free water to a total volume of 4.25 µl followed by targeted PCR amplification of coding sequences and mutation hotspot location of genes of interest using a target-specific pool of primers. Unused primers were removed by digestion with exonuclease I and clean-up of PCR products with AMPure XP magnetic beads (Beckman Coulter, A63881). Gene-specific amplicons were further PCR amplified for six cycles with Pillar Custom Indexing Primers Kit A, Indices PI501-6 and PI701-2 (Illumina, IDX-PI-1001-96). Libraries were quantified and quality controlled on the TapeStation with the D1000 ScreenTape and reagents (Agilent, 5067-5582 and 5067-5583). More than 2.4 million reads were sequenced per sample as 150 bp paired-end reads on the MiSeq sequencer (Illumina). To identify variants associated with clonal hematopoiesis of indeterminate potential, we performed somatic variant calling in the amplicon sequencing data. Briefly, raw fastq reads were quality trimmed using fastp (0.24.0, default settings) and BWA-MEM2 was used to align reads to hg38 (GCA_000001405.15_GRCh38_no_alt_analysis_set.fna) using default settings. Sambamba v1.0.1 was used to mark duplicate reads. The GATK best practice ‘Somatic short variant discovery (SNVs + Indels)’ pipeline was used to process the aligned reads, using base quality score recalibration and local realignment at known insertions and deletions (indels) (GATK v.4.6.1.0). Default filters were applied to indel and SNP calls using the variant quality score recalibration (VQSR) approach of GATK. HaplotypeCaller, Mutect2, GetPileupSummaries, CalculateContamination and FilterMutectCalls (all default settings) were used to obtain analysis-ready vcf files with somatic variant calls. Only variants with ‘PASS’ filter status which had previously been reported as affecting clonal hematopoiesis 55 , 56 were considered to indicate clonal hematopoiesis. Oxford Nanopore long-read sequencing 1.5 µg of genomic DNA was sheared to approximately 10 kb using Covaris g-TUBEs (Covaris, 500291) in an Eppendorf 5415 R centrifuge at 5,000 RPM for 1 minute at room temperature. Library preparation was performed using the Ligation Sequencing Kit V14 (ONT, SQK-LSK114) according to the manufacturer’s protocol (GDE_9161_v114_revY, 30 January 2025). Briefly, DNA repair and end-preparation were conducted using the NEBNext FFPE DNA Repair Mix and Ultra™ II End Prep Enzyme Mix (NEB, E7672S) followed by adapter ligation. The final library was eluted and quantified using the Qubit 1X dsDNA High Sensitivity Assay (Thermo Fisher Scientific, Q33231). A total of 50 fmol of the prepared library was loaded onto a PromethION Flow Cell (ONT, FLO-PRO114) and sequenced on the PromethION 2 integrated device for 72 hours. The sequencing run generated 20.4 million reads at ∼46X coverage with a basecalled N50 read length of approximately 10kbp. The long-read sequencing was performed in collaboration with Clinical Genomics Linköping, SciLifeLab, who also provided technical support. Determining XCI skew from the ONT long-read data was performed as previously described 17 . POD5 files were basecalled and aligned to the human genome build 38 (hg38, GCA_000001405.15_GRCh38_no_alt_analysis_set.fna) using dorado v0.7.4 ( https://github.com/nanoporetech/dorado , which utilizes minimap2 57 for mapping) and the [email protected] model. For modified basecalling, 5mC and 5hmC were called in a GC context. To allow phasing, high-quality variants were called X-linked variants were called using DeepVariant 58 v1.8.0 using the model ‘ONT_R104’ and subsequent filtering with BCFtools 41 (only ‘PASS’ variants were kept). Phasing of the VCF and subsequent haplotag assignment was performed using LongPhase 59 v1.7.3. Reads assigned to incorrect haplotype blocks were identified in Integrative Genomics Viewer 60 (v. 2.19.4) and subsequently corrected. Each finalized modbam file (with haplotags) was then processed individually in R using NanoMethViz 61 v3.2.0. Methylation probabilities for each CCGG site in the TRiXi 1-5 PCR products were extracted per read, using the ‘query_methy’ function. Methylation probabilities were classified as low (and thus, associated with the active X (Xa) if below 0.1 and high (and associated with the Xi) if above 0.9. Within each repeat, the number of haplotype 1/Xa, haplotype 2/Xi, haplotype 1/Xi, and haplotype 2/Xa reads were counted to estimate the repeat-wise skew. To assess XCI skew, the mean of all repeat-wise skew values was used. Code Availability Software for analysis of TRiXi data and the GTEx data is available on github: https://github.com/ColmNestorLab/skewing_XCI . Data availability All sequencing data generated in this study have been deposited in the Swedish National Data Service (SND, https://snd.gu.se/ , a data repository certified by Core Trust Seal). Access to restricted data will require completion of a Data Access Request (DAR) via the SND website. Each Data Access Request will be evaluated individually according to Swedish legislation. Source data are provided with this paper. Author information Contributions C.E.N. managed and designed the study. D.G., M.B., I.J., J.G., J.K., L.H., and M.V. performed experiments. D.G., B.G., M.B. and C.E.N analyzed the data. B.G. performed all bioinformatics analysis. B.G., E.H., S.J., S.H., S.L., M.B., J.L. and C.E.N wrote the manuscript and prepared the figures. Ethics declaration Competing interests C.E.N has filed a patent application for the TRiXi method. The authors declare no other competing interests. SUPPLEMENTARY FIGURE LEGENDS Download figure Open in new tab Supplementary Figure 1. a, overview of the HUMARA assay based on the polymorphic CAG repeat in the AR gene. b, fraction of samples that were heterozygous for TRiXi repeat 1-5. c , boxplot of skewing of the five TriXi repeats across the three XCI skew groups. d , distribution of repeat lengths identified with TRiXi for repeat 1-5, split on XCI skew status. A Kolmogorov–Smirnov (K-S) test was used to statistically test if there was a difference between the XCI skew groups. e , skewing per individual (left) and per repeat (right), from samples classified as ‘skewed’ or ‘extremely skewed’ samples. ANOVA test; ρ = 0.85. SUPPLEMENTARY TABLES Supplementary Table 1. Highly polymorphic tri- and tetra-nucleotide X-linked repeat sequences flanked by 50% methylated HpaII sites tested by multiplexing for suitability in TRiXi. Supplementary Table 2. PCR primers used to amplify the 5 most suitable repeat sequences included in TRiXi. Supplementary Table 3. Skewing of 50 ABIS-samples as measured using the AR-repeat based HUMARA assay, rendering 24% inconclusive samples due to homozygosity at the repeat. Supplementary Table 4. TRiXi-based assessment of allelic skewing in 365 ABIS-samples, with conclusive results showing no individuals homozygous across all five repeat loci. Supplementary Table 5. Skewing of ABIS-samples as measured by mini-TRiXi using 2 out of 5 repeats. Supplementary Table 6. Longitudinal analysis of allelic skewing at age 0-1 year and 14-16 years as determined by the 2-repeat-based miniTRiXi for 50 ABIS-individuals. Supplementary Table 7. Mutation analysis of genes associated with clonal hematopoiesis using the oncoRevealTM Myeloid Panel. 0= no mutation Acknowledgements We acknowledge the Core Facility at the Faculty of Medicine and Health Sciences, Linköping University, for their support with equipment and assistance for sequencing. This work was funded by the European Research Council (XX-Health-101045171). Footnotes ↵ 2 joint first authorship ↵ 3 joint senior authorship REFERENCES 1. ↵ Moreira de Mello , J.C. , Fernandes , G.R. , Vibranovski , M.D. & Pereira , L.V. Early X chromosome inactivation during human preimplantation development revealed by single-cell RNA-sequencing . Sci Rep 7 , 10794 ( 2017 ). 2. ↵ Cerase , A. , Pintacuda , G. , Tattermusch , A. & Avner , P . Xist localization and function: new insights from multiple levels . Genome Biol 16 , 166 ( 2015 ). 3. Chu , C. et al. Systematic discovery of Xist RNA binding proteins . Cell 161 , 404 – 416 ( 2015 ). OpenUrl CrossRef PubMed 4. ↵ Fang , H. , Disteche , C.M. & Berletch, J.B. X Inactivation and Escape: Epigenetic and Structural Features . Front Cell Dev Biol 7 , 219 ( 2019 ). OpenUrl PubMed 5. ↵ Vandenberg , S.G. , Mc , K.V. & Mc , K.A . Twin data in support of the Lyon hypothesis . Nature 194 , 505 – 506 ( 1962 ). OpenUrl PubMed 6. ↵ Gylemo , B. , Bensberg , M. & Nestor , C.E . A whole-organism landscape of X-inactivation in humans . Elife 14 ( 2025 ). 7. ↵ Bartholomay , K.L. , Lee , C.H. , Bruno , J.L. , Lightbody , A.A. & Reiss , A.L . Closing the Gender Gap in Fragile X Syndrome: Review on Females with FXS and Preliminary Research Findings . Brain Sci 9 ( 2019 ). 8. ↵ Wong , C.C. et al. A longitudinal twin study of skewed X chromosome-inactivation . PLoS One 6 , e17873 ( 2011 ). OpenUrl CrossRef PubMed 9. Sharp , A. , Robinson , D. & Jacobs , P . Age- and tissue-specific variation of X chromosome inactivation ratios in normal women . Hum Genet 107 , 343 – 349 ( 2000 ). OpenUrl CrossRef PubMed Web of Science 10. Tukiainen , T. et al. Landscape of X chromosome inactivation across human tissues . Nature 550 , 244 – 248 ( 2017 ). OpenUrl CrossRef PubMed 11. Gylemo , B. et al. A landscape of X-inactivation during human T cell development . Nat Commun 15 , 10527 ( 2024 ). 12. ↵ Shvetsova , E. et al. Skewed X-inactivation is common in the general female population . Eur J Hum Genet 27 , 455 – 465 ( 2019 ). OpenUrl CrossRef PubMed 13. ↵ Bharaj , B.S. , Vassilikos , E.J. & Diamandis , E.P . Rapid and accurate determination of (CAG)n repeats in the androgen receptor gene using polymerase chain reaction and automated fragment analysis . Clin Biochem 32 , 327 – 332 ( 1999 ). OpenUrl CrossRef PubMed Web of Science 14. ↵ Mossner , M. et al. Skewed X-inactivation patterns in ageing healthy and myelodysplastic haematopoiesis determined by a pyrosequencing based transcriptional clonality assay . J Med Genet 50 , 108 – 117 ( 2013 ). OpenUrl Abstract / FREE Full Text 15. ↵ Zito , A. et al. Heritability of skewed X-inactivation in female twins is tissue-specific and associated with age . Nat Commun 10 , 5339 ( 2019 ). OpenUrl PubMed 16. Zito , A. et al. Escape from X-inactivation in twins exhibits intra- and inter-individual variability across tissues and is heritable . PLoS Genet 19 , e1010556 ( 2023 ). OpenUrl PubMed 17. ↵ Gocuk , S.A. et al. Measuring X-Chromosome inactivation skew for X-linked diseases with adaptive nanopore sequencing . Genome Res 34 , 1954 – 1965 ( 2024 ). OpenUrl Abstract / FREE Full Text 18. Swierczek , S.I. et al. Hematopoiesis is not clonal in healthy elderly women . Blood 112 , 3186 – 3193 ( 2008 ). OpenUrl Abstract / FREE Full Text 19. el-Kassar , N. , Hetet, G., Briere, J. & Grandchamp, B. Clonality analysis of hematopoiesis in essential thrombocythemia: advantages of studying T lymphocytes and platelets . Blood 89 , 128 – 134 ( 1997 ). OpenUrl Abstract / FREE Full Text 20. ↵ Busque , L. et al. Skewing of X-inactivation ratios in blood cells of aging women is confirmed by independent methodologies . Blood 113 , 3472 – 3474 ( 2009 ). OpenUrl Abstract / FREE Full Text 21. ↵ Allen , R.C. , Zoghbi , H.Y. , Moseley , A.B. , Rosenblatt , H.M. & Belmont , J.W . Methylation of HpaII and HhaI sites near the polymorphic CAG repeat in the human androgen-receptor gene correlates with X chromosome inactivation . Am J Hum Genet 51 , 1229 – 1239 ( 1992 ). OpenUrl PubMed Web of Science 22. ↵ Chen , G.L. & Prchal , J.T . X-linked clonality testing: interpretation and limitations . Blood 110 , 1411 – 1419 ( 2007 ). OpenUrl Abstract / FREE Full Text 23. ↵ Ludvigsson , J.F. & Abis Study , G . Epidemiological study of constipation and other gastrointestinal symptoms in 8000 children . Acta Paediatr 95 , 573 – 580 ( 2006 ). OpenUrl CrossRef PubMed Web of Science 24. ↵ Nygren , M. , Carstensen , J. , Koch , F. , Ludvigsson , J. & Frostell , A . Experience of a serious life event increases the risk for childhood type 1 diabetes: the ABIS population-based prospective cohort study . Diabetologia 58 , 1188 – 1197 ( 2015 ). OpenUrl CrossRef PubMed 25. ↵ Plenge , R.M. et al. A promoter mutation in the XIST gene in two unrelated families with skewed X-chromosome inactivation . Nat Genet 17 , 353 – 356 ( 1997 ). OpenUrl CrossRef PubMed Web of Science 26. ↵ Busque , L. et al. Recurrent somatic TET2 mutations in normal elderly individuals with clonal hematopoiesis . Nat Genet 44 , 1179 – 1181 ( 2012 ). OpenUrl CrossRef PubMed 27. ↵ Huang , N. et al. Characteristics and clinical evaluation of X chromosome translocations . Mol Cytogenet 16 , 36 ( 2023 ). 28. ↵ Bensberg , M. et al. TET2 as a tumor suppressor and therapeutic target in T-cell acute lymphoblastic leukemia . Proc Natl Acad Sci U S A 118 ( 2021 ). 29. Heyn , P. et al. Gain-of-function DNMT3A mutations cause microcephalic dwarfism and hypermethylation of Polycomb-regulated regions . Nat Genet 51 , 96 – 105 ( 2019 ). OpenUrl CrossRef PubMed 30. ↵ Langemeijer , S.M. et al. TET2 mutations in childhood leukemia . Leukemia 25 , 189 – 192 ( 2011 ). OpenUrl CrossRef PubMed Web of Science 31. ↵ Werner , J.M. , Ballouz , S. , Hover , J. & Gillis , J . Variability of cross-tissue X-chromosome inactivation characterizes timing of human embryonic lineage specification events . Dev Cell 57 , 1995 – 2008 e1995 ( 2022 ). OpenUrl CrossRef PubMed 32. ↵ Agarwal , N. , Nussenzveig , R.H. , Swierczek , S.I. , Parker , C.J. & Prchal , J.T . Does HUMARA assay for assessment of clonal hematopoiesis have shortcomings? Blood 114 , 2357 – 2358 ; author reply 2358-2359 ( 2009 ). OpenUrl FREE Full Text 33. ↵ Swierczek , S.I. et al. Methylation of AR locus does not always reflect X chromosome inactivation state . Blood 119 , e100 – 109 ( 2012 ). OpenUrl Abstract / FREE Full Text 34. ↵ Bolduc , V. et al. No evidence that skewing of X chromosome inactivation patterns is transmitted to offspring in humans . J Clin Invest 118 , 333 – 341 ( 2008 ). OpenUrl CrossRef PubMed Web of Science 35. ↵ Sun , M.X. et al. A female patient carrying a novel DMD mutation with non-random X-chromosome inactivation from a DMD family . BMC Med Genomics 17 , 46 ( 2024 ). 36. Dardik , R. et al. Molecular Mechanisms of Skewed X-Chromosome Inactivation in Female Hemophilia Patients-Lessons from Wide Genome Analyses . Int J Mol Sci 22 ( 2021 ). 37. Sun , Z. , Fan , J. & Wang, Y. X- Chromosome Inactivation and Related Diseases . Genet Res (Camb) 2022 , 1391807 ( 2022 ). 38. ↵ Matsumoto , A. et al. Unfavorable switching of skewed X chromosome inactivation leads to Menkes disease in a female infant . Sci Rep 14 , 440 ( 2024 ). 39. ↵ He , W.B. et al. X-chromosome inactivation pattern of amniocytes predicts the risk of dystrophinopathy in fetal carriers of DMD mutations . Prenat Diagn 39 , 603 – 608 ( 2019 ). OpenUrl PubMed 40. ↵ Choi , J. et al. Not just carriers: experiences of X-linked female heterozygotes . J Assist Reprod Genet 38 , 2757 – 2767 ( 2021 ). OpenUrl PubMed 41. ↵ Danecek , P. et al. Twelve years of SAMtools and BCFtools . Gigascience 10 ( 2021 ). 42. ↵ Stunnenberg , H.G. , International Human Epigenome, C. & Hirst, M. The International Human Epigenome Consortium: A Blueprint for Scientific Collaboration and Discovery . Cell 167 , 1145 – 1149 ( 2016 ). OpenUrl CrossRef PubMed 43. ↵ Kent , W.J. , Zweig , A.S. , Barber , G. , Hinrichs , A.S. & Karolchik , D . BigWig and BigBed: enabling browsing of large distributed datasets . Bioinformatics 26 , 2204 – 2207 ( 2010 ). OpenUrl CrossRef PubMed Web of Science 44. ↵ Neph , S. et al. BEDOPS: high-performance genomic feature operations . Bioinformatics 28 , 1919 – 1920 ( 2012 ). OpenUrl CrossRef PubMed Web of Science 45. ↵ Roberts , A.L. et al. Age acquired skewed X chromosome inactivation is associated with adverse health outcomes in humans . Elife 11 ( 2022 ). 46. ↵ Chen , S. Ultrafast one-pass FASTQ data preprocessing, quality control, and deduplication using fastp . Imeta 2 , e107 ( 2023 ). 47. ↵ Li , H. & Durbin , R . Fast and accurate short read alignment with Burrows-Wheeler transform . Bioinformatics 25 , 1754 – 1760 ( 2009 ). OpenUrl CrossRef PubMed Web of Science 48. ↵ Tarasov , A. , Vilella , A.J. , Cuppen , E. , Nijman , I.J. & Prins , P . Sambamba: fast processing of NGS alignment formats . Bioinformatics 31 , 2032 – 2034 ( 2015 ). OpenUrl CrossRef PubMed 49. ↵ Dobin , A. et al. STAR: ultrafast universal RNA-seq aligner . Bioinformatics 29 , 15 – 21 ( 2013 ). OpenUrl CrossRef PubMed Web of Science 50. ↵ van de Geijn , B. , McVicker , G. , Gilad , Y. & Pritchard , J.K . WASP: allele-specific software for robust molecular quantitative trait locus discovery . Nat Methods 12 , 1061 – 1063 ( 2015 ). OpenUrl CrossRef PubMed 51. ↵ Castel , S.E. , Levy-Moonshine , A. , Mohammadi , P. , Banks , E. & Lappalainen , T . Tools and best practices for data processing in allelic expression analysis . Genome Biol 16 , 195 ( 2015 ). 52. ↵ Scheinin , I. et al. DNA copy number analysis of fresh and formalin-fixed specimens by shallow whole-genome sequencing with identification and exclusion of problematic regions in the genome assembly . Genome Res 24 , 2022 – 2032 ( 2014 ). OpenUrl Abstract / FREE Full Text 53. ↵ Vasimuddin , M. , Misra , S. , Li , H. & Aluru , S . Efficient Architecture-Aware Acceleration of BWA-MEM for Multicore Systems . Int Parall Distrib P , 314 – 324 ( 2019 ). 54. ↵ Pich , O. , Reyes-Salazar , I. , Gonzalez-Perez , A. & Lopez-Bigas , N . Discovering the drivers of clonal hematopoiesis . Nat Commun 13 , 4267 ( 2022 ). OpenUrl CrossRef PubMed 55. ↵ Kar , S.P. et al. Genome-wide analyses of 200,453 individuals yield new insights into the causes and consequences of clonal hematopoiesis . Nat Genet 54 , 1155 – 1166 ( 2022 ). OpenUrl CrossRef PubMed 56. ↵ Weinstock , J.S. et al. Aberrant activation of TCL1A promotes stem cell expansion in clonal haematopoiesis . Nature 616 , 755 – 763 ( 2023 ). OpenUrl CrossRef PubMed 57. ↵ Li , H . Minimap2: pairwise alignment for nucleotide sequences . Bioinformatics 34 , 3094 – 3100 ( 2018 ). OpenUrl CrossRef PubMed 58. ↵ Poplin , R. et al. A universal SNP and small-indel variant caller using deep neural networks . Nat Biotechnol 36 , 983 – 987 ( 2018 ). OpenUrl CrossRef PubMed 59. ↵ Lin , J.H. , Chen , L.C. , Yu , S.C. & Huang , Y.T . LongPhase: an ultra-fast chromosome-scale phasing algorithm for small and large variants . Bioinformatics 38 , 1816 – 1822 ( 2022 ). OpenUrl CrossRef PubMed 60. ↵ Robinson , J.T. et al. Integrative genomics viewer . Nat Biotechnol 29 , 24 – 26 ( 2011 ). OpenUrl CrossRef PubMed Web of Science 61. ↵ Su , S. et al. NanoMethViz: An R/Bioconductor package for visualizing long-read methylation data . PLoS Comput Biol 17 , e1009524 ( 2021 ). OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted November 27, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following TRiXi: A Multi-Target Tandem Repeat-Based Method for Accurate Detection of X-Inactivation Skewing in Humans Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share TRiXi: A Multi-Target Tandem Repeat-Based Method for Accurate Detection of X-Inactivation Skewing in Humans Dóra Goldmann , Björn Gylemo , Maike Bensberg , Ingela Johansson , Svenja Löffert , Júlia Goldmann , Lisa Haglund , Magdalena Vitkova , Janos Kondri , Sandra Hellberg , Engla Haglund , Shadi Jafari , Johnny Ludvigsson , Colm E. Nestor medRxiv 2025.11.24.25340860; doi: https://doi.org/10.1101/2025.11.24.25340860 Share This Article: Copy Citation Tools TRiXi: A Multi-Target Tandem Repeat-Based Method for Accurate Detection of X-Inactivation Skewing in Humans Dóra Goldmann , Björn Gylemo , Maike Bensberg , Ingela Johansson , Svenja Löffert , Júlia Goldmann , Lisa Haglund , Magdalena Vitkova , Janos Kondri , Sandra Hellberg , Engla Haglund , Shadi Jafari , Johnny Ludvigsson , Colm E. Nestor medRxiv 2025.11.24.25340860; doi: https://doi.org/10.1101/2025.11.24.25340860 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Genetic and Genomic Medicine Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (300) Cardiovascular Medicine (4435) Dentistry and Oral Medicine (444) Dermatology (382) Emergency Medicine (608) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1509) Epidemiology (15227) Forensic Medicine (30) Gastroenterology (1124) Genetic and Genomic Medicine (6597) Geriatric Medicine (668) Health Economics (997) Health Informatics (4534) Health Policy (1368) Health Systems and Quality Improvement (1613) Hematology (540) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15916) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (146) Nephrology (667) Neurology (6599) Nursing (346) Nutrition (998) Obstetrics and Gynecology (1144) Occupational and Environmental Health (957) Oncology (3332) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (663) Pediatrics (1693) Pharmacology and Therapeutics (691) Primary Care Research (711) Psychiatry and Clinical Psychology (5447) Public and Global Health (9230) Radiology and Imaging (2198) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (593) Sexual and Reproductive Health (712) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a005b6096864ad07',t:'MTc3OTU1NjYxNA=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00