Genetic Spectrum of Autism Spectrum Disorder Associated Variants in the Indian Population: Insights from 1,029 IndiGenomes

preprint OA: closed Public-Domain
📄 Open PDF Full text JSON View at publisher
Full text 50,286 characters · extracted from preprint-html · click to expand
Genetic Spectrum of Autism Spectrum Disorder Associated Variants in the Indian Population: Insights from 1,029 IndiGenomes | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Genetic Spectrum of Autism Spectrum Disorder Associated Variants in the Indian Population: Insights from 1,029 IndiGenomes View ORCID Profile Mukesh Kumar , Treesa Issen , Mohammed Swalih , View ORCID Profile Srishti Sharma , View ORCID Profile Sheffali Gulati , View ORCID Profile Sridhar Sivasubbu , View ORCID Profile Vinod Scaria , View ORCID Profile BK Binukumar doi: https://doi.org/10.1101/2025.08.14.25333641 Mukesh Kumar 1 CSIR Institute of Genomics and Integrative Biology , Mall Road, New Delhi - 110007, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Mukesh Kumar Treesa Issen 1 CSIR Institute of Genomics and Integrative Biology , Mall Road, New Delhi - 110007, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Mohammed Swalih 1 CSIR Institute of Genomics and Integrative Biology , Mall Road, New Delhi - 110007, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Srishti Sharma 1 CSIR Institute of Genomics and Integrative Biology , Mall Road, New Delhi - 110007, India 2 Academy of Scientific and Innovative Research (AcSIR) , Ghaziabad-201002, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Srishti Sharma Sheffali Gulati 3 All India Institute of Medical Sciences , New Delhi, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Sheffali Gulati Sridhar Sivasubbu 1 CSIR Institute of Genomics and Integrative Biology , Mall Road, New Delhi - 110007, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Sridhar Sivasubbu Vinod Scaria 1 CSIR Institute of Genomics and Integrative Biology , Mall Road, New Delhi - 110007, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Vinod Scaria BK Binukumar 1 CSIR Institute of Genomics and Integrative Biology , Mall Road, New Delhi - 110007, India 2 Academy of Scientific and Innovative Research (AcSIR) , Ghaziabad-201002, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for BK Binukumar For correspondence: binukumar{at}igib.res.in binukumarbk{at}gmail.com Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Background Autism spectrum disorder (ASD) is a lifelong neurodevelopmental condition characterised by social and behavioural challenges. It is highly heritable, with estimates ranging from 40-90% and a liability-scale heritability of 0.924, underscoring the role of genetic variants in its pathogenesis. Limited studies from India hinder an accurate assessment of the country’s true ASD genetic spectrum. Aim To investigate the genetic spectrum in an Indian control dataset, providing baseline variant frequency data to facilitate interpretation of disease-associated variants in the Indian population. Methods We compiled a strongly ASD-linked gene panel from the SFARI and ClinGen databases, followed by the extraction of gene-associated variants from the IndiGenomes dataset. A stepwise analysis pipeline was implemented, including variant annotation, filtering for minor allele frequency (MAF 0.75), and loss-of-function prediction with LoFTEE (high confidence). Variants were then classified according to ACMG-AMP guidelines. Results We identified 1,531,327 variants from 517 ASD panel genes (MAF 0.75) and 537 LoF variants (LoFTEE; high confidence). Missense and LoF variants contributed 37% and 63% of the filtered data, respectively. Fifty-five variants from 28 genes were classified as pathogenic/likely pathogenic, while 10 variants in 6 genes showed significantly higher MAF (p < 0.05; Fisher’s exact test). Carrier numbers were estimated for autosomal recessive inheritance models. Conclusion This study provides a comprehensive spectrum of ASD-related genetic variants in the Indian population, offering valuable insights for ASD diagnosis, genetic interpretation, and understanding of underlying molecular mechanisms. Introduction The term "autism" originally described self-withdrawal in schizophrenia but was redefined in the 1940s by Dr. Leo Kanner and Dr. Hans Asperger to describe children with social, communication, and repetitive behavioural challenges [ 1 ]. Their work, influenced by Georg Frankl’s idea of disrupted ‘affective language’ and ‘word language’, helped define autism as a neurobiological spectrum, now recognised as Autism Spectrum Disorder (ASD) under Diagnostic and Statistical Manual of Mental Disorders (DSM-5; a reference book on mental health and brain-related conditions and disorders) [ 2 ]. ASD includes neurodevelopmental conditions affecting social interaction, communication, and behaviour, encompassing autism, Asperger syndrome, PDD-NOS, and related genetic conditions [ 3 ]. Global ASD prevalence is 0.77%, with higher rates (1.14%) observed in males [ 4 ]. The four studies, including rural (4,750 children) and urban populations totalling 125,849 children, highlight urban-focused ASD prevalence research. The pooled ASD prevalence was 0.11% (95% CI: 0.01–0.20) in rural children (1–18 years old) and 0.09% (95% CI: 0.02–0.16) in urban children (0–15 years old) [ 5 – 9 ]. Limited ASD studies in India hinder the understanding of the true national burden [ 5 ]. ASD is highly heritable, with a liability-scale heritability of 0.924, with twin and family studies estimating heritability between 40% and 90%[ 10 , 11 ]. Genetic causes, including de novo mutations and rare variants (MAF ≤ 0.1%) and common variants (small effect), explain 20–25% of ASD cases [ 10 , 12 – 15 ]. In a cohort of 199 individuals (144 ASD cases and 55 siblings), 243 rare de novo variants (DNVs) were identified. Rare de novo variants (DNVs) were observed in 71.5% of ASD cases and 63% of unaffected siblings, with a comparable mean DNV rate per child (1.24 in ASD vs. 1.18 in siblings), aligning with previous studies [ 15 ]. ASD-associated genes are catalogued in well-known databases, including SFARI [ 16 ] and ClinGen [ 17 ], though a standardised and stringent, clinically validated ASD gene panel remains lacking. Despite research identifying many ASD-associated genes, the pathogenic variant spectrum remains unclear, especially in underrepresented populations like India. To address this, we analysed whole-genome sequencing data from 1,029 self-reported healthy individuals in the IndiGenomes project [ 18 ]. This study developed a stringent ASD gene panel using the SFARI and ClinGen databases to explore the distribution of rare variants in the underrepresented Indian population. METHODS IndiGenome population dataset The IndiGen project involved whole-genome sequencing of 1,029 self-declared healthy individuals from diverse geographical regions across India, representing the country’s broad ancestral diversity. The cohort comprised 495 males (mean age: 41.35 years) and 534 females (mean age: 32.96 years). All participants underwent health screening to exclude major known diseases and provided informed consent per the Institutional Human Ethics Committee (IHEC) guidelines of the CSIR-Institute of Genomics and Integrative Biology. Variant data and allele frequencies from this cohort have been previously published in the IndiGenomes database[ 18 ]. Collation and Prioritisation of Autism Spectrum Disorder Genes A curated list of ASD-associated genes was compiled from two well-established resources: the Simons Foundation Autism Research Initiative (SFARI) Gene database and the ClinGen Intellectual Disability and Autism Gene Curation Expert Panel. A total of 1333 genes from the SFARI and the ClinGen database. To generate a stringent ASD gene list, we prioritised genes with an EAGLE (Evaluation of Autism Gene Link Evidence; quantitative metric for ASD genes) score, greater than 12, as well as those classified as Syndromic (S; genes cause syndromes often featuring ASD) or High Confidence 1 (HC=1; genes have strong replicated ASD evidence) in the SFARI database, and genes marked as Definitive (DE; genes have long-established, proven disease links) or Strong (convincing but shorter-term supporting evidence) in ClinGen. Genes from ClinGen were excluded if they had an EAGLE score below 12 and lacked both Syndromic and HC1 classification, and a final, non-redundant ASD gene list was compiled ( Figure 1 ). Download figure Open in new tab Figure 1: Workflow outlining the gene prioritisation strategy using curated gene lists from the SFARI and ClinGen databases. High-confidence ASD-associated genes were selected through stringent filtering criteria to ensure relevance and specificity. Preparation of BED File for Targeted Genomic Analysis of ASD-Associated Genes The targeted BED file was prepared using Matched Annotation from NCBI and EMBL-EBI (MANE) transcripts, covering the entire gene regions of the prioritised ASD gene panel. BED file generation was performed using a Linux-based command-line interface (CLI), with hg38 refGene annotations downloaded from the NCBI FTP platform (release 1.4). BCFtools was used to extract targeted variants from the IndiGenomes normalised VCF, representing whole-genome data of 1,029 self-reported healthy individuals, using the prepared BED file as the target region input. Variant Annotation Variant annotation was conducted using a customised and updated ANNOVAR pipeline via a Linux-based command-line interface. Gene-based annotations utilised the RefSeq refGene database. Known variants were annotated using avsnp151 (dbSNP build 151). Functional predictions were derived from dbNSFP v4.7a, which integrates multiple in silico tools. Clinical significance was assessed using ClinVar (April 2025 release). Population allele frequencies were annotated using IndiGenomes1029 (Indian dataset), 1000 Genomes (August 2015), gnomAD v4.1 exome/genome (2023), and the GME Variome Project. Splicing effects were assessed using dbscSNV v1.1, while regulatory intronic variants were annotated using regSNP-intron. REVEL scores were used to prioritise potentially damaging missense variants. Variants were prioritised through a structured, multi-step filtering process. Initially, variants with a minor allele frequency (MAF) greater than 5% in the 1000 Genomes Project, gnomAD exome, and gnomAD genome datasets were excluded to remove common polymorphisms. Synonymous variants and those with unknown consequences were filtered out to focus on potentially functional changes. Prioritisation of Missense ASD Gene Panel Variants Following variant annotation using ANNOVAR, missense variants were extracted using variant class annotation filters from ExonicFunc_refGene. Subsequently, predicted deleterious missense (nonsynonymous) variants were prioritised using the REVEL in-silico predictor, which integrates scores from multiple tools, including MutPred, FATHMM v2.3, VEST 3.0, PolyPhen-2, SIFT, PROVEAN, MutationAssessor, MutationTaster, LRT, GERP++, SiPhy, phyloP, and phastCons[ 19 ]. REVEL is a meta-predictor trained on new diseases and harmless variants for better accuracy. Missense variants with a REVEL score greater than 0.75 were retained for further analysis. LoF (Loss-of-Function) Variant Annotation and Prioritisation Loss-of-function (LoF) variants were annotated and assessed for high-confidence (HC) classification using the Variant Effect Predictor (VEP) integrated with the LoFTEE plugin[ 20 ]. Annotation was performed by focusing specifically on MANE (Matched Annotation from NCBI and EMBL-EBI) transcripts to ensure consistency and accuracy in transcript selection. High-confidence LoF variants were prioritised for downstream analysis based on LoFTEE’s stringent filtering criteria. Classification of Prioritised Variants Prioritised genetic variants from the IndiGenome control dataset were processed for the classification recommended by ACMG-AMP (American College of Medical Genomics & Genetics - Association of Molecular Pathology) standard guidelines and previously published work [ 21 , 22 ]. Variants were categorised: pathogenic, likely pathogenic, benign, likely benign, and variants of uncertain significance (VUS). In the first step, classification based on allele frequency thresholds used data from the 1000 Genomes Project, gnomAD v4.1 exome and gnomAD v4.1 genome: BA1 (>5%), BS1 (1–5%), and PM2 (<0.05%). Next, computational predictions from SIFT, PolyPhen-2, and CADD assigned PP3 if at least two predicted deleterious effects, or BP4 if two predicted tolerated effects. The third step involved evidence from ClinVar for PP5 (pathogenic) and BP6 (benign) classifications. PM1 was applied when variants occurred within critical protein domains identified from Pfam. In the fourth step, literature evidence was integrated: PS3/BS3 (functional assays), PS4/BP5 (case-control studies), PP1/BS4 (cosegregation analysis), PS2/PM6 (confirmed or assumed de novo variants), and PP4 (clinical phenotyping supporting variant-disease association). Additional ACMG criteria were considered: BP7 (silent changes), PS1 and PM5 (same or different amino acid change at the same residue), PM3 and BP2 (compound heterozygosity in trans or cis), PM4 (indels outside repeat regions), and BP3 (indels within repeats). All evidence was compiled and interpreted using the University of Maryland’s Genetic Variant Interpretation Tool [ 23 ]. The PVS1 criterion was assigned to a loss-of-function (LoF) variant only if it satisfied five specific conditions. First, the variant had to be located in the major transcript of the gene, as defined by MANE. Second, the gene needed to be reported in ClinVar with at least 20 pathogenic or likely pathogenic (P/LP) LoF variants, contributing at least 5% of all the P/LP variants reported in that gene (that is, the variant count should be at least 20, contributing ≥5% of the total P/LP variants). Third, the variant had to be predicted as deleterious by AutoPVS1, either classified as ‘definitive’ in ClinGen or as ‘high confidence’ in SFARI. Fourth, the gene should have published literature supporting its association with autism spectrum disorder (ASD) or related overlapping clinical conditions involving a loss-of-function mechanism. Finally, any variant showing a relatively high minor allele frequency (MAF ≥ 1%) in the IndiGen dataset was excluded from PVS1 assignment. IndiGenomes vs Global: Frequency Comparison of Pathogenic Variants For comparative analysis, ASD gene-panel-based variants classified as P/LP according to ACMG-AMP standards were considered. Minor allele frequencies (MAFs) of these variants were then extracted from the gnomAD database version 4.1.0 for major global populations represented by the following abbreviations: AFR (African/African American), AMR (Latino/Admixed American), ASJ (Ashkenazi Jewish), EAS (East Asian), FIN (Finnish), NFE (Non-Finnish European), SAS (South Asian), AMI (Amish), MID (Middle Eastern), and OTH (Other/Unassigned). Variant frequency comparisons across these populations were conducted, and statistical significance was determined using Fisher’s exact test with Bonferroni correction for multiple testing (p-value < 0.05). RESULTS Autism Spectrum Gene Prioritised from SFARI and ClinGen Databases A total of 1,230 genes were retrieved from the SFARI database, and 329 genes from the ClinGen panel. The SFARI gene list included 304 Syndromic (S) genes, 234 High Confidence Score 1 (HC=1) genes, 711 strong candidate (SC=2) genes, and 191 suggestive evidence (SE=3) genes. The ClinGen panel comprised 254 genes in the Definitive (DE) category, 2 genes in the Strong category, 17 genes in the Moderate category, and 47 genes in the Other category. To generate a stringent ASD gene panel, genes from SFARI with an EAGLE score greater than 12 were combined with ClinGen genes classified as Definitive and Strong, resulting in a filtered set of genes. Additionally, SFARI genes categorised as Syndromic (S) and HC1 were integrated with ClinGen’s DE and Strong genes. After merging and removing duplicates, a final unique list of 517 ASD-associated genes was prepared for downstream analysis. The details of the stringent gene panel and its constituent genes are summarised in Figure 1 and Supplementary Table 1. Genetic Spectrum of ASD Related Gene Variants A total of 1,798,502 variants were identified across ∼88 Mb of cumulative genomic regions spanning 517 ASD-associated genes, based on the gene panel selected for analysis. Following the initial filtering, 1,531,327 variants were retained with a minor allele frequency (MAF) < 5%, eliminating common variants and enriching the dataset for rare variants potentially relevant to ASD. To assess missense variant pathogenicity, REVEL scores were used as a predictive filter. Applying a threshold of REVEL greater than 0.75, indicative of a high likelihood of deleterious impact, yielded 298 missense variants across 130 genes. Parallelly, loss-of-function (LoF) variants were identified using Variant Effect Predictor (VEP) in conjunction with the LoFTEE plugin. Initial annotation identified 584 LoF variants. High-confidence filtering was then applied by: (i) restricting to MANE Select transcripts, and (ii) retaining only those LoF variants flagged as high-confidence (HC) by LoFTEE. This filtering resulted in a refined set of 537 high-confidence LoF variants. A total of 835 prioritised variants, including 298 missense and 537 loss-of-function (LoF) variants, were identified across 264 ASD-associated genes. Among these, 67 genes carried both missense and LoF variants, underscoring the broad spectrum of potentially impactful genetic alterations observed within ASD-associated genes. These variants represent a comprehensive set of potentially pathogenic alterations in ASD-associated genes within the Indian control population. The distribution and composition of these prioritised variants are detailed in Supplementary Table 2. The final list of predicted damaging variants based on the ASD gene panel is summarised in Figure 2 , offering a visual overview of the genetic landscape. Download figure Open in new tab Figure 2: Percentage distribution of genetic variants across 517 genes in the IndiGenomes control dataset after variant prioritisation. The figure illustrates the proportion of different variant types or classes observed within the prioritised gene set. Assessment of Non-Synonymous/Missense Variants In this analysis, 298 missense variants across 130 ASD-associated genes were assessed using ACMG-AMP classification criteria to evaluate their potential clinical significance. Among these, 1 variant was classified as pathogenic and 11 as likely pathogenic, collectively spanning 10 genes. Additionally, 3 variants were likely benign, each found in a distinct gene. Notably, the majority, 283 variants across 128 genes, were classified as variants of uncertain significance (VUS), reflecting the current limitations in variant interpretation. The classification distribution, including pathogenic, likely pathogenic, likely benign, and VUS categories, is illustrated in Figure 3 as a stacked bar plot for visual clarity. Download figure Open in new tab Figure 3: Distribution of classified non-synonymous variants based on ACMG guidelines in the ASD panel gene list. The figure includes two panels, Set-1 and Set-2, each showing the number of variants per gene categorised by ACMG classification (Pathogenic, Likely Pathogenic, VUS, and Likely Benign). This representation highlights the gene-wise burden of clinically relevant variants across the IndiGenomes dataset. Evaluation of Loss-of-Function (LoF) Variants A total of 537 loss-of-function (LoF) variants were analysed and classified according to ACMG-AMP guidelines. This dataset included 47 splice-acceptor variants, 35 splice-donor variants, 356 frameshift insertions/deletions (indels), and 99 stop-gain variants. These were distributed across 201 ASD-associated genes, of which 18 genes harboured 43 variants classified as pathogenic. The remaining 494 variants across 187 genes were designated as variants of uncertain significance (VUS). The distribution of pathogenic variants across these 18 genes is depicted in Figure 4 , showcasing the spectrum of high-confidence LoF variants and their ACMG classifications. Download figure Open in new tab Figure 4: Depiction of all variants in genes containing Pathogenic (P) and Likely Pathogenic (LP) variants prioritised based on loss-of-function (LoF) impact from the ASD panel gene list. The stacked bar plot illustrates the number of LP and P variants across 19 genes harbouring LoF variants. ACMG Attributes Matrix of Classified Pathogenic and Likely Pathogenic Variants According to the ACMG-AMP guidelines, all sorted, filtered, and prioritised variants, including missense and loss-of-function (LoF) variants, were systematically organised. A total of 55 variants were classified, comprising 44 pathogenic (P) and 11 likely pathogenic (LP) variants. These are visualised in Figure 5 , where each variant is shown along the x-axis and the corresponding ACMG evidence attributes are plotted on the y-axis in a binary matrix. The presence of an ACMG attribute is marked as ’1’, and its absence is left blank. The matrix allows intuitive visualisation of the supporting evidence for each variant, with colour-coded bars indicating final classifications (pathogenic or likely pathogenic) based on ACMG criteria. Download figure Open in new tab Figure 5: ACMG classification and supporting evidence for all Likely Pathogenic (LP) and Pathogenic (P) variants. The heatmap displays the presence of ACMG attributes used for classification across LP and P variants identified in the ASD panel gene list from the IndiGenomes control dataset. Zygosity Profiles and Inheritance Correlation of Variants in IndiGenome To understand the individual-level genotype of 55 variants, LP (likely pathogenic) and P (Pathogenic) in the IndiGenome dataset, we investigated the homozygous (hom), heterozygous (het), and total allele count (AC) called across the IndiGenome dataset for a total of 28 genes. The thorough literature investigation of all the genes revealed that 3 genes follow the autosomal recessive (AR), 25 genes are autosomal dominant with conflicting evidence of mode of inheritance (AD), and 3 genes are X-linked with conflicting mode of inheritance (MOI). This analysis yielded an interesting observation regarding the zygosity of gene variants with MOI in the context of carriers and the anticipated genetic backgrounds of individuals with ASD. We identified 11 (1 in 93; 1.06%) expected carriers with a predicted genetic predisposition to ASD in control data, considering certain limitations of MOI, such as conflicting MOI and variability in disease penetrance. The complete set of analysed information is presented in Figure 6 and Table 1 . Download figure Open in new tab Figure 6: Zygosity distribution of ACMG-classified variants in the ASD gene panel. (A) Heatmap illustrating the counts of individuals with homozygous (hom) and heterozygous (het) Likely Pathogenic (LP) and Pathogenic (P) variants. (B) Heatmap showing the zygosity counts (hom and het) of LP and P variants stratified by gene. (C) Heatmap depicting counts of unique individuals with hom or het LP/P variants, where multiple occurrences of the same zygosity state within an individual are counted only once. View this table: View inline View popup Table 1: Haplotype profile of likely pathogenic (LP) and pathogenic (P) variants in the IndiGen control dataset. Notations: het_raw_per_variant = number of heterozygous genotypes per variant, hom_raw_per_variant = number of homozygous genotypes per variant, het_raw_per_gene = number of heterozygous genotypes per gene, hom_raw_per_gene = number of homozygous genotypes per gene, uniq_het_for_moi_per_gene = unique heterozygous variants per gene based on mode of inheritance (MOI) for the condition (ASD), uniq_hom_for_moi_per_gene = unique homozygous variants per gene based on MOI for the condition (ASD) and uniq_het_for_rec_pcond_CARRIER = unique heterozygous variants for recessive MOI per condition (ASD) representing carriers. Global Allele Frequency Analysis of ASD Gene Variants A total of 55 genetic variants, 11 likely pathogenic and 44 pathogenic based on ACMG guidelines across 28 genes, were analysed to explore population-specific associations with Autism Spectrum Disorder (ASD). Minor Allele Frequencies (MAF) from the IndiGen dataset were compared with those from global populations. This comparison revealed 10 variants across 6 genes that are significantly enriched in the Indian population, using a corrected p-value threshold of less than 0.05. These enriched variants are visualised in a bubble plot, where they are encircled, with the corresponding genes prominently highlighted at the top of the graph ( Figure 7 ). This population-specific enrichment underscores the importance of including diverse genetic backgrounds in ASD research for improved diagnosis and understanding of genetic risk in underrepresented groups. Download figure Open in new tab Figure 7: Cross-population comparison of minor allele frequencies (MAF) for Likely Pathogenic (LP) and Pathogenic (P) variants from IndiGenomes. This bubble plot visualises the MAF of LP and P variants identified in the IndiGenomes control dataset across major gnomAD v4.1 populations, including: African/African-American (AFR), Latino/Admixed American (AMR), Amish (AMI), Ashkenazi Jewish (ASJ), East Asian (EAS), Finnish (FIN), Non-Finnish European (NFE), Middle Eastern (MID), South Asian (SAS), and the Overall population. Variants are plotted on the x-axis, grouped by their respective genes, indicated at the top of the plot with an overlay graphic. Bubble size reflects the MAF in each population. Red-circled data points indicate statistically significant allele frequency differences (p < 0.05) based on Fisher’s exact test with Bonferroni correction. Discussion This study offers the first insight into the genetic landscape and potential predisposition to Autism Spectrum Disorder (ASD) in an Indian control cohort, contributing to our broader understanding of its molecular basis in underrepresented populations. We analysed 1,798,502 variants from 517 genes with strong evidence of ASD association, sourced from the IndiGenomes dataset. Through stringent filtering, we prioritised 844 potentially damaging variants. Missense variants were filtered using a high-level confidence REVEL score greater than 0.75, while LoF variants were filtered using LoFTEE’s high-confidence (HC) designation[ 19 , 20 ]. Pathogenicity assessment using ACMG guidelines identified 55 variants composed of 44 pathogenic (P) and 11 likely pathogenic (LP) that include 12 missense from 10 genes and 43 loss-of-function (LoF) variants from 18 genes. This concealed the finding with a higher burden observed in the LoF category in our analysis. Our findings underscore the importance of population-specific variant interpretation and lay the groundwork for future ASD-focused genetic studies in Indian populations. The data from 55 P/LP variants, as interpreted by ACMG in 28 ASD-associated genes, suggest that 10 variants have been observed in other populations, as depicted in Figure 7 . Literature evidence indicates that PAH, NBEA, ANKRD11, CYP27A1, and FMR1 each have atleast 2 P/LP variants linked to ASD, including biallelic, loss-of-function, truncating, and repeat-expansion mutations [ 24 – 28 ]. Similarly, DYRK1A, ANK2, ARID1B, KMT2C, and ZNF462 harbour atleast 3 or more such variants, spanning loss-of-function, rare damaging, and protein-truncating alterations associated with ASD [ 29 – 33 ]. Importantly, the analysis revealed LP/P variants in 13 genes from the 28-gene ASD panel (KDM5B, CHD8, CHD2, CREBBP, ANKRD11, DYRK1A, ANK2, ARID1B, KMT2C, CACNA1C, GFAP, SCN2A, and SCN1A), each previously present in a large ASD cohort study [ 34 ]. The recurrence of these genes and variant classes across studies not only reinforces their clinical relevance but also emphasises the value of integrating population-specific genomic data with global literature to refine diagnostic panels and improve risk assessment in ASD. Genotyping of control data at the individual level was used to assess the distributions of homozygous and heterozygous variants across the 28 genes. Literature-supported classification of these genes by mode of inheritance (MOI), autosomal recessive (AR), autosomal dominant (AD), X-linked recessive (XLR), and X-linked dominant (XLD), revealed notable patterns in variant zygosity consistent with established MOIs, offering insights into carrier status and genetic backgrounds in the control population ( Table 1 and Table 2 ). We identified 11 carrier individuals with genotypes potentially linked to ASD, while noting limitations such as uncertain MOI annotations and incomplete penetrance of certain genes ( Figure 6 , Table 1 ). Many ASD-associated genes containing pathogenic or likely pathogenic variants are reported to follow an autosomal dominant MOI, often exhibiting variable penetrance, incomplete dominance, and differing degrees of heritability. In this study, the control dataset comprised individuals already designated as healthy controls; therefore, the analysis was not based on their clinical disease status, as penetrance and heritability can vary between individuals [ 10 , 11 ]. This approach offers a comprehensive perspective on LP/P variants classified and organised according to rigorously standardised ACMG guidelines. View this table: View inline View popup Table 2: Genes Implicated in Autism Spectrum Disorder: Modes of Inheritance (MOI), Phenotypic Spectrum, and Evidence from Literature. Population-level analysis revealed 10 variants across six genes (PAH, NF1, ADSL, TRIO, and ZNF462) with significantly higher frequencies in the Indian population (corrected p < 0.05, Fisher’s exact test). Most of these variants showed concordance with minor allele frequencies reported in South Asian (SAS) populations. These enriched variants, illustrated in the bubble plot ( Figure 7 ), highlight the importance of incorporating diverse and underrepresented genetic backgrounds into ASD research. Such inclusion can improve the diagnostic yield, refine variant interpretation, and enhance our understanding of population-specific genetic risk factors in ASD. Data Availability All data produced in the present study are available upon reasonable request to the authors Authors Contribution BK conceived the study, supervised the analysis, and proofread the manuscript. MK designed the data analysis pipeline, prepared the initial manuscript draft, interpreted the variants, and performed a thoroughly conceptualised analysis. TI carried out formal data analysis, interpreted variants, and proofread the manuscript. MS and SS conducted formal analysis, variant interpretation and proofread the manuscript. SG contributed valuable insights that informed and strengthened the study. SSB and VS provided genomic sequencing data and proofread the manuscript. Data Availability The datasets supporting the findings of this study are available from the corresponding author upon reasonable request. However, the necessary supplementary data are provided with the manuscript as supplementary files. Statement of Ethics The authors attest that they obtained all the necessary participant consent papers. The participant has provided his agreement in the form of his clinical information to be published in the journal. The participants understand that their names and initials will not be published. Declaration of Conflict of Interest The author affirms no conflicts of interest regarding research, authorship, or publication. Funding This research was supported by grants from Waters India Pvt. Ltd. (Grant No. CLP009037). Supplementary data Supplementary Table 1: Supplementary Table 1: Prioritisation of ASD gene panel, showing 517 unique genes from SFARI and ClinGen. Abbreviations: S-Syndromic, HC-High Confidence, SC-Strong Candidate, SE-Suggestive Evidence, DE-Definitive, 1S (HC+S),2S(SC+S), 3S(SE+S) Supplementary Table 2: Predicted damaging genetic variants identified from the IndGenomes dataset using the ASD gene panel (517 genes), filtered using REVEL scores >0.75 for missense variants and LoFTEE-predicted high-confidence loss-of-function (LoF) variants. Supplementary Table 3: Highlighting the PVS1 assignment criteria, the satisfying variants (P/LP) are listed with their parameters. Acknowledgement MK, TI, and MS acknowledge financial support from the project grant (Code: CLP009037). SS acknowledges the University Grants Commission, Senior Research Fellowship (UGC-SRF) for fellowship support. This research was additionally supported by funding from the Council of Scientific and Industrial Research (CSIR). Computational analyses were performed using the High-Performance Computing (HPC) facility at CSIR-IGIB. References 1. ↵ Dell’Osso L , Luche RD , Gesi C , Moroni I , Carmassi C , Maj M . From Asperger’s to DSM-5 Autism Spectrum Disorder and Beyond: A Subthreshold Autism Spectrum Model . Clin Pract Epidemiol Ment Health [Internet ]. 2016 ; 12 : 120 – 31 . Available from : doi: 10.2174/1745017901612010120 OpenUrl CrossRef 2. ↵ Muratori F , Bizzari V . Autism as a Disruption of Affective Contact: The Forgotten Role of George Frankl . Clin Neuropsychiatry [Internet ]. 2019 ; 16 : 159 – 64 . Available from: https://www.ncbi.nlm.nih.gov/pubmed/34908951 OpenUrl 3. ↵ Website [Internet] . Available from: https://doi/book/10.1176/appi.books.9780890425596 4. ↵ Issac A , Halemani K , Shetty A , Thimmappa L , Vijay VR , Koni K , et al. The global prevalence of autism spectrum disorder in children: a systematic review and meta-analysis . Osong Public Health Res Perspect [Internet ]. 2025 ; 16 : 3 – 27 . Available from : doi: 10.24171/j.phrp.2024.0286 OpenUrl CrossRef 5. ↵ Chauhan A , Sahu JK , Jaiswal N , Kumar K , Agarwal A , Kaur J , et al. Prevalence of autism spectrum disorder in Indian children: A systematic review and meta-analysis . Neurol India [Internet ]. 2019 ; 67 : 100 – 4 . Available from : doi: 10.4103/0028-3886.253970 OpenUrl CrossRef PubMed 6. Nair MKC , Harikumaran Nair GS , Beena M , Princly P , Abhiram Chandran S , George B , et al. CDC Kerala 16: Early Detection of developmental delay/disability among children below 6 y--a district model . Indian J Pediatr [Internet ]. 2014 ; 81 Suppl 2 : S151 – 5 . Available from : doi: 10.1007/s12098-014-1589-y OpenUrl CrossRef 7. Raina SK , Kashyap V , Bhardwaj AK , Kumar D , Chander V . Prevalence of autism spectrum disorders among children (1-10 years of age) - findings of a mid-term report from Northwest India . J Postgrad Med [Internet ]. 2015 ; 61 : 243 – 6 . Available from : doi: 10.4103/0022-3859.166512 OpenUrl CrossRef 8. Poovathinal SA , Anitha A , Thomas R , Kaniamattam M , Melempatt N , Anilkumar A , et al. Prevalence of autism spectrum disorders in a semiurban community in south India . Ann Epidemiol [Internet ]. 2016 ; 26 : 663 – 5 .e8. Available from : doi: 10.1016/j.annepidem.2016.07.003 OpenUrl CrossRef 9. ↵ Rudra A , Belmonte MK , Soni PK , Banerjee S , Mukerji S , Chakrabarti B . Prevalence of autism spectrum disorder and autistic symptoms in a school-based cohort of children in Kolkata , India. Autism Res [Internet ]. 2017 ; 10 : 1597 – 605 . Available from : doi: 10.1002/aur.1812 OpenUrl CrossRef 10. ↵ Abrahams BS , Geschwind DH . Advances in autism genetics: on the threshold of a new neurobiology . Nat Rev Genet [Internet ]. 2008 ; 9 : 341 – 55 . Available from : doi: 10.1038/nrg2346 OpenUrl CrossRef PubMed Web of Science 11. ↵ Wang K , Gaitsch H , Poon H , Cox NJ , Rzhetsky A . Classification of common human diseases derived from shared genetic and environmental determinants . Nat Genet [Internet ]. 2017 ; 49 : 1319 – 25 . Available from : doi: 10.1038/ng.3931 OpenUrl CrossRef 12. ↵ Miles JH . Autism spectrum disorders--a genetics review . Genet Med [Internet ]. 2011 ; 13 : 278 – 94 . Available from : doi: 10.1097/GIM.0b013e3181ff67ba OpenUrl CrossRef PubMed 13. Geschwind DH . Genetics of autism spectrum disorders . Trends Cogn Sci [Internet ]. 2011 ; 15 : 409 – 16 . Available from : doi: 10.1016/j.tics.2011.07.003 OpenUrl CrossRef PubMed Web of Science 14. Lord C , Brugha TS , Charman T , Cusack J , Dumas G , Frazier T , et al. Autism spectrum disorder . Nat Rev Dis Primers [Internet ]. 2020 ; 6 : 5 . Available from : doi: 10.1038/s41572-019-0138-4 OpenUrl CrossRef PubMed 15. ↵ Viggiano M , Ceroni F , Visconti P , Posar A , Scaduto MC , Sandoni L , et al. Genomic analysis of 116 autism families strengthens known risk genes and highlights promising candidates . NPJ Genom Med [Internet ]. 2024 ; 9 : 21 . Available from : doi: 10.1038/s41525-024-00411-1 OpenUrl CrossRef 16. ↵ Arpi MNT , Simpson TI . SFARI genes and where to find them; modelling Autism Spectrum Disorder specific gene expression dysregulation with RNA-seq data . Sci Rep [Internet ]. 2022 ; 12 : 10158 . Available from : doi: 10.1038/s41598-022-14077-1 OpenUrl CrossRef PubMed 17. ↵ Rehm HL , Berg JS , Brooks LD , Bustamante CD , Evans JP , Landrum MJ , et al. ClinGen--the Clinical Genome Resource . N Engl J Med [Internet ]. 2015 ; 372 : 2235 – 42 . Available from : doi: 10.1056/NEJMsr1406261 OpenUrl CrossRef PubMed 18. ↵ Jain A , Bhoyar RC , Pandhare K , Mishra A , Sharma D , Imran M , et al. IndiGenomes: a comprehensive resource of genetic variants from over 1000 Indian genomes . Nucleic Acids Res [Internet ]. 2021 ; 49 : D1225 – 32 . Available from : doi: 10.1093/nar/gkaa923 OpenUrl CrossRef PubMed 19. ↵ REVEL: An Ensemble Method for Predicting the Pathogenicity of Rare Missense Variants . The American Journal of Human Genetics [Internet] . 2016 [cited 2025 Jul 15]; 99 : 877 – 85 . Available from : doi: 10.1016/j.ajhg.2016.08.016 OpenUrl CrossRef PubMed 20. ↵ Karczewski KJ , Francioli LC , Tiao G , Cummings BB , Alföldi J , Wang Q , et al. Author Correction: The mutational constraint spectrum quantified from variation in 141,456 humans . Nature [Internet ]. 2021 ; 590 : E53 . Available from : doi: 10.1038/s41586-020-03174-8 OpenUrl CrossRef 21. ↵ Richards S , Aziz N , Bale S , Bick D , Das S , Gastier-Foster J , et al. Standards and guidelines for the interpretation of sequence variants: a joint consensus recommendation of the American College of Medical Genetics and Genomics and the Association for Molecular Pathology . Genet Med [Internet ]. 2015 ; 17 : 405 – 24 . Available from : doi: 10.1038/gim.2015.30 OpenUrl CrossRef PubMed 22. ↵ Kumar M , Gaharwar U , Paul S , Poojary M , Pandhare K , Scaria V , et al. WilsonGen a comprehensive clinically annotated genomic variant resource for Wilson’s Disease . Sci Rep [Internet ]. 2020 ; 10 : 9037 . Available from : doi: 10.1038/s41598-020-66099-2 OpenUrl CrossRef 23. ↵ Kleinberger J , Maloney KA , Pollin TI , Jeng LJB . An openly available online tool for implementing the ACMG/AMP standards and guidelines for the interpretation of sequence variants . Genet Med [Internet ]. 2016 ; 18 : 1165 . Available from : doi: 10.1038/gim.2016.13 OpenUrl CrossRef PubMed 24. ↵ Yu TW , Chahrour MH , Coulter ME , Jiralerspong S , Okamura-Ikeda K , Ataman B , et al. Using whole-exome sequencing to identify inherited causes of autism . Neuron [Internet ]. 2013 ; 77 : 259 – 73 . Available from : doi: 10.1016/j.neuron.2012.11.002 OpenUrl CrossRef PubMed Web of Science 25. Tuand K , Stijnen P , Volders K , Declercq J , Nuytens K , Meulemans S , et al. Nuclear Localization of the Autism Candidate Gene Neurobeachin and Functional Interaction with the NOTCH1 Intracellular Domain Indicate a Role in Regulating Transcription . PLoS One [Internet ]. 2016 ; 11 : e0151954 . Available from : doi: 10.1371/journal.pone.0151954 OpenUrl CrossRef 26. Ka M , Kim W-Y . ANKRD11 associated with intellectual disability and autism regulates dendrite differentiation via the BDNF/TrkB signaling pathway . Neurobiol Dis [Internet ]. 2018 ; 111 : 138 – 52 . Available from : doi: 10.1016/j.nbd.2017.12.008 OpenUrl CrossRef PubMed 27. Stelten BML , Bonnot O , Huidekoper HH , van Spronsen FJ , van Hasselt PM , Kluijtmans LAJ , et al. Autism spectrum disorder: an early and frequent feature in cerebrotendinous xanthomatosis . J Inherit Metab Dis [Internet ]. 2018 ; 41 : 641 – 6 . Available from : doi: 10.1007/s10545-017-0086-7 OpenUrl CrossRef 28. ↵ Fyke W , Velinov M . and Autism, an Intriguing Connection Revisited . Genes (Basel) [Internet ]. 2021 ; 12 . Available from : doi: 10.3390/genes12081218 OpenUrl CrossRef PubMed 29. ↵ Earl RK , Turner TN , Mefford HC , Hudac CM , Gerdts J , Eichler EE , et al. Clinical phenotype of ASD-associated haploinsufficiency . Mol Autism [Internet ]. 2017 ; 8 : 54 . Available from : doi: 10.1186/s13229-017-0173-5 OpenUrl CrossRef PubMed 30. Yoon S , Penzes P . Roles of ANK2/ankyrin-B in neurodevelopmental disorders: Isoform functions and implications for autism spectrum disorder and epilepsy . Curr Opin Neurobiol [Internet ]. 2025 ; 90 : 102938 . Available from : doi: 10.1016/j.conb.2024.102938 OpenUrl CrossRef PubMed 31. Halgren C , Kjaergaard S , Bak M , Hansen C , El-Schich Z , Anderson CM , et al. Corpus callosum abnormalities, intellectual disability, speech impairment, and autism in patients with haploinsufficiency of ARID1B . Clin Genet [Internet ]. 2012 ; 82 : 248 – 55 . Available from : doi: 10.1111/j.1399-0004.2011.01755.x OpenUrl CrossRef PubMed 32. Brauer B , Merino-Veliz N , Ahumada-Marchant C , Arriagada G , Bustos FJ . KMT2C knockout generates ASD-like behaviors in mice . Front Cell Dev Biol [Internet ]. 2023 ; 11 : 1227723 . Available from : doi: 10.3389/fcell.2023.1227723 OpenUrl CrossRef PubMed 33. ↵ Kruszka P , Hu T , Hong S , Signer R , Cogné B , Isidor B , et al. Phenotype delineation of ZNF462 related syndrome . Am J Med Genet A [Internet ]. 2019 ; 179 : 2075 – 82 . Available from : doi: 10.1002/ajmg.a.61306 OpenUrl CrossRef PubMed 34. ↵ Satterstrom FK , Kosmicki JA , Wang J , Breen MS , De Rubeis S , An J-Y , et al. Large-Scale Exome Sequencing Study Implicates Both Developmental and Functional Changes in the Neurobiology of Autism . Cell [Internet ]. 2020 ; 180 : 568 – 84.e23 . Available from : doi: 10.1016/j.cell.2019.12.036 OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted August 19, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Genetic Spectrum of Autism Spectrum Disorder Associated Variants in the Indian Population: Insights from 1,029 IndiGenomes Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Genetic Spectrum of Autism Spectrum Disorder Associated Variants in the Indian Population: Insights from 1,029 IndiGenomes Mukesh Kumar , Treesa Issen , Mohammed Swalih , Srishti Sharma , Sheffali Gulati , Sridhar Sivasubbu , Vinod Scaria , BK Binukumar medRxiv 2025.08.14.25333641; doi: https://doi.org/10.1101/2025.08.14.25333641 Share This Article: Copy Citation Tools Genetic Spectrum of Autism Spectrum Disorder Associated Variants in the Indian Population: Insights from 1,029 IndiGenomes Mukesh Kumar , Treesa Issen , Mohammed Swalih , Srishti Sharma , Sheffali Gulati , Sridhar Sivasubbu , Vinod Scaria , BK Binukumar medRxiv 2025.08.14.25333641; doi: https://doi.org/10.1101/2025.08.14.25333641 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Epidemiology Subject Areas All Articles Addiction Medicine (569) Allergy and Immunology (863) Anesthesia (300) Cardiovascular Medicine (4442) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1511) Epidemiology (15230) Forensic Medicine (30) Gastroenterology (1126) Genetic and Genomic Medicine (6610) Geriatric Medicine (668) Health Economics (998) Health Informatics (4542) Health Policy (1370) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1266) Infectious Diseases (except HIV/AIDS) (15923) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (147) Nephrology (668) Neurology (6607) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1146) Occupational and Environmental Health (957) Oncology (3338) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (664) Pediatrics (1693) Pharmacology and Therapeutics (692) Primary Care Research (712) Psychiatry and Clinical Psychology (5448) Public and Global Health (9238) Radiology and Imaging (2202) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (596) Sexual and Reproductive Health (714) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a01d9566693058d3',t:'MTc3OTgwNjkzNg=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-05-23T02:00:01.238055+00:00
License: Public-Domain